"""
fastchat stanford alpaca data convert tools.

Reads a JSON list of Alpaca-style records (``instruction``, optional
``input``, ``output``) and writes a JSON list of two-turn
``human``/``gpt`` conversations.
"""

import argparse
import json
import pathlib

# Prompt from stanford alpaca's training script
PROMPT_DICT = {
    "prompt_input": (
        "Below is an instruction that describes a task, paired with an input that provides further context. "
        "Write a response that appropriately completes the request.\n\n"
        "### Instruction:\n{instruction}\n\n### Input:\n{input}\n\n### Response:"
    ),
    "prompt_no_input": (
        "Below is an instruction that describes a task. "
        "Write a response that appropriately completes the request.\n\n"
        "### Instruction:\n{instruction}\n\n### Response:"
    ),
}


def main(args_param):
    """Convert an Alpaca JSON file into conversation-format JSON.

    Args:
        args_param: Object exposing ``data_path`` (input JSON file holding a
            list of records) and ``output_path`` (file to write).

    Each record becomes ``{"id": "<1-based index>", "conversations": [...]}``
    where the human turn is the rendered prompt and the gpt turn is the
    record's ``output`` value.

    Raises:
        KeyError: If a record lacks ``instruction`` or ``output``.
    """
    data_path = pathlib.Path(args_param.data_path)
    # JSON is UTF-8 by specification; do not depend on the locale encoding.
    with data_path.open(encoding="utf-8") as f:
        data = json.load(f)

    prompt_input = PROMPT_DICT["prompt_input"]
    prompt_no_input = PROMPT_DICT["prompt_no_input"]

    new_data = []
    for cnt, example in enumerate(data, start=1):
        # A missing or empty "input" selects the instruction-only template.
        has_input = example.get("input", "") != ""
        template = prompt_input if has_input else prompt_no_input
        new_data.append(
            {
                "id": str(cnt),
                "conversations": [
                    {"from": "human", "value": template.format_map(example)},
                    {"from": "gpt", "value": example["output"]},
                ],
            }
        )

    # ensure_ascii=False emits raw non-ASCII characters, so the file must be
    # opened as UTF-8; the context manager guarantees the data is flushed.
    with open(args_param.output_path, "w", encoding="utf-8") as f:
        json.dump(new_data, f, ensure_ascii=False, indent=2)


if __name__ == "__main__":
    parser = argparse.ArgumentParser()
    parser.add_argument("--data_path", type=str, default="alpaca-data.json")
    parser.add_argument(
        "--output_path", type=str, default="alpaca-data-conversation.json"
    )
    args = parser.parse_args()
    main(args)
"b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\345\216\237\347\240\201/\346\225\260\346\215\256\351\233\206\345\244\204\347\220\206/llama_preprocess.py" @@ -0,0 +1,289 @@ +# Copyright 2023 Huawei Technologies Co., Ltd +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================ + +""" +transform wikitext-2, wikitext-103, lambada, openwebtext dataset to mindrecord. 
+""" +import argparse +import json +import os +import re +import numpy as np + +from mindspore.mindrecord import FileWriter +from mindformers.dataset.dataloader.training_dataloader import TrainingDataset +from mindformers.models.llama.llama_tokenizer import LlamaTokenizer + +from conversation import get_default_conv_template + +IGNORE_TOKEN_ID = -100 + + +def chunks(lst, n): + """ yield n sized chunks from list""" + for i in range(0, len(lst), n): + yield lst[i:i+n] + + +def package_file(it, n): + """ package multiple files""" + stop = False + while not stop: + batch = [] + for _ in range(n): + try: + batch.append(next(it)) + except StopIteration: + stop = True + if not batch: + break + yield batch + + +def clean_wikitext(string): + """ cleaning wikitext dataset""" + # contractions + string = string.replace("s '", "s'") + string = re.sub(r"/' [0-9]/", r"/'[0-9]/", string) + # number separators + string = string.replace(" @-@ ", "-") + string = string.replace(" @,@ ", ",") + string = string.replace(" @.@ ", ".") + # punctuation + string = string.replace(" : ", ": ") + string = string.replace(" ; ", "; ") + string = string.replace(" . ", ". ") + string = string.replace(" ! ", "! ") + string = string.replace(" ? ", "? 
") + string = string.replace(" , ", ", ") + # double brackets + string = re.sub(r"\(\s*([^\)]*?)\s*\)", r"(\1)", string) + string = re.sub(r"\[\s*([^\]]*?)\s*\]", r"[\1]", string) + string = re.sub(r"{\s*([^}]*?)\s*}", r"{\1}", string) + string = re.sub(r"\"\s*([^\"]*?)\s*\"", r'"\1"', string) + string = re.sub(r"'\s*([^']*?)\s*'", r"'\1'", string) + # miscellaneous + string = string.replace("= = = =", "====") + string = string.replace("= = =", "===") + string = string.replace("= =", "==") + string = string.replace(" "+chr(176)+" ", chr(176)) + string = string.replace(" \n", "\n") + string = string.replace("\n ", "\n") + string = string.replace(" N ", " 1 ") + string = string.replace(" 's", "'s") + return string + + +def preprocess(sources, tokenizer, seq_length): + """conversation preprocess.""" + conv = get_default_conv_template("vicuna").copy() + roles = {"human": conv.roles[0], "gpt": conv.roles[1]} + + # Apply prompt templates + conversations = [] + for i, source in enumerate(sources): + if roles[source[0]["from"]] != conv.roles[0]: + # Skip the first one if it is not from human + source = source[1:] + + conv.messages = [] + for j, sentence in enumerate(source): + role = roles[sentence["from"]] + assert role == conv.roles[j % 2], f"{i}" + conv.append_message(role, sentence["value"]) + conversations.append(conv.get_prompt()) + + sep = conv.sep + conv.roles[1] + ": " + # Tokenize conversations + input_ids = [] + targets = [] + # attention_mask = [] + for conversation in conversations: + rounds = conversation.split(conv.sep2) + ids = [tokenizer.bos_token_id] + mask = [1] + for i, rou in enumerate(rounds): + if rou == "": + break + conv_out = tokenizer(rou) + ids.extend(conv_out['input_ids'][1:]) + mask.extend(conv_out['attention_mask'][1:]) + d = {'input_ids': ids, 'attention_mask': mask} + # pylint: disable=W0212 + d = tokenizer._pad(d, max_length=seq_length, padding_strategy='max_length') + input_ids.append(d['input_ids'][:seq_length]) + # 
attention_mask.append(d['attention_mask']) + + target = np.array(d['input_ids']) + total_len = int(np.not_equal(target, tokenizer.pad_token_id).sum()) + cur_len = 1 + target[:cur_len] = IGNORE_TOKEN_ID + for i, rou in enumerate(rounds): + if rou == "": + break + parts = rou.split(sep) + if len(parts) != 2: + break + parts[0] += sep + round_len = len(tokenizer(rou)['input_ids']) - 1 + instruction_len = len(tokenizer(parts[0])['input_ids']) - 3 + + target[cur_len : cur_len + instruction_len] = IGNORE_TOKEN_ID + + cur_len += round_len + target[cur_len:] = IGNORE_TOKEN_ID + + if cur_len < seq_length: + if cur_len != total_len: + target[:] = IGNORE_TOKEN_ID + else: + target = target[:seq_length] + targets.append(target.tolist()) + + input_ids = np.array(input_ids, dtype=np.int32) + targets = np.array(targets, dtype=np.int32) + + return dict( + input_ids=input_ids, + labels=targets, + ) + + +class SupervisedDataset: + """Dataset for supervised fine-tuning.""" + + def __init__(self, raw_data, tokenizer, seq_length): + super(SupervisedDataset, self).__init__() + + sources = [example["conversations"] for example in raw_data] + data_dict = preprocess(sources, tokenizer, seq_length) + + self.input_ids = data_dict["input_ids"] + self.labels = data_dict["labels"] + + def __len__(self): + return len(self.input_ids) + + def __getitem__(self, i): + return dict( + input_ids=self.input_ids[i], + labels=self.labels[i] + ) + + +def tokenize_wiki(tokenizer, file_path, seq_length, repeat): + """tokenize wikitext-2/wikitext-103 dataset""" + content = [] + with open(file_path, 'r', encoding='utf-8') as f: + for para in clean_wikitext(f.read()).split("\n\n"): + if para and para.strip().startswith('=') is False: + content += tokenizer(para)['input_ids'] + content_out = [] + for _ in range(repeat): + content_out.extend(content) + content = content_out + for chunk in chunks(content, seq_length): + sample = {} + if len(chunk) == seq_length: + sample['input_ids'] = np.array(chunk, 
dtype=np.int32) + yield sample + + +def tokenize_wikipedia(tokenizer, dataset_dir, seq_length, samples_num): + """tokenize wikipedia dataset with parquet format""" + dataset = TrainingDataset(dataset_dir=dataset_dir, + column_names=["input_ids"], + max_length=seq_length, + file_format="parquet", + tokenizer=tokenizer, + is_align=True, + samples_num=samples_num, + shuffle=False) + for data in dataset: + input_id_list = data[0] + if len(input_id_list) == seq_length: + sample = { + 'input_ids': np.array(input_id_list, dtype=np.int32) + } + yield sample + + +def tokenize_qa(tokenizer, file_path, seq_length): + raw_data = json.load(open(file_path, "r")) + dataset_cls = SupervisedDataset(raw_data, tokenizer, seq_length) + for i in range(len(dataset_cls)): + yield dataset_cls[i] + + +if __name__ == '__main__': + parser = argparse.ArgumentParser() + parser.add_argument('--dataset_type', type=str, default='wiki') + parser.add_argument('--input_glob', type=str, default='/mnt/luolan/wikitext-2/wiki.train.tokens') + parser.add_argument('--output_file', type=str, default='./dataset/wiki2048/wiki2048') + parser.add_argument('--tokenizer', type=str, default='llama', choices=['llama']) + parser.add_argument('--model_file', type=str, default='/mnt/luolan/llama/tokenizer.model') + parser.add_argument('--file_partition', type=int, default=1) + parser.add_argument('--repeat', type=int, default=1) + parser.add_argument('--samples_num', type=int, default=10000) + parser.add_argument('--seq_length', type=int, default=2048) + args = parser.parse_args() + + out_dir, out_file = os.path.split(os.path.abspath(args.output_file)) + if not os.path.exists(out_dir): + os.mkdir(out_dir) + if args.dataset_type == 'wiki': + schema = {'input_ids': {"type": "int32", "shape": [-1]},} + if args.dataset_type == 'wikipedia': + schema = {'input_ids': {"type": "int32", "shape": [-1]},} + elif args.dataset_type == 'qa': + schema = {'input_ids': {"type": "int32", "shape": [-1]}, 'labels': {"type": "int32", 
"shape": [-1]}} + writer = FileWriter(file_name=args.output_file, + shard_num=args.file_partition) + writer.add_schema(schema, args.dataset_type) + + # Start to load tokenizer + if not os.path.exists(args.model_file): + raise FileNotFoundError(f"file {args.model_file} do not exists.") + + transforms_count = 0 + word_tokenizer = LlamaTokenizer(vocab_file=args.model_file) + if hasattr(word_tokenizer, 'add_bos_token'): + word_tokenizer.add_bos_token = True + if hasattr(word_tokenizer, 'add_eos_token'): + word_tokenizer.add_eos_token = True + if args.dataset_type == 'wiki': + for x in tokenize_wiki(word_tokenizer, args.input_glob, args.seq_length + 1, args.repeat): + transforms_count += 1 + writer.write_raw_data([x]) + print("Transformed {} records.".format(transforms_count)) + elif args.dataset_type == 'wikipedia': + for x in tokenize_wikipedia(word_tokenizer, args.input_glob, args.seq_length + 1, samples_num=args.samples_num): + transforms_count += 1 + writer.write_raw_data([x]) + print("Transformed {} records.".format(transforms_count)) + elif args.dataset_type == 'qa': + for x in tokenize_qa(word_tokenizer, args.input_glob, args.seq_length + 1): + transforms_count += 1 + writer.write_raw_data([x]) + print("Transformed {} records.".format(transforms_count)) + else: + raise ValueError( + "Not support dataset type: {}".format(args.dataset_type)) + + writer.commit() + out_file = args.output_file + if args.file_partition > 1: + out_file += '0' + print("Transform finished, output files refer: {}".format(out_file)) diff --git "a/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\345\216\237\347\240\201/\346\235\203\351\207\215\345\220\210\345\271\266/transform_ckpt.py" 
"b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\345\216\237\347\240\201/\346\235\203\351\207\215\345\220\210\345\271\266/transform_ckpt.py" new file mode 100644 index 00000000..67910821 --- /dev/null +++ "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\345\216\237\347\240\201/\346\235\203\351\207\215\345\220\210\345\271\266/transform_ckpt.py" @@ -0,0 +1,89 @@ +# Copyright 2023 Huawei Technologies Co., Ltd +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. +# You may obtain a copy of the License at +# +# http://www.apache.org/licenses/LICENSE-2.0 +# +# Unless required by applicable law or agreed to in writing, software +# distributed under the License is distributed on an "AS IS" BASIS, +# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. +# See the License for the specific language governing permissions and +# limitations under the License. +# ============================================================================ +"""transform ckpt""" +import os +import argparse + +import mindspore as ms + +def get_strategy(startegy_path, rank_id=None): + """Merge strategy if strategy path is dir + + Args: + startegy_path (str): The path of stategy. + rank_id (int): The rank id of device. + + Returns: + None or strategy path + """ + if not startegy_path or startegy_path == "None": + return None + + assert os.path.exists(startegy_path), f'{startegy_path} not found!' 
+ + if os.path.isfile(startegy_path): + return startegy_path + + if os.path.isdir(startegy_path): + if rank_id: + merge_path = os.path.join(startegy_path, f'merged_ckpt_strategy_{rank_id}.ckpt') + else: + merge_path = os.path.join(startegy_path, f'merged_ckpt_strategy.ckpt') + + if os.path.exists(merge_path): + os.remove(merge_path) + + ms.merge_pipeline_strategys(startegy_path, merge_path) + return merge_path + + return None + +if __name__ == '__main__': + parser = argparse.ArgumentParser() + parser.add_argument('--src_ckpt_strategy', + default="", + help='path of src ckpt strategy') + parser.add_argument('--dst_ckpt_strategy', + default="", + help='path of dst ckpt strategy') + parser.add_argument('--src_ckpt_dir', + default="", + type=str, + help='path of src ckpt') + parser.add_argument('--dst_ckpt_dir', + default="", + type=str, + help='path where to save dst ckpt') + parser.add_argument('--prefix', + default='checkpoint_', + type=str, + help='prefix of transformed checkpoint') + args = parser.parse_args() + + src_ckpt_strategy = get_strategy(args.src_ckpt_strategy) + dst_ckpt_strategy = get_strategy(args.dst_ckpt_strategy) + src_ckpt_dir = args.src_ckpt_dir + dst_ckpt_dir = args.dst_ckpt_dir + prefix = args.prefix + + print(f"src_ckpt_strategy: {src_ckpt_strategy}") + print(f"dst_ckpt_strategy: {dst_ckpt_strategy}") + print(f"src_ckpt_dir: {src_ckpt_dir}") + print(f"dst_ckpt_dir: {dst_ckpt_dir}") + print(f"prefix: {prefix}") + + print("......Start transform......") + ms.transform_checkpoints(src_ckpt_dir, dst_ckpt_dir, prefix, src_ckpt_strategy, dst_ckpt_strategy) + print("......Transform succeed!......") diff --git "a/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\345\216\237\347\240\201/\346\250\241\345\236\213\350\257\204\344\274\260/run_llama3_8b_8k_800T_A2_64G_lora_256_base_eval.yaml" 
"b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\345\216\237\347\240\201/\346\250\241\345\236\213\350\257\204\344\274\260/run_llama3_8b_8k_800T_A2_64G_lora_256_base_eval.yaml" new file mode 100644 index 00000000..fa378e99 --- /dev/null +++ "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\345\216\237\347\240\201/\346\250\241\345\236\213\350\257\204\344\274\260/run_llama3_8b_8k_800T_A2_64G_lora_256_base_eval.yaml" @@ -0,0 +1,218 @@ +seed: 0 +output_dir: './output' # path to save checkpoint/strategy +load_checkpoint: '/home/ma-user/work/topic3/new_llama3_8b_lora.ckpt' +src_strategy_path_or_dir: '' +auto_trans_ckpt: False # If true, auto transform load_checkpoint to load in distributed model +only_save_strategy: False +resume_training: False +run_mode: 'finetune' + +# trainer config +trainer: + type: CausalLanguageModelingTrainer + model_name: 'llama3_8b' + +# runner config +runner_config: + epochs: 5 + batch_size: 16 + sink_mode: True + sink_size: 2 + +# optimizer +optimizer: + type: FP32StateAdamWeightDecay + beta1: 0.9 + beta2: 0.95 + eps: 1.e-8 + +# lr sechdule +lr_schedule: + type: CosineWithWarmUpLR + learning_rate: 1.e-5 + lr_end: 0.0 + warmup_ratio: 0.03 + total_steps: -1 # -1 means it will load the total steps of the dataset + +# dataset +train_dataset: &train_dataset + data_loader: + type: MindDataset + dataset_dir: "" + shuffle: True + input_columns: ["input_ids", "labels"] # "input_ids", "labels" , labels are used in instruction finetune. + num_parallel_workers: 8 + python_multiprocessing: False + drop_remainder: True + batch_size: 16 + repeat: 1 + numa_enable: False + prefetch_size: 1 +train_dataset_task: + type: CausalLanguageModelDataset + dataset_config: *train_dataset +# if True, do evaluate during the training process. if false, do nothing. 
+# note that the task trainer should support _evaluate_in_training function. +do_eval: False + +# eval dataset +eval_dataset: &eval_dataset + data_loader: + type: MindDataset + dataset_dir: "" + shuffle: False + input_columns: ["input_ids", "labels"] + num_parallel_workers: 8 + python_multiprocessing: False + drop_remainder: False + repeat: 1 + numa_enable: False + prefetch_size: 1 +eval_dataset_task: + type: CausalLanguageModelDataset + dataset_config: *eval_dataset + +use_parallel: False +# parallel context config +parallel: + parallel_mode: 1 # 0-data parallel, 1-semi-auto parallel, 2-auto parallel, 3-hybrid parallel + gradients_mean: False + enable_alltoall: False + full_batch: True + search_mode: "sharding_propagation" + enable_parallel_optimizer: True + strategy_ckpt_config: + save_file: "./ckpt_strategy.ckpt" + only_trainable_params: False + parallel_optimizer_config: + gradient_accumulation_shard: False + parallel_optimizer_threshold: 64 +# default parallel of device num = 8 for Atlas 800T A2 +parallel_config: + data_parallel: 1 + model_parallel: 4 + pipeline_stage: 1 + use_seq_parallel: False + micro_batch_num: 1 + vocab_emb_dp: True + gradient_aggregation_group: 4 +# when model parallel is greater than 1, we can set micro_batch_interleave_num=2, that may accelerate the train process. 
+micro_batch_interleave_num: 1 + +# recompute config +recompute_config: + recompute: True + select_recompute: False + parallel_optimizer_comm_recompute: False + mp_comm_recompute: True + recompute_slice_activation: True + +# callbacks +callbacks: + - type: MFLossMonitor + - type: CheckpointMointor + prefix: "llama3_8b" + save_checkpoint_steps: 1400 + integrated_save: False + async_save: False + - type: ObsMonitor + +# mindspore context init config +context: + mode: 0 #0--Graph Mode; 1--Pynative Mode + device_target: "Ascend" + enable_graph_kernel: False + graph_kernel_flags: "--disable_expand_ops=Softmax,Dropout --enable_parallel_fusion=true --reduce_fuse_depth=8 --enable_auto_tensor_inplace=true" + max_call_depth: 10000 + max_device_memory: "28GB" + save_graphs: False + save_graphs_path: "./graph" + device_id: 0 + runtime_num_threads: 1 + +# model config +model: + model_config: + type: LlamaConfig + batch_size: 16 # add for increase predict + seq_length: 8192 + hidden_size: 4096 + num_layers: 32 + num_heads: 32 + n_kv_heads: 8 + vocab_size: 128256 + intermediate_size: 14336 + rms_norm_eps: 1.0e-5 + bos_token_id: 128000 + eos_token_id: 128001 + pad_token_id: 128002 + ignore_token_id: -100 + compute_dtype: "float16" + layernorm_compute_type: "float32" + softmax_compute_type: "float32" + rotary_dtype: "float32" + param_init_type: "float16" + use_past: True + scaling_factor: 1.0 + theta: 500000 + extend_method: "None" # support "None", "PI", "NTK" + use_flash_attention: True # FA can accelerate training or finetune + block_size: 64 + offset: 0 + fine_grain_interleave: 1 + checkpoint_name_or_path: "/home/ma-user/work/ms_ckpt/llama3-8B.ckpt" + repetition_penalty: 1 + max_decode_length: 700 + max_new_tokens: 20 + top_k: 3 + top_p: 1 + do_sample: False + is_dynamic: False + pet_config: + pet_type: lora + # configuration of lora + lora_rank: 8 + lora_alpha: 16 + lora_dropout: 0.0 + target_modules: '.*wq|.*wv' + arch: + type: LlamaForCausalLM + +processor: + return_tensors: 
ms + tokenizer: + model_max_length: 8192 + vocab_file: "/home/ma-user/work/tokenizer.model" + pad_token: "<|reserved_special_token_0|>" + type: Llama3Tokenizer + type: LlamaProcessor + +# metric +metric: + type: EmF1Metric + +# wrapper cell config +runner_wrapper: + type: MFTrainOneStepCell + scale_sense: 1.0 + use_clip_grad: True + +eval_callbacks: + - type: ObsMonitor + +auto_tune: False +filepath_prefix: './autotune' +autotune_per_step: 10 + +profile: False +profile_start_step: 4 +profile_stop_step: 8 +init_start_profile: False +profile_communication: False +profile_memory: True +layer_scale: False +layer_decay: 0.65 +lr_scale_factor: 256 + +# aicc +remote_save_url: "Please input obs url on AICC platform." diff --git "a/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\345\216\237\347\240\201/\346\250\241\345\236\213\350\257\204\344\274\260/squad_data_process.py" "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\345\216\237\347\240\201/\346\250\241\345\236\213\350\257\204\344\274\260/squad_data_process.py" new file mode 100644 index 00000000..b184e17b --- /dev/null +++ "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\345\216\237\347\240\201/\346\250\241\345\236\213\350\257\204\344\274\260/squad_data_process.py" @@ -0,0 +1,148 @@ +# Copyright 2023 Huawei Technologies Co., Ltd +# +# Licensed under the Apache License, Version 2.0 (the "License"); +# you may not use this file except in compliance with the License. 
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
# ============================================================================
"""Data process for SQuAD Dataset"""
import argparse
import json
import collections
import copy
import logging
import pathlib

import numpy as np
from mindspore.mindrecord import FileWriter
from mindformers import AutoTokenizer

IGNORE_TOKEN_ID = -100


def write_instance_to_file(writer, instance):
    """Write one instance to ``writer`` and return the written features.

    Args:
        writer: Object exposing ``write_raw_data``.
        instance: Mapping with ``input_ids`` and ``labels``.

    Returns:
        OrderedDict with ``input_ids`` and ``labels`` as int32 arrays.
    """
    input_ids = instance["input_ids"]
    label = instance["labels"]

    features = collections.OrderedDict()
    features["input_ids"] = np.asarray(input_ids).astype(np.int32)
    features["labels"] = np.asarray(label).astype(np.int32)

    writer.write_raw_data([features])
    return features


def _load_qa_pairs(input_path):
    """Return (prompts, answers) built from the first QA of each paragraph."""
    # JSON is UTF-8 by specification; do not depend on the locale encoding.
    with pathlib.Path(input_path).open(encoding="utf-8") as f:
        file = json.load(f)

    sources = []
    targets = []
    skipped = 0
    for data in file["data"]:
        for paragraph in data["paragraphs"]:
            qas = paragraph["qas"]
            # Paragraphs without a question or without an answer cannot form
            # a training pair; skip them instead of raising IndexError.
            if not qas or not qas[0]["answers"]:
                skipped += 1
                continue
            passage = paragraph["context"]
            query = qas[0]["question"]
            answer = qas[0]["answers"][0]["text"]

            input_str = f"Read the passage and answer the question below.\n\n### Instruction:\n{passage}\n\n### Input:\n{query}\n\n### Response:"
            sources.append(input_str)
            targets.append(answer)
    if skipped:
        logging.warning("Skipped %d paragraphs without a question/answer", skipped)
    return sources, targets


def _fit_length(token_ids, length, pad_id):
    """Clip ``token_ids`` to ``length`` entries and right-pad with ``pad_id``."""
    ids = np.asarray(token_ids)[:length]
    return np.pad(ids, (0, length - len(ids)), 'constant',
                  constant_values=(pad_id, pad_id))


def _build_eval_instance(tokenizer, prompt, answer, max_length):
    """Encode prompt and answer separately, each as a (1, max_length) row."""
    pad_id = tokenizer.pad_token_id
    input_ids = _fit_length(tokenizer.encode(prompt, add_special_tokens=True), max_length, pad_id)
    # Over-long answers are clipped; a negative pad width would make np.pad fail.
    label_id = _fit_length(tokenizer.encode(answer, add_special_tokens=False), max_length, pad_id)
    return {"input_ids": input_ids.reshape(1, -1), "labels": label_id.reshape(1, -1)}


def _build_train_instance(tokenizer, prompt, answer, max_length):
    """Encode prompt+answer as one row of max_length + 1 ids with masked labels."""
    total_length = max_length + 1
    concated_qa = prompt + answer
    # Clip over-long samples so the pad width below can never be negative.
    input_ids = np.asarray(tokenizer.encode(concated_qa, add_special_tokens=True))[:total_length]
    prompt_length = len(tokenizer.encode(prompt, add_special_tokens=False))
    concat_length = len(input_ids)

    input_ids_new = _fit_length(input_ids, total_length, tokenizer.pad_token_id)
    label_id_new = copy.deepcopy(input_ids_new)
    label_id_new[:prompt_length] = IGNORE_TOKEN_ID
    # Index from the front: with zero padding a "[-0:]" slice would select
    # and mask the whole row.
    label_id_new[concat_length:] = IGNORE_TOKEN_ID
    return {"input_ids": input_ids_new, "labels": label_id_new}


def main():
    """Convert a SQuAD JSON file into a MindRecord file for train or eval."""
    parser = argparse.ArgumentParser()
    parser.add_argument("--input_file", type=str, default="./squad/train-v1.1.json", required=False,
                        help='Input raw json file. ')
    parser.add_argument("--output_file", type=str, default="./squad/recode_train.mindrecord", required=False,
                        help='Output MindRecord file. ')
    parser.add_argument("--mode", type=str, default="train",
                        help='Set Data for train or eval.')
    parser.add_argument("--max_length", type=int, default=2048, help='Maximum sequence length. ')
    parser.add_argument("--tokenizer_type", type=str, default="llama_7b",
                        help="Tokenizer type, can be set to any tokenizer "
                             "if its relevant model supports prompt text classification. ")

    args = parser.parse_args()

    # Reject an unknown mode before any output file is created.
    if args.mode not in ("train", "eval"):
        logging.error("No mode named %s, please set mode as train/eval.", args.mode)
        return

    logging.info("***** Reading from input files *****")
    logging.info("Input File: %s", args.input_file)

    tokenizer = AutoTokenizer.from_pretrained(args.tokenizer_type)
    sources, targets = _load_qa_pairs(args.input_file)

    logging.info("***** Writing to output files *****")
    logging.info("Output File: %s", args.output_file)

    writer = FileWriter(args.output_file, 1)
    data_schema = {"input_ids": {"type": "int32", "shape": [-1]},
                   "labels": {"type": "int32", "shape": [-1]}
                   }
    writer.add_schema(data_schema, "lm-schema")

    is_train = args.mode == "train"
    if hasattr(tokenizer, 'add_bos_token'):
        tokenizer.add_bos_token = True
    if hasattr(tokenizer, 'add_eos_token'):
        # EOS is appended for train/finetune data only.
        tokenizer.add_eos_token = is_train
    build_instance = _build_train_instance if is_train else _build_eval_instance

    total_written = 0
    for prompt, answer in zip(sources, targets):
        total_written += 1
        instance = build_instance(tokenizer, prompt, answer, args.max_length)
        write_instance_to_file(writer, instance=instance)

    writer.commit()
    logging.info("Wrote %d total instances", total_written)


if __name__ == "__main__":
    logging.basicConfig(level=logging.INFO)
    main()
"b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\345\216\237\347\240\201/\351\205\215\347\275\256\346\226\207\344\273\266/config.yaml" @@ -0,0 +1,206 @@ +seed: 0 +output_dir: './output' # path to save checkpoint/strategy +load_checkpoint: '/home/ma-user/work/llama3-8B.ckpt' +src_strategy_path_or_dir: '' +auto_trans_ckpt: False # If true, auto transform load_checkpoint to load in distributed model +only_save_strategy: False +resume_training: False +run_mode: 'finetune' + +# trainer config +trainer: + type: CausalLanguageModelingTrainer + model_name: 'llama3_8b' + +# runner config +runner_config: + epochs: 10 + batch_size: 32 + sink_mode: True + sink_size: 2 + +# optimizer +optimizer: + type: FP32StateAdamWeightDecay + beta1: 0.9 + beta2: 0.95 + eps: 1.e-8 + +# lr sechdule +lr_schedule: + type: CosineWithWarmUpLR + learning_rate: 3.e-5 + lr_end: 1.e-6 + warmup_ratio: 0.1 + total_steps: -1 # -1 means it will load the total steps of the dataset + +# dataset +train_dataset: &train_dataset + data_loader: + type: MindDataset + dataset_dir: "/home/ma-user/work/train-fastchat256-mindrecore.mindrecord" + shuffle: True + input_columns: ["input_ids", "labels"] # "input_ids", "labels" , labels are used in instruction finetune. + num_parallel_workers: 8 + python_multiprocessing: False + drop_remainder: True + batch_size: 1 + repeat: 1 + numa_enable: False + prefetch_size: 1 +train_dataset_task: + type: CausalLanguageModelDataset + dataset_config: *train_dataset +# if True, do evaluate during the training process. if false, do nothing. +# note that the task trainer should support _evaluate_in_training function. 
+do_eval: False + +# eval dataset +eval_dataset: &eval_dataset + data_loader: + type: MindDataset + dataset_dir: "" + shuffle: False + input_columns: ["input_ids"] + num_parallel_workers: 8 + python_multiprocessing: False + drop_remainder: False + repeat: 1 + numa_enable: False + prefetch_size: 1 +eval_dataset_task: + type: CausalLanguageModelDataset + dataset_config: *eval_dataset + +use_parallel: True +# parallel context config +parallel: + parallel_mode: 1 # 0-data parallel, 1-semi-auto parallel, 2-auto parallel, 3-hybrid parallel + gradients_mean: False + enable_alltoall: False + full_batch: True + search_mode: "sharding_propagation" + enable_parallel_optimizer: True + strategy_ckpt_config: + save_file: "./ckpt_strategy.ckpt" + only_trainable_params: False + parallel_optimizer_config: + gradient_accumulation_shard: False + parallel_optimizer_threshold: 64 +# default parallel of device num = 8 for Atlas 800T A2 +parallel_config: + data_parallel: 1 + model_parallel: 4 + pipeline_stage: 1 + use_seq_parallel: False + micro_batch_num: 1 + vocab_emb_dp: True + gradient_aggregation_group: 4 +# when model parallel is greater than 1, we can set micro_batch_interleave_num=2, that may accelerate the train process. 
+micro_batch_interleave_num: 1 + +# recompute config +recompute_config: + recompute: True + select_recompute: False + parallel_optimizer_comm_recompute: False + mp_comm_recompute: True + recompute_slice_activation: True + +# callbacks +callbacks: + - type: MFLossMonitor + - type: CheckpointMointor + prefix: "llama3_8b" + save_checkpoint_steps: 1400 + integrated_save: False + async_save: False + - type: ObsMonitor + +# mindspore context init config +context: + mode: 0 #0--Graph Mode; 1--Pynative Mode + device_target: "Ascend" + enable_graph_kernel: False + graph_kernel_flags: "--disable_expand_ops=Softmax,Dropout --enable_parallel_fusion=true --reduce_fuse_depth=8 --enable_auto_tensor_inplace=true" + max_call_depth: 10000 + max_device_memory: "26GB" + save_graphs: False + save_graphs_path: "./graph" + device_id: 0 + runtime_num_threads: 1 + +# model config +model: + model_config: + type: LlamaConfig + batch_size: 1 # add for increase predict + seq_length: 256 + hidden_size: 4096 + num_layers: 32 + num_heads: 32 + n_kv_heads: 8 + vocab_size: 128256 + intermediate_size: 14336 + rms_norm_eps: 1.0e-5 + bos_token_id: 128000 + eos_token_id: 128001 + pad_token_id: 128002 + ignore_token_id: -100 + compute_dtype: "bfloat16" + layernorm_compute_type: "float32" + softmax_compute_type: "float32" + rotary_dtype: "float32" + param_init_type: "bfloat16" + use_past: False + scaling_factor: 1.0 + theta: 500000 + extend_method: "None" # support "None", "PI", "NTK" + use_flash_attention: True # FA can accelerate training or finetune + offset: 0 + fine_grain_interleave: 1 + checkpoint_name_or_path: "/home/ma-user/work/ms_ckpt/llama3-8B.ckpt" + repetition_penalty: 1 + max_decode_length: 512 + top_k: 3 + top_p: 1 + do_sample: False + pet_config: + pet_type: lora + # configuration of lora + lora_rank: 8 + lora_alpha: 16 + lora_dropout: 0.05 + target_modules: '.*wq|.*wv' + arch: + type: LlamaForCausalLM + +# metric +metric: + type: PerplexityMetric + +# wrapper cell config +runner_wrapper: 
+ type: MFTrainOneStepCell + scale_sense: 1.0 + use_clip_grad: True + +eval_callbacks: + - type: ObsMonitor + +auto_tune: False +filepath_prefix: './autotune' +autotune_per_step: 10 + +profile: False +profile_start_step: 4 +profile_stop_step: 8 +init_start_profile: False +profile_communication: False +profile_memory: True +layer_scale: False +layer_decay: 0.65 +lr_scale_factor: 256 + +# aicc +remote_save_url: "Please input obs url on AICC platform." diff --git "a/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\346\227\245\345\277\227\346\226\207\344\273\266/scheduler.log" "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\346\227\245\345\277\227\346\226\207\344\273\266/scheduler.log" new file mode 100644 index 00000000..a635bcb6 --- /dev/null +++ "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\346\227\245\345\277\227\346\226\207\344\273\266/scheduler.log" @@ -0,0 +1,10230 @@ +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. + return self._float_to_str(self.smallest_subnormal) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. 
+ return self._float_to_str(self.smallest_subnormal) +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:09:19.321.051 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:194] BuildCluster] Topology build timed out., retry(1/200). +[WARNING] DISTRIBUTED(62168,fffd8a5bf1e0,python):2024-07-25-18:09:20.322.686 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:227] ProcessRegister] The new node: 0(role: MS_WORKER), rank id: 0 is registered successfully. +[WARNING] DISTRIBUTED(62168,fffd8a5bf1e0,python):2024-07-25-18:09:20.560.935 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:227] ProcessRegister] The new node: 3(role: MS_WORKER), rank id: 3 is registered successfully. +[WARNING] DISTRIBUTED(62168,fffd8a5bf1e0,python):2024-07-25-18:09:20.659.475 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:227] ProcessRegister] The new node: 1(role: MS_WORKER), rank id: 1 is registered successfully. +[WARNING] DISTRIBUTED(62168,fffd8a5bf1e0,python):2024-07-25-18:09:21.409.278 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:227] ProcessRegister] The new node: 2(role: MS_WORKER), rank id: 2 is registered successfully. +[WARNING] DISTRIBUTED(62168,fffd8a5bf1e0,python):2024-07-25-18:09:21.409.344 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:666] ReassignNodeRank] Rank ids are already set by numeric node ids, and this is not CM initialization. No need to reassign them. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:09:22.321.226 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:196] BuildCluster] Cluster is successfully initialized. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:09:22.321.316 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:09:22.321.332 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:09:27.321.482 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:09:27.321.547 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:09:32.321.692 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:09:32.321.775 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:09:37.321.917 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:09:37.322.040 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:09:42.322.184 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:09:42.322.268 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:09:47.322.414 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:09:47.322.500 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:09:52.322.655 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:09:52.322.715 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:09:57.322.870 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:09:57.322.961 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:02.323.100 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:02.323.181 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:07.323.344 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:07.323.939 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:12.324.092 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:12.324.175 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:17.324.331 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:17.324.426 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:22.324.601 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:22.324.682 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:27.324.846 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:27.324.909 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:32.325.071 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:32.325.147 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:37.325.308 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:37.325.377 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:42.325.530 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:42.325.631 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:47.325.781 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:47.325.866 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:52.326.025 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:52.326.112 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:57.326.259 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:10:57.326.326 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:02.326.483 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:02.326.588 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:07.326.734 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:07.326.809 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:12.326.968 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:12.327.073 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:17.327.231 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:17.327.310 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:22.327.474 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:22.327.553 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:27.327.698 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:27.327.757 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:32.327.909 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:32.328.002 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:37.328.151 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:37.328.275 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:42.328.434 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:42.328.513 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:47.328.698 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:47.328.772 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:52.328.922 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:52.329.007 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:57.329.170 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:11:57.329.294 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:02.329.449 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:02.329.560 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:07.329.711 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:07.329.805 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:12.329.964 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:12.330.068 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:17.330.235 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:17.330.345 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:22.333.343 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:22.333.428 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:27.333.605 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:27.333.693 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:32.333.845 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:32.333.906 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:37.334.062 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:37.334.148 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:42.334.283 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:42.334.335 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:47.334.478 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:47.334.552 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:52.334.684 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:52.334.737 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:57.334.879 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:12:57.334.942 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:02.335.094 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:02.335.164 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:07.335.312 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:07.335.436 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:12.335.591 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:12.335.694 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:17.335.862 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:17.335.942 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:22.336.107 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:22.336.185 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:27.336.349 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:27.336.434 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:32.336.598 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:32.336.668 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:37.336.831 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:37.336.897 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:42.337.061 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:42.337.129 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:47.337.306 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:47.337.384 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:52.337.587 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:52.337.665 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:57.337.820 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:13:57.337.891 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:02.338.051 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:02.338.129 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:07.338.288 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:07.338.368 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:12.338.532 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:12.338.616 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:17.338.781 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:17.338.859 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:22.339.023 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:22.339.105 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:27.339.251 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:27.339.320 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:32.339.478 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:32.339.605 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:37.339.754 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:37.339.862 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:42.340.008 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:42.340.119 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:47.340.266 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:47.340.367 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:52.340.510 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:52.340.582 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:57.340.745 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:14:57.340.825 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:02.340.985 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:02.341.083 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:07.341.224 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:07.341.336 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:12.341.487 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:12.341.578 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:17.341.756 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:17.341.838 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:22.341.996 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:22.342.055 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:27.342.216 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:27.342.306 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:32.342.457 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:32.342.535 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:37.342.692 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:37.342.790 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:42.342.940 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:42.343.010 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:47.343.175 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:47.343.289 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:52.343.437 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:52.343.523 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:57.343.684 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:15:57.344.407 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:02.344.554 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:02.344.621 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:07.344.776 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:07.344.845 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:12.345.009 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:12.345.087 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:17.345.261 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:17.345.326 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:22.345.487 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:22.345.588 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:27.345.734 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:27.345.800 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:32.345.961 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:32.346.038 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:37.346.195 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:37.346.273 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:42.346.462 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:42.346.529 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:47.346.682 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:47.346.775 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:52.346.917 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:52.346.988 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:57.347.142 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:16:57.347.247 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:02.347.397 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:02.347.481 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:07.347.640 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:07.347.700 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:12.347.842 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:12.347.913 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:17.348.071 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:17.348.184 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:22.348.345 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:22.348.472 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:27.348.616 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:27.348.690 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:32.348.833 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:32.348.921 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:37.349.065 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:37.349.144 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:42.349.300 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:42.349.367 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:47.349.522 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:47.349.580 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:52.349.735 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:52.349.813 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:57.349.971 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:17:57.350.055 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:02.350.205 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:02.350.260 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:07.350.443 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:07.350.531 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:12.350.684 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:12.350.765 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:17.350.914 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:17.351.017 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:22.351.165 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:22.351.241 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:27.351.394 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:27.351.468 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:32.351.625 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:32.351.706 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:37.351.867 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:37.351.940 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:42.352.080 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:42.352.167 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:47.352.345 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:47.352.426 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:52.352.578 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:52.352.633 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:57.352.782 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:18:57.352.873 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:02.353.025 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:02.353.103 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:07.353.252 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:07.353.324 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:12.353.473 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:12.353.554 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:17.353.695 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:17.353.770 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:22.353.911 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:22.353.977 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:27.354.125 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:27.354.250 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:32.354.392 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:32.354.470 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:37.354.607 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:37.354.700 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:42.354.828 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:42.354.913 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:47.355.044 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:47.355.150 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:52.355.286 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:52.355.370 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:57.355.504 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:19:57.355.581 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:02.355.710 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:02.355.768 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:07.356.999 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:07.357.080 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:12.357.272 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:12.357.337 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:17.357.477 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:17.357.565 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:22.357.702 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:22.357.805 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:27.357.936 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:27.358.016 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:32.358.146 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:32.358.225 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:37.358.361 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:37.358.439 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:42.358.571 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:42.358.690 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:47.358.848 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:47.358.929 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:52.359.092 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:52.359.198 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:57.359.335 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:20:57.359.412 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:02.359.600 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:02.359.682 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:07.359.848 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:07.359.914 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:12.360.073 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:12.360.141 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:17.360.282 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:17.360.360 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:22.360.516 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:22.360.581 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:27.360.735 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:27.360.817 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:32.360.981 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:32.361.061 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:37.361.257 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:37.361.356 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:42.361.501 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:42.361.583 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:47.361.674 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:47.361.746 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:52.361.909 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:52.361.978 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:57.362.111 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:21:57.362.179 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:02.362.338 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:02.362.449 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:07.362.598 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:07.362.718 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:12.362.860 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:12.362.941 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:17.363.105 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:17.363.229 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:22.363.364 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:22.363.432 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:27.363.591 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:27.363.667 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:32.363.825 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:32.363.885 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:37.364.042 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:37.364.122 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:42.364.275 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:42.364.332 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:47.364.482 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:47.364.560 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:52.364.713 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:52.364.788 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:57.364.943 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:22:57.365.050 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:02.365.232 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:02.365.333 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:07.365.492 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:07.365.575 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:12.365.735 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:12.365.822 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:17.365.977 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:17.366.053 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:22.366.213 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:22.366.312 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:27.366.459 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:27.366.530 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:32.366.689 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:32.366.764 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:37.366.920 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:37.367.017 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:42.367.175 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:42.367.294 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:47.367.440 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:47.367.518 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:52.367.679 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:52.367.764 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:57.367.918 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:23:57.368.014 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:02.368.143 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:02.368.209 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:07.368.393 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:07.368.531 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:12.368.687 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:12.368.752 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:17.368.907 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:17.369.004 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:22.369.160 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:22.369.270 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:27.369.448 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:27.369.523 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:32.369.681 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:32.369.762 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:37.369.910 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:37.369.975 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:42.370.135 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:42.370.208 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:47.370.357 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:47.370.415 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:52.370.559 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:52.370.611 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:57.370.761 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:24:57.370.826 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:02.370.973 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:02.371.042 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:07.371.223 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:07.371.316 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:12.371.456 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:12.371.521 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:17.371.678 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:17.371.745 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:22.371.892 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:22.371.952 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:27.372.106 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:27.372.169 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:32.372.319 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:32.372.378 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:37.372.522 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:37.372.581 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:42.372.727 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:42.372.808 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:47.372.951 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:47.373.034 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:52.373.179 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:52.373.309 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:57.373.466 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:25:57.373.549 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:02.373.702 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:02.373.764 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:07.373.913 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:07.373.970 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:12.374.118 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:12.374.177 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:17.374.328 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:17.374.412 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:22.374.544 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:22.374.599 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:27.374.747 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:27.374.802 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:32.374.972 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:32.375.044 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:37.375.198 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:37.375.251 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:42.375.399 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:42.375.451 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:47.375.599 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:47.375.657 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:52.375.808 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:52.375.908 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:57.376.045 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:26:57.376.122 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:02.376.266 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:02.376.320 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:07.376.467 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:07.376.527 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:12.376.675 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:12.377.413 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:17.377.566 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:17.377.626 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:22.377.773 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:22.377.832 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:27.377.975 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:27.378.062 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:32.378.200 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:32.378.270 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:37.378.426 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:37.378.493 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:42.378.643 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:42.378.729 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:47.378.874 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:47.378.964 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:52.379.155 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:52.379.325 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:57.379.508 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:27:57.379.579 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:02.379.727 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:02.379.803 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:07.379.988 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:07.380.099 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:12.380.242 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:12.380.316 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:17.380.468 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:17.380.547 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:22.380.720 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:22.380.811 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:27.381.537 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:27.381.654 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:32.381.805 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:32.381.871 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:37.382.088 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:37.383.183 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:42.383.326 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:42.383.382 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:47.383.528 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:47.383.589 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:52.383.742 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:52.383.810 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:57.383.963 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:28:57.384.022 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:02.384.179 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:02.384.251 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:07.384.402 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:07.384.462 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:12.384.612 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:12.384.692 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:17.384.844 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:17.384.905 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:22.385.083 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:22.385.144 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:27.385.306 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:27.385.359 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:32.385.513 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:32.385.576 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:37.385.784 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:37.385.981 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:42.386.145 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:42.386.216 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:47.386.367 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:47.386.429 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:52.386.574 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:52.386.633 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:57.386.786 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:29:57.386.852 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:02.386.993 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:02.387.095 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:07.387.226 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:07.387.279 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:12.387.424 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:12.387.484 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:17.387.635 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:17.387.691 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:22.387.902 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:22.388.071 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:27.388.230 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:27.388.295 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:32.388.447 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:32.388.515 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:37.388.660 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:37.388.718 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:42.388.859 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:42.388.917 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:47.389.084 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:47.389.142 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:52.389.307 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:52.389.355 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:57.389.504 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:30:57.389.573 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:02.389.723 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:02.389.779 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:07.389.933 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:07.389.994 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:12.390.140 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:12.390.202 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:17.390.353 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:17.390.412 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:22.390.557 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:22.390.612 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:27.390.790 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:27.390.845 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:32.390.995 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:32.391.055 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:37.391.204 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:37.391.269 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:42.391.410 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:42.391.468 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:47.391.615 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:47.391.707 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:52.391.880 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:52.392.043 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:57.392.200 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:31:57.392.259 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:02.392.401 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:02.392.457 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:07.392.616 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:07.393.441 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:12.393.585 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:12.393.648 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:17.393.794 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:17.393.850 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:22.394.004 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:22.394.063 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:27.394.213 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:27.394.270 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:32.394.418 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:32.394.478 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:37.394.669 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:37.394.839 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:42.394.996 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:42.395.079 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:47.395.226 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:47.395.282 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:52.395.483 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:52.395.574 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:57.395.735 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:32:57.395.809 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:02.395.959 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:02.396.018 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:07.396.162 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:07.396.219 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:12.396.372 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:12.396.430 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:17.396.584 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:17.396.641 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:22.396.788 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:22.396.854 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:27.397.007 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:27.397.077 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:32.397.232 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:32.398.019 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:37.398.157 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:37.398.217 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:42.398.358 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:42.398.426 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:47.398.580 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:47.398.640 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:52.398.787 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:52.398.846 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:57.398.990 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:33:57.399.060 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:02.399.943 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:02.400.003 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:07.400.183 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:07.400.266 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:12.400.415 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:12.400.471 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:17.400.642 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:17.400.712 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:22.400.906 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:22.400.996 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:27.401.151 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:27.401.209 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:32.401.325 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:32.401.387 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:37.401.536 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:37.401.616 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:42.401.770 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:42.401.830 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:47.401.966 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:47.402.024 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:52.402.175 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:52.402.240 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:57.402.395 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:34:57.402.476 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:02.402.608 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:02.402.669 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:07.403.386 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:07.403.462 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:12.403.612 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:12.403.708 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:17.403.859 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:17.403.931 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:22.404.080 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:22.404.148 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:27.404.305 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:27.404.382 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:32.404.524 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:32.404.570 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:37.404.713 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:37.404.767 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:42.404.929 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:42.404.984 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:47.405.121 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:47.405.174 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:52.405.371 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:52.405.483 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:57.405.626 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:35:57.405.688 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:02.405.846 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:02.405.908 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:07.406.069 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:07.406.132 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:12.406.290 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:12.406.354 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:17.406.510 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:17.406.572 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:22.406.726 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:22.406.843 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:27.406.987 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:27.407.044 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:32.407.913 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:32.407.970 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:37.408.166 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:37.408.262 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:42.408.409 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:42.408.476 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:47.408.631 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:47.408.728 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:52.408.883 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:52.408.944 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:57.409.090 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:36:57.409.154 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:02.409.338 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:02.409.450 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:07.409.670 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:07.409.769 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:12.409.923 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:12.409.984 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:17.410.136 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:17.410.221 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:22.410.365 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:22.410.419 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:27.410.572 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:27.410.628 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:32.411.784 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:32.411.901 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:37.412.053 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:37.412.149 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:42.412.299 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:42.412.359 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:47.412.514 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:47.412.580 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:52.412.735 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:52.412.793 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:57.412.940 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:37:57.412.998 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:02.413.143 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:02.413.200 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:07.413.329 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:07.413.420 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:12.413.638 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:12.413.804 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:17.413.957 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:17.414.017 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:22.414.171 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:22.414.230 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:27.414.381 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:27.414.472 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:32.414.614 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:32.414.668 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:37.414.819 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:37.414.883 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:42.415.035 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:42.415.098 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:47.415.247 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:47.415.305 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:52.415.493 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:52.415.594 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:57.415.753 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:38:57.415.808 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:02.415.963 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:02.416.056 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:07.416.196 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:07.416.254 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:12.416.420 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:12.416.482 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:17.416.634 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:17.416.701 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:22.416.862 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:22.416.940 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:27.417.092 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:27.417.157 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:32.417.320 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:32.417.377 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:37.417.526 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:37.417.596 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:42.417.750 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:42.417.809 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:47.417.957 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:47.418.021 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:52.418.171 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:52.418.270 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:57.418.400 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:39:57.418.460 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:02.418.614 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:02.418.717 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:07.418.875 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:07.418.939 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:12.419.083 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:12.419.140 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:17.419.288 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:17.419.338 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:22.419.486 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:22.419.546 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:27.419.691 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:27.419.741 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:32.419.890 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:32.419.966 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:37.420.141 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:37.420.204 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:42.420.363 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:42.420.448 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:47.420.579 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:47.420.643 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:52.420.792 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:52.420.849 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:57.420.992 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:40:57.421.049 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:02.421.189 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:02.421.260 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:07.421.415 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:07.421.479 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:12.421.625 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:12.421.680 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:17.421.825 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:17.422.598 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:22.422.809 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:22.422.980 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:27.423.137 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:27.423.196 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:32.423.351 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:32.423.421 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:37.423.571 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:37.423.631 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:42.423.792 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:42.423.892 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:47.424.047 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:47.424.107 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:52.424.283 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:52.424.374 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:57.424.532 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:41:57.424.594 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:02.424.764 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:02.424.826 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:07.424.979 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:07.425.036 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:12.425.193 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:12.425.283 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:17.425.441 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:17.425.517 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:22.425.670 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:22.425.729 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:27.425.878 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:27.425.944 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:32.426.099 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:32.426.160 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:37.426.305 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:37.426.392 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:42.426.535 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:42.426.689 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:47.426.837 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:47.426.904 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:52.427.060 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:52.427.122 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:57.427.262 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:42:57.427.319 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:02.427.473 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:02.427.569 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:07.427.721 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:07.427.787 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:12.427.930 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:12.427.990 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:17.428.142 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:17.428.207 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:22.428.423 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:22.428.579 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:27.428.790 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:27.428.853 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:32.429.071 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:32.429.283 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:37.429.442 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:37.429.501 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:42.429.651 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:42.429.743 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:47.429.891 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:47.429.952 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:52.430.105 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:52.430.227 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:57.430.382 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:43:57.430.440 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:02.430.591 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:02.430.651 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:07.430.828 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:07.430.908 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:12.431.057 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:12.431.114 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:17.431.261 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:17.431.331 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:22.431.489 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:22.431.571 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:27.431.723 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:27.431.796 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:32.431.949 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:32.432.017 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:37.432.171 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:37.432.242 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:42.432.393 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:42.432.460 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:47.432.609 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:47.433.331 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:52.433.468 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:52.433.537 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:57.433.647 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:44:57.433.707 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:02.433.860 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:02.433.932 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:07.434.090 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:07.434.173 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:12.434.331 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:12.434.408 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:17.434.569 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:17.434.666 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:22.434.874 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:22.435.029 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:27.435.193 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:27.435.264 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:32.435.443 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:32.435.509 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:37.435.660 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:37.435.731 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:42.435.883 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:42.435.951 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:47.436.056 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:47.436.122 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:52.436.271 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:52.436.334 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:57.436.476 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:45:57.436.535 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:02.436.685 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:02.436.741 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:07.436.896 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:07.436.995 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:12.437.143 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:12.437.937 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:17.438.082 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:17.438.152 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:22.438.299 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:22.438.361 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:27.438.506 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:27.438.568 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:32.438.724 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:32.438.805 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:37.438.961 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:37.439.024 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:42.439.152 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:42.439.232 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:47.439.384 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:47.439.447 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:52.439.652 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:52.439.808 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:57.439.997 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:46:57.440.066 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:02.440.204 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:02.440.267 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:07.440.441 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:07.440.545 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:12.440.701 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:12.440.789 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:17.440.938 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:17.441.010 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:22.441.165 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:22.441.235 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:27.441.403 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:27.441.480 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:32.441.638 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:32.442.029 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:37.442.172 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:37.442.986 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:42.443.130 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:42.443.249 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:47.443.401 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:47.443.477 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:52.443.658 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:52.443.756 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:57.443.913 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:47:57.443.991 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:02.444.121 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:02.444.197 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:07.444.330 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:07.444.416 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:12.444.576 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:12.444.636 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:17.444.792 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:17.444.854 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:22.445.021 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:22.445.079 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:27.445.231 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:27.445.307 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:32.445.462 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:32.445.541 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:37.445.695 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:37.445.764 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:42.445.916 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:42.445.976 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:47.446.127 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:47.446.184 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:52.446.334 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:52.446.394 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:57.446.532 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:48:57.446.594 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:02.446.738 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:02.447.429 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:07.447.570 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:07.447.678 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:12.447.827 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:12.447.895 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:17.448.045 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:17.448.138 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:22.448.279 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:22.448.345 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:27.448.492 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:27.448.555 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:32.448.708 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:32.448.779 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:37.448.931 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:37.448.989 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:42.449.145 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:42.449.213 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:47.449.403 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:47.449.521 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:52.449.677 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:52.449.765 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:57.449.902 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:49:57.449.958 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:02.450.097 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:02.450.153 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:07.450.304 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:07.450.364 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:12.450.518 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:12.450.617 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:17.450.748 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:17.450.798 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:22.450.951 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:22.451.007 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:27.451.181 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:27.451.238 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:32.451.391 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:32.451.451 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:37.451.601 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:37.451.667 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:42.451.821 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:42.451.881 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:47.452.028 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:47.452.085 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:52.452.857 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:52.452.922 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:57.453.073 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:50:57.453.130 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:02.453.291 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:02.453.402 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:07.453.549 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:07.453.635 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:12.453.776 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:12.453.838 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:17.453.989 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:17.454.055 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:22.454.204 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:22.454.270 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:27.454.418 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:27.454.476 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:32.454.672 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:32.454.794 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:37.454.939 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:37.455.003 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:42.455.160 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:42.455.233 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:47.455.387 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:47.455.444 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:52.455.621 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:52.455.681 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:57.455.818 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:51:57.455.876 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:02.456.614 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:02.456.688 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:07.456.842 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:07.456.909 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:12.457.104 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:12.457.287 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:17.458.339 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:17.458.397 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:22.458.548 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:22.458.617 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:27.458.763 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:27.458.824 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:32.458.976 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:32.459.728 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:37.459.872 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:37.459.926 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:42.460.155 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:42.460.281 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:47.460.444 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:47.460.508 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:52.460.660 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:52.460.739 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:57.460.892 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:52:57.460.948 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:02.461.114 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:02.461.204 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:07.461.318 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:07.461.383 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:12.461.592 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:12.461.820 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:17.462.002 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:17.462.060 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:22.462.225 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:22.462.325 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:27.462.467 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:27.462.523 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:32.462.670 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:32.462.736 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:37.462.885 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:37.462.941 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:42.463.095 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:42.463.154 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:47.463.318 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:47.463.444 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:52.463.600 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:52.463.692 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:57.463.833 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:53:57.464.532 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:02.464.672 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:02.464.730 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:07.464.868 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:07.464.926 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:12.465.078 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:12.465.156 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:17.465.325 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:17.465.455 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:22.465.607 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:22.465.680 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:27.465.839 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:27.465.900 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:32.466.051 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:32.466.113 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:37.466.266 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:37.466.326 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:42.466.497 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:42.466.553 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:47.466.705 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:47.466.758 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:52.466.909 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:52.466.972 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:57.467.122 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:54:57.467.177 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:02.467.327 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:02.467.390 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:07.467.539 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:07.467.625 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:12.467.754 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:12.467.816 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:17.467.964 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:17.468.052 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:22.468.202 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:22.468.941 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:27.469.074 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:27.469.131 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:32.469.308 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:32.469.387 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:37.469.541 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:37.469.612 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:42.469.761 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:42.469.828 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:47.469.982 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:47.470.036 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:52.470.194 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:52.470.268 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:57.470.420 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:55:57.470.481 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:02.470.629 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:02.470.697 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:07.470.877 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:07.470.939 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:12.471.148 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:12.471.257 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:17.471.406 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:17.471.466 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:22.472.663 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:22.472.726 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:27.472.877 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:27.472.934 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:32.473.085 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:32.473.150 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:37.473.310 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:37.473.365 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:42.473.519 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:42.473.587 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:47.473.758 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:47.473.823 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:52.473.974 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:52.474.059 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:57.474.201 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:56:57.474.261 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:02.474.408 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:02.474.464 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:07.474.598 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:07.474.657 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:12.474.808 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:12.474.869 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:17.475.025 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:17.475.088 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:22.475.229 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:22.475.285 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:27.475.433 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:27.475.526 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:32.475.668 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:32.475.729 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:37.475.876 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:37.475.970 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:42.476.117 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:42.476.192 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:47.476.340 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:47.476.399 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:52.476.551 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:52.476.615 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:57.476.767 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:57:57.476.824 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:02.476.973 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:02.477.035 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:07.477.184 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:07.477.255 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:12.477.416 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:12.477.477 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:17.477.626 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:17.477.687 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:22.477.839 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:22.477.898 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:27.478.044 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:27.478.105 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:32.478.256 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:32.478.312 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:37.478.464 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:37.478.543 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:42.478.691 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:42.478.746 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:47.478.895 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:47.478.955 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:52.479.104 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:52.480.028 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:57.480.171 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:58:57.480.224 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:02.480.378 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:02.480.430 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:07.480.577 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:07.480.633 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:12.480.789 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:12.480.858 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:17.481.020 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:17.481.096 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:22.481.261 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:22.481.330 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:27.481.486 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:27.481.546 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:32.481.698 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:32.481.771 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:37.481.948 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:37.482.020 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:42.482.165 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:42.482.218 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:47.482.370 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:47.482.431 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:52.482.594 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:52.482.674 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:57.482.822 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-18:59:57.482.876 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:02.483.024 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:02.483.090 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:07.483.223 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:07.483.282 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:12.483.445 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:12.483.524 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:17.483.682 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:17.484.567 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:22.484.708 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:22.484.804 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:27.484.955 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:27.485.010 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:32.485.136 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:32.485.203 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:37.485.326 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:37.485.386 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:42.485.541 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:42.485.598 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:47.485.746 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:47.485.804 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:52.485.952 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:52.486.014 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:57.486.174 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:00:57.486.259 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:02.486.420 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:02.486.476 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:07.486.619 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:07.486.675 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:12.486.859 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:12.486.971 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:17.487.137 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:17.487.196 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:22.487.344 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:22.487.398 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:27.487.547 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:27.487.609 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:32.487.759 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:32.487.846 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:37.487.995 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:37.488.052 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:42.488.200 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:42.488.867 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:47.489.015 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:47.489.167 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:52.489.322 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:52.489.394 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:57.489.542 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:01:57.489.603 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:02.489.763 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:02.489.825 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:07.489.976 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:07.490.062 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:12.490.208 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:12.490.281 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:17.490.429 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:17.490.504 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:22.490.662 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:22.490.740 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:27.490.915 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:27.490.976 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:32.491.127 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:32.491.196 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:37.491.344 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:37.491.414 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:42.491.571 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:42.491.637 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:47.491.792 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:47.491.855 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:52.492.006 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:52.492.075 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:57.492.232 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:02:57.492.292 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:02.492.453 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:02.492.513 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:07.492.662 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:07.492.761 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:12.492.904 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:12.818.172 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:17.818.326 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:17.822.399 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:22.822.552 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:22.824.548 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:27.824.703 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:27.826.180 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:32.826.331 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:32.826.381 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:37.826.524 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:37.826.573 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:42.826.719 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:42.827.739 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:47.827.877 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:47.827.996 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:52.828.144 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:52.830.854 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:57.830.992 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:03:57.833.029 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:02.833.169 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:02.833.229 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:07.876.932 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:07.878.622 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:12.878.767 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:12.881.042 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:17.881.186 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:17.882.732 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:22.882.864 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:22.883.797 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:27.883.935 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:27.890.913 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:32.891.084 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:32.891.142 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:37.891.277 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:37.891.341 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:42.923.505 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:42.924.796 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:47.924.936 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:47.929.621 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:52.929.760 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:52.929.818 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:57.929.954 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:04:57.932.343 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:02.932.483 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:02.932.556 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:07.932.735 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:07.932.841 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:12.932.972 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:12.935.511 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:17.935.652 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:17.935.726 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:22.935.879 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:22.935.963 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:27.936.093 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:27.936.179 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:32.936.327 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:32.936.393 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:37.936.533 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:37.936.603 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:42.936.755 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:42.936.814 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:47.936.966 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:47.937.020 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:52.937.173 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:52.937.232 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:57.937.418 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:05:57.937.475 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:02.937.624 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:02.937.695 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:07.937.845 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:07.937.908 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:12.938.057 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:12.938.126 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:17.938.276 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:17.938.353 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:22.938.508 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:22.938.576 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:27.938.724 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:27.938.794 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:32.938.946 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:32.939.012 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:37.939.163 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:37.939.965 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:42.940.104 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:42.940.167 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:47.941.702 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:47.941.767 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:52.941.918 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:52.941.975 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:57.942.963 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:06:57.943.020 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:02.943.169 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:02.943.225 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:07.943.368 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:07.943.481 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:12.943.633 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:12.943.695 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:17.943.853 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:17.943.969 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:22.944.132 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:22.944.186 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:27.944.334 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:27.944.397 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:32.944.548 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:32.944.618 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:37.944.771 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:37.944.834 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:42.944.986 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:42.945.045 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:47.945.198 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:47.945.278 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:52.945.431 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:52.945.557 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:57.945.780 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:07:57.945.883 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:02.946.045 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:02.946.140 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:07.946.280 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:07.946.342 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:12.946.477 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:12.946.599 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:17.946.841 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:17.946.965 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:22.947.102 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:22.947.150 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:27.947.293 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:27.947.347 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:32.947.491 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:32.947.558 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:37.947.703 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:37.947.778 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:42.947.929 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:42.947.991 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:47.948.168 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:47.948.245 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:52.948.394 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:52.948.466 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:57.948.615 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:08:57.948.680 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:02.948.833 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:02.948.905 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:07.949.068 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:07.949.195 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:12.949.329 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:12.949.407 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:17.949.560 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:17.949.621 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:22.949.779 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:22.949.856 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:27.950.010 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:27.950.795 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:32.950.939 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:32.950.998 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:37.951.702 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:37.951.778 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:42.951.938 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:42.952.022 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:47.952.188 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:47.952.271 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:52.952.444 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:52.952.555 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:57.952.722 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:09:57.952.799 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:02.952.954 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:02.953.023 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:07.953.181 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:07.953.851 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:12.954.003 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:12.954.082 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:17.954.243 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:17.954.341 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:22.954.485 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:22.954.563 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:27.954.727 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:27.954.807 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:32.954.964 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:32.955.069 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:37.955.219 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:37.955.285 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:42.955.439 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:42.955.566 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:47.955.728 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:47.955.810 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:52.955.998 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:52.956.095 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:57.956.250 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:10:57.956.370 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:02.956.536 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:02.956.617 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:07.956.746 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:07.956.802 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:12.956.950 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:12.957.027 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:17.957.191 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:17.957.288 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:22.957.451 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:22.957.524 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:27.957.679 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:27.957.782 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:32.957.922 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:32.958.088 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:37.958.229 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:37.958.293 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:42.958.444 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:42.958.520 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:47.958.672 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:47.958.773 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:52.958.926 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:52.958.990 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:57.959.141 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:11:57.959.205 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:02.959.362 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:02.959.459 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:07.959.600 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:07.959.675 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:12.959.822 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:12.959.884 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:17.960.063 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:17.960.142 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:22.960.297 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:22.960.376 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:27.960.532 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:27.960.627 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:32.960.774 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:32.960.855 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:37.961.011 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:37.961.108 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:42.961.259 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:42.961.314 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:47.961.476 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:47.961.571 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:52.961.719 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:52.961.797 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:57.961.960 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:12:57.962.677 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:02.962.829 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:02.962.903 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:07.963.055 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:07.963.128 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:12.963.282 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:12.963.340 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:17.963.494 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:17.963.569 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:22.963.725 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:22.963.802 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:27.963.965 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:27.964.042 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:32.964.200 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:32.964.264 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:37.964.427 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:37.964.507 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:42.964.689 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:42.964.751 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:47.964.893 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:47.964.994 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:52.965.159 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:52.965.258 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:57.965.500 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:13:57.965.677 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:02.965.854 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:02.965.939 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:07.966.095 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:07.966.177 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:12.966.336 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:12.966.401 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:17.966.552 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:17.966.612 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:22.966.751 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:22.966.851 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:27.967.001 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:27.967.073 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:32.967.224 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:32.967.287 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:37.967.449 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:37.967.525 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:42.967.681 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:42.967.811 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:47.967.961 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:47.968.022 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:52.968.176 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:52.968.240 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:57.968.389 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:14:57.968.467 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:02.968.619 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:02.968.722 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:07.968.894 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:07.968.967 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:12.969.129 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:12.969.194 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:17.969.313 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:17.969.371 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:22.969.520 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:22.969.576 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:27.969.730 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:27.969.793 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:32.969.945 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:32.969.998 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:37.970.155 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:37.970.220 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:42.970.373 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:42.970.436 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:47.970.586 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:47.972.042 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:52.972.182 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:52.972.239 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:57.972.392 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:15:57.972.450 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:02.972.597 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:02.972.655 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:07.972.806 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:07.972.880 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:12.973.030 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:12.973.098 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:17.973.262 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:17.973.343 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:22.973.483 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:22.973.540 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:27.973.698 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:27.974.448 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:32.974.624 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:32.974.738 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:37.974.890 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:37.974.949 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:42.975.108 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:42.975.178 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:47.975.335 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:47.975.429 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:52.975.571 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:52.975.629 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:57.975.784 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:16:57.975.884 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:02.976.032 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:02.976.096 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:07.976.248 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:07.976.318 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:12.976.502 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:12.976.571 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:17.976.729 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:17.976.792 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:22.976.936 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:22.976.996 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:27.977.152 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:27.977.225 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:32.979.151 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:32.979.211 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:37.979.364 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:37.979.430 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:42.979.586 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:42.979.683 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:47.979.827 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:47.979.892 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:52.980.039 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:52.980.838 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:57.980.984 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:17:57.981.053 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:02.981.208 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:02.981.284 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:07.981.442 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:07.981.515 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:12.981.674 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:12.981.745 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:17.981.889 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:17.981.952 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:22.982.106 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:22.982.171 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:27.982.327 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:27.982.393 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:32.982.539 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:32.982.593 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:37.982.766 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:37.982.833 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:42.982.991 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:42.983.065 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:47.983.219 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:47.983.295 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:52.983.447 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:52.983.520 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:57.983.681 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:18:57.983.750 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:02.983.906 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:02.983.963 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:07.984.113 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:07.984.175 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:12.984.337 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:12.984.414 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:17.984.571 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:17.985.370 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:22.985.500 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:22.985.569 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:27.986.358 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:27.986.434 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:32.986.588 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:32.986.663 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:37.987.382 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:37.987.462 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:42.987.620 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:42.987.691 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:47.987.843 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:47.987.931 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:52.988.072 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:52.988.143 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:57.988.305 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:19:57.988.386 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:02.988.565 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:02.988.629 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:07.988.778 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:07.988.846 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:12.989.633 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:12.989.706 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:17.989.860 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:17.989.925 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:22.990.078 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:22.990.157 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:27.990.309 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:27.990.380 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:32.990.532 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:32.990.599 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:37.990.750 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:37.990.824 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:42.990.972 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:42.991.645 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:47.991.785 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:47.991.849 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:52.991.998 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:52.992.065 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:57.992.220 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:20:57.992.311 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:02.992.451 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:02.992.508 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:07.992.658 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:07.992.722 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:12.992.879 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:12.992.941 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:17.993.092 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:17.993.165 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:22.993.332 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:22.993.428 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:27.993.607 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:27.993.665 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:32.993.817 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:32.993.912 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:37.994.052 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:37.994.114 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:42.994.273 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:42.994.342 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:47.994.499 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:47.994.583 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:52.994.733 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:52.994.796 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:57.994.962 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:21:57.995.043 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:02.995.195 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:02.995.264 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:07.995.416 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:07.996.227 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:12.996.373 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:12.996.433 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:17.996.585 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:17.996.650 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:22.996.805 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:22.996.879 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:27.997.035 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:27.997.128 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:32.997.290 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:32.997.378 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:37.997.528 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:37.997.587 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:42.997.712 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:42.997.810 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:47.997.951 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:47.998.711 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:52.998.852 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:52.998.905 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:57.999.060 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:22:57.999.124 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:02.999.272 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:02.999.331 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:07.999.480 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:07.999.554 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:12.999.708 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:12.999.770 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:17.999.914 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:17.999.997 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:23.000.099 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:23.000.160 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:28.000.302 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:28.000.361 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:33.000.537 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:33.000.613 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:38.001.290 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:38.001.377 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:43.001.522 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:43.001.590 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:48.001.754 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:48.001.832 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:53.001.984 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:53.002.053 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:58.002.198 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:23:58.002.300 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:03.002.403 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:03.002.472 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:08.002.611 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:08.002.669 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:13.002.825 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:13.003.535 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:18.003.666 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:18.003.741 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:23.003.906 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:23.003.996 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:28.004.143 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:28.004.216 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:33.004.387 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:33.004.464 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:38.004.620 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:38.004.689 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:43.004.848 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:43.004.925 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:48.005.077 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:48.005.146 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:53.005.308 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:53.005.376 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:58.005.557 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:24:58.005.681 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:03.005.833 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:03.006.689 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:08.006.836 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:08.006.914 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:13.007.063 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:13.007.155 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:18.007.291 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:18.007.364 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:23.007.506 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:23.007.601 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:28.007.740 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:28.007.812 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:33.007.959 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:33.008.033 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:38.008.180 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:38.008.304 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:43.008.448 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:43.008.516 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:48.008.666 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:48.008.733 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:53.008.881 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:53.008.958 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:58.009.110 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:25:58.009.186 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:03.009.325 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:03.009.405 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:08.009.556 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:08.009.622 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:13.009.766 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:13.009.854 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:18.009.996 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:18.010.073 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:23.010.255 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:23.010.326 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:28.010.468 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:28.010.526 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:33.010.685 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:33.010.793 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:38.010.931 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:38.010.988 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:43.011.136 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:43.011.198 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:48.011.349 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:48.011.444 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:53.011.586 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:53.011.651 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:58.011.806 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:26:58.011.885 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:03.012.040 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:03.012.168 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:08.012.312 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:08.012.391 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:13.012.545 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:13.012.644 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:18.012.784 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:18.012.862 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:23.013.014 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:23.013.076 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:28.013.235 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:28.013.342 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:33.013.490 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:33.013.572 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:38.013.730 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:38.013.824 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:43.013.974 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:43.014.077 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:48.014.251 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:48.014.338 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:53.014.491 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:53.014.550 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:58.014.711 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:27:58.014.802 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:03.014.945 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:03.015.038 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:08.015.181 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:08.015.268 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:13.015.413 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:13.015.488 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:18.015.642 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:18.015.728 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:23.015.862 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:23.015.929 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:28.016.088 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:28.017.268 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:33.017.382 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:33.017.484 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:38.017.620 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:38.017.718 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:43.017.869 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:43.017.931 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:48.018.093 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:48.018.177 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:53.018.332 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:53.018.393 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:58.018.548 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:28:58.018.609 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:03.018.766 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:03.018.838 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:08.018.994 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:08.019.667 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:13.019.812 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:13.019.898 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:18.020.044 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:18.020.111 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:23.020.268 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:23.020.345 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:28.020.480 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:28.020.536 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:33.020.685 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:33.020.750 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:38.020.914 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:38.020.991 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:43.021.151 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:43.021.231 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:48.022.201 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:48.022.303 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:53.022.496 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:53.022.565 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:58.022.723 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:29:58.022.795 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:03.022.945 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:03.023.012 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:08.023.170 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:08.023.261 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:13.023.405 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:13.023.480 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:18.023.636 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:18.023.736 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:23.023.884 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:23.023.964 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:28.024.119 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:28.024.212 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:33.024.358 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:33.025.144 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:38.025.298 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:38.025.383 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:43.025.523 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:43.025.593 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:48.025.746 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:48.025.819 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:53.025.970 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:53.026.036 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:58.026.189 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:30:58.026.248 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:03.026.402 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:03.026.486 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:08.026.641 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:08.026.718 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:13.026.872 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:13.026.944 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:18.027.128 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:18.027.201 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:23.027.351 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:23.027.411 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:28.027.570 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:28.027.667 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:33.027.806 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:33.027.897 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:38.028.031 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:38.028.092 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:43.028.248 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:43.028.326 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:48.028.476 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:48.028.535 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:53.028.691 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:53.028.750 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:58.028.898 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:31:58.028.992 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:03.029.131 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:03.029.220 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:08.029.313 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:08.029.371 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:13.029.521 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:13.029.607 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:18.029.749 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:18.029.836 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:23.029.978 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:23.030.080 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:28.030.220 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:28.030.275 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:33.030.429 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:33.030.508 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:38.030.656 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:38.030.715 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:43.030.897 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:43.030.975 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:48.031.132 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:48.031.189 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:53.031.344 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:53.031.406 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:58.031.559 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:32:58.031.641 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:03.031.785 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:03.031.864 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:08.032.061 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:08.032.198 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:13.032.338 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:13.032.420 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:18.032.553 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:18.032.656 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:23.032.809 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:23.033.633 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:28.033.775 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:28.033.838 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:33.033.981 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:33.034.042 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:38.034.195 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:38.034.257 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:43.034.413 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:43.034.473 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:48.034.616 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:48.034.706 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:53.034.847 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:53.034.917 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:58.035.067 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:33:58.035.132 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:03.035.292 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:03.035.371 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:08.035.546 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:08.035.628 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:13.035.769 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:13.035.826 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:18.035.982 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:18.036.047 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:23.036.197 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:23.036.265 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:28.036.420 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:28.036.489 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:33.036.650 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:33.036.712 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:38.036.864 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:38.036.927 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:43.037.083 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:43.037.163 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:48.037.319 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:48.037.420 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:53.037.559 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:53.037.623 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:58.037.771 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:34:58.037.861 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:03.038.012 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:03.038.072 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:08.038.220 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:08.038.281 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:13.038.430 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:13.038.496 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:18.038.652 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:18.038.719 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:23.038.873 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:23.038.939 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:28.039.086 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:28.039.181 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:33.039.348 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:33.039.435 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:38.039.577 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:38.039.674 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:43.039.803 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:43.039.862 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:48.040.013 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:48.040.087 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:53.040.239 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:53.040.364 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:58.040.522 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:35:58.040.635 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:03.040.797 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:03.040.877 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:08.041.033 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:08.041.121 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:13.041.309 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:13.041.383 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:18.041.525 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:18.041.590 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:23.041.730 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:23.041.864 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:28.042.024 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:28.042.108 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:33.042.258 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:33.042.348 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:38.042.491 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:38.042.562 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:43.042.718 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:43.042.813 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:48.042.953 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:48.043.023 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:53.043.176 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:53.043.893 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:58.044.037 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:36:58.044.128 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:03.044.273 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:03.044.353 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:08.044.506 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:08.044.573 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:13.044.725 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:13.044.788 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:18.044.939 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:18.045.034 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:23.045.179 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:23.045.251 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:28.045.409 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:28.045.475 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:33.045.628 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:33.045.699 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:38.045.862 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:38.045.921 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:43.046.074 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:43.046.209 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:48.046.369 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:48.046.512 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:53.046.665 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:53.046.752 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:58.046.894 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:37:58.046.960 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:03.047.125 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:03.047.187 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:08.047.335 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:08.047.398 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:13.047.555 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:13.047.630 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:18.047.778 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:18.048.452 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:23.048.600 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:23.048.685 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:28.048.852 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:28.048.928 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:33.049.075 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:33.052.394 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:38.052.543 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:38.052.607 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:43.056.376 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:43.056.995 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:48.057.141 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:48.060.919 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:53.061.066 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:53.061.605 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:58.061.749 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:38:58.061.807 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:03.061.979 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:03.062.656 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:08.062.803 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:08.062.855 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:13.063.000 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:13.063.070 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:18.065.425 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:18.065.486 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:23.068.711 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:23.068.773 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:28.068.915 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:28.069.032 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:33.069.177 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:33.073.515 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:38.073.660 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:38.073.720 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:43.073.859 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:43.087.138 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:48.087.279 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:48.087.341 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:53.906.529 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:53.906.608 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:58.907.644 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:39:58.910.405 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:03.910.570 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:03.910.631 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:08.910.780 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:08.910.836 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:13.910.989 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:13.911.119 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:18.911.278 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:18.911.385 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:23.911.531 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:23.911.614 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:28.911.826 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:28.911.960 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:33.912.118 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:33.912.239 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:38.912.401 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:38.912.492 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:43.912.657 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:43.912.788 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:48.912.954 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:48.913.073 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:53.913.258 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:53.913.371 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:58.913.527 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:40:58.913.611 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:03.913.772 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:03.913.876 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:08.914.022 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:08.914.753 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:13.914.901 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:13.914.999 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:18.915.148 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:18.915.260 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:23.915.418 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:23.915.535 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:28.915.696 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:28.915.786 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:33.915.952 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:33.916.037 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:38.916.202 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:38.916.288 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:43.916.447 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:43.916.545 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:48.916.692 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:48.916.801 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:53.916.989 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:53.917.101 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:58.917.279 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:41:58.917.377 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:03.917.586 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:03.917.735 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:08.917.883 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:08.917.964 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:13.918.120 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:13.918.199 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:18.918.362 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:18.918.475 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:23.918.634 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:23.918.748 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:28.918.909 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:28.919.025 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:33.919.190 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:33.919.264 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:38.919.418 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:38.919.499 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:43.919.645 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:43.919.725 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:48.919.883 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:48.919.965 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:53.920.121 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:53.920.200 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:58.920.362 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:42:58.920.466 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:03.920.585 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:03.920.696 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:08.920.854 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:08.920.947 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:13.921.096 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:13.921.212 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:18.921.333 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:18.921.394 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:23.921.545 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:23.921.620 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:28.921.778 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:28.921.856 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:33.922.666 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:33.922.776 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:38.922.940 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:38.923.042 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:43.923.200 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:43.923.272 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:48.923.426 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:48.923.521 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:53.923.664 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:53.923.730 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:58.923.917 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:43:58.923.995 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:03.924.150 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:03.924.223 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:08.924.379 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:08.924.474 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:13.924.613 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:13.924.703 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:18.924.858 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:18.924.933 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:23.925.090 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:23.925.211 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:28.925.330 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:28.925.406 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:33.925.565 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:33.925.647 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:38.925.810 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:38.926.562 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:43.926.712 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:43.926.794 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:48.926.950 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:48.927.050 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:53.927.201 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:53.927.278 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:58.927.436 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:44:58.927.531 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:03.927.672 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:03.927.765 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:08.927.916 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:08.928.006 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:13.928.790 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:13.928.914 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:18.929.073 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:18.929.194 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:23.929.409 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:23.929.523 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:28.929.680 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:28.929.767 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:33.929.921 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:33.930.012 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:38.930.165 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:38.930.270 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:43.930.427 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:43.930.512 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:48.930.680 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:48.930.803 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:53.930.965 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:53.931.041 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:58.931.205 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:45:58.931.292 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:03.931.450 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:03.931.576 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:08.931.717 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:08.931.795 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:13.931.952 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:13.932.017 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:18.932.138 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:18.932.221 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:23.932.377 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:23.932.454 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:28.932.617 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:28.932.698 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:33.932.857 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:33.932.936 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:38.933.098 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:38.933.177 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:43.933.341 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:43.933.427 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:48.933.614 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:48.933.692 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:53.933.846 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:53.933.924 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:58.934.080 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:46:58.934.189 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:03.934.350 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:03.934.470 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:08.934.625 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:08.934.706 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:13.934.847 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:13.934.906 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:18.935.063 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:18.935.158 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:23.935.310 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:23.935.368 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:28.935.518 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:28.936.268 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:33.936.409 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:33.936.483 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:38.936.639 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:38.936.719 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:43.936.874 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:43.936.932 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:48.937.093 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:48.937.170 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:53.937.341 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:53.937.429 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:58.937.584 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:47:58.937.661 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:03.937.821 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:03.937.898 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:08.938.054 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:08.938.196 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:13.938.376 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:13.938.455 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:18.938.598 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:18.938.672 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:23.938.826 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:23.938.901 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:28.939.062 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:28.939.160 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:33.939.307 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:33.939.370 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:38.939.525 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:38.939.601 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:43.939.755 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:43.939.833 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:48.939.987 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:48.940.062 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:53.940.245 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:53.940.323 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:58.940.480 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:48:58.940.538 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:03.940.689 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:03.940.754 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:08.940.908 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:08.941.046 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:13.941.206 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:13.941.365 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:18.941.522 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:18.941.596 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:23.941.747 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:23.941.839 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:28.941.986 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:28.942.097 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:33.942.259 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:33.943.628 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:38.943.775 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:38.943.853 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:43.944.009 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:43.944.092 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:48.944.209 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:48.944.287 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:53.944.445 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:53.944.526 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:58.944.680 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:49:58.944.757 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:03.944.921 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:03.945.000 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:08.945.157 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:08.945.260 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:13.945.415 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:13.945.518 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:18.945.688 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:18.945.768 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:23.945.924 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:23.946.019 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:28.946.165 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:28.946.269 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:33.946.423 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:33.946.498 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:38.946.654 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:38.946.748 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:43.946.898 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:43.947.010 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:48.947.163 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:48.947.235 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:53.947.384 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:53.947.470 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:58.947.625 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:50:58.948.378 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:03.948.524 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:03.948.588 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:08.948.740 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:08.948.816 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:13.948.969 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:13.949.035 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:18.949.193 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:18.949.280 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:23.949.443 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:23.949.535 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:28.949.639 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:28.949.693 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:33.949.837 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:33.949.906 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:38.950.046 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:38.950.112 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:43.950.286 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:43.950.352 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:48.950.493 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:48.950.562 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:53.950.707 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:53.950.786 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:58.950.928 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:51:58.950.994 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:03.951.154 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:03.951.234 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:08.951.398 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:08.951.476 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:13.951.629 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:13.951.704 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:18.951.862 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:18.951.940 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:23.952.095 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:23.952.887 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:28.953.034 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:28.953.114 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:33.953.228 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:33.953.326 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:38.953.480 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:38.953.537 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:43.953.699 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:43.953.835 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:48.954.001 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:48.954.071 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:53.954.224 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:53.954.301 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:58.954.460 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:52:58.954.521 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:03.954.680 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:03.954.755 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:08.954.944 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:08.955.042 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:13.955.197 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:13.955.271 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:18.955.433 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:18.955.510 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:23.955.665 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:23.955.725 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:28.955.884 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:28.955.969 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:33.956.125 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:33.956.260 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:38.956.421 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:38.956.498 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:43.956.651 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:43.956.736 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:48.956.896 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:48.957.033 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:53.957.181 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:53.957.257 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:58.957.424 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:53:58.957.501 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:03.957.661 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:03.957.734 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:08.957.892 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:08.958.018 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:13.958.186 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:13.958.264 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:18.958.424 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:18.958.552 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:23.958.719 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:23.958.785 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:28.958.941 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:28.959.011 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:33.959.212 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:33.959.288 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:38.959.450 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:38.959.521 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:43.959.686 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:43.959.762 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:48.959.927 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:48.960.006 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:53.960.165 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:53.960.243 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:58.960.410 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:54:58.960.470 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:03.960.637 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:03.960.734 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:08.960.900 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:08.961.014 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:13.961.902 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:13.961.984 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:18.962.149 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:18.962.232 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:23.962.393 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:23.962.470 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:28.962.630 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:28.962.718 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:33.962.876 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:33.962.936 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:38.963.094 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:38.963.161 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:43.963.317 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:43.963.394 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:48.963.550 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:48.963.650 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:53.963.796 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:53.963.931 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:58.964.077 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:55:58.964.155 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:03.964.313 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:03.964.379 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:08.964.542 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:08.964.631 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:13.964.793 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:13.964.867 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:18.965.022 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:18.965.098 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:23.965.274 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:23.965.335 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:28.965.487 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:28.965.550 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:33.965.706 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:33.965.796 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:38.965.967 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:38.966.057 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:43.966.203 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:43.966.288 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:48.966.431 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:48.966.492 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:53.966.649 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:53.966.741 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:58.966.885 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:56:58.966.954 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:03.967.106 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:03.967.169 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:08.967.324 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:08.967.406 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:13.967.565 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:13.967.632 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:18.967.786 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:18.968.559 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:23.968.703 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:23.968.798 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:28.968.942 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:28.969.020 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:33.969.171 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:33.969.260 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:38.970.827 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:38.970.921 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:43.971.072 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:43.971.140 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:48.971.295 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:48.971.364 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:53.971.519 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:53.971.575 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:58.971.728 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:57:58.971.826 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:03.971.997 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:03.972.067 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:08.972.750 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:08.972.816 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:13.972.969 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:13.973.027 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:18.973.174 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:18.973.218 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:23.973.328 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:23.973.390 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:28.973.542 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:28.973.601 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:33.973.760 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:33.973.837 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:38.973.996 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:38.974.056 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:43.974.211 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:43.975.063 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:48.975.217 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:48.975.277 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:53.975.423 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:53.975.508 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:58.975.645 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:58:58.975.701 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:03.975.850 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:03.975.920 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:08.976.067 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:08.976.129 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:13.976.282 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:13.976.382 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:18.976.531 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:18.976.620 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:23.976.759 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:23.976.819 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:28.976.991 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:28.977.065 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:33.977.220 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:33.977.294 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:38.977.441 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:38.977.531 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:43.977.671 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:43.977.792 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:48.977.952 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:48.978.050 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:53.978.191 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:53.978.255 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:58.978.416 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-19:59:58.978.495 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:03.978.653 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:03.978.719 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:08.978.870 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:08.978.957 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:13.979.097 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:13.979.167 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:18.979.324 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:18.979.386 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:23.979.539 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:23.979.601 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:28.979.757 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:28.979.815 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:33.979.963 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:33.980.072 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:38.980.223 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:38.980.303 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:43.980.445 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:43.980.501 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:48.980.648 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:48.980.717 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:53.981.834 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:53.981.936 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:58.982.090 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:00:58.982.156 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:03.982.307 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:03.982.364 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:08.982.518 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:08.982.594 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:13.982.743 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:13.982.827 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:18.982.966 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:18.983.046 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:23.983.188 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:23.983.261 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:28.983.416 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:28.983.492 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:33.983.673 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:33.983.745 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:38.983.898 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:38.983.959 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:43.984.117 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:43.984.194 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:48.984.346 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:48.984.413 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:53.984.558 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:53.984.640 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:58.984.783 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:01:58.984.845 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:03.984.997 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:03.985.080 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:08.985.228 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:08.985.317 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:13.985.471 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:13.986.315 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:18.986.457 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:18.986.517 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:23.986.670 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:23.986.729 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:28.986.878 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:28.986.940 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:33.987.094 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:33.987.161 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:38.987.315 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:38.987.410 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:43.987.544 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:43.987.600 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:48.987.755 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:48.987.824 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:53.987.978 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:53.988.039 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:58.988.221 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:02:58.988.318 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:03.988.469 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:03.988.550 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:08.988.696 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:08.988.754 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:13.988.906 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:13.989.016 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:18.989.176 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:18.989.280 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:23.989.427 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:23.989.495 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:28.989.652 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:28.989.721 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:33.989.875 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:33.989.933 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:38.990.085 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:38.990.195 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:43.990.335 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:43.990.395 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:48.990.546 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:48.990.606 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:53.990.754 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:53.990.816 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:58.990.964 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:03:58.991.064 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:03.991.215 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:03.991.278 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:08.991.434 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:08.991.511 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:13.991.654 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:13.991.712 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:18.991.859 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:18.991.921 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:23.992.092 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:23.992.166 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:28.992.323 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:28.992.406 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:33.992.549 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:33.992.602 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:38.992.750 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:38.992.834 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:43.992.974 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:43.993.026 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:48.993.169 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:48.993.234 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:53.993.392 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:53.993.449 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:58.993.601 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:04:58.993.679 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:03.993.829 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:03.993.924 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:08.994.066 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:08.994.133 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:13.994.922 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:13.994.977 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:18.995.129 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:18.995.217 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:23.995.354 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:23.995.414 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:28.995.556 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:28.995.613 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:33.996.410 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:33.996.476 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:38.996.627 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:38.996.686 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:43.996.829 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:43.996.891 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:48.997.070 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:48.997.137 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:53.997.302 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:53.997.384 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:58.997.529 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:05:58.997.607 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:03.997.763 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:03.997.823 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:08.997.952 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:08.998.012 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:13.998.158 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:13.998.222 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:18.998.364 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:18.998.463 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:23.998.616 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:23.998.678 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:28.998.829 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:28.998.947 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:33.999.086 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:33.999.143 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:38.999.291 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:38.999.401 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:43.999.551 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:43.999.615 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:48.999.755 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:48.999.822 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:53.999.976 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:54.000.047 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:59.000.208 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:06:59.000.286 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:04.000.432 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:04.000.490 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:09.000.647 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:09.000.724 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:14.000.902 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:14.000.961 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:19.001.109 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:19.001.177 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:24.001.317 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:24.001.441 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:29.001.594 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:29.001.702 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:34.001.857 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:34.001.921 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:39.002.049 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:39.002.128 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:44.002.269 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:44.002.328 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:49.002.480 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:49.002.559 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:54.002.720 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:54.002.781 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:59.002.931 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:07:59.003.000 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:04.003.155 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:04.003.215 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:09.003.370 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:09.003.498 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:14.003.649 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:14.003.711 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:19.003.857 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:19.003.918 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:24.004.070 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:24.004.127 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:29.004.280 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:29.004.342 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:34.004.510 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:34.005.295 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:39.005.443 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:39.005.505 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:44.005.651 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:44.005.740 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:49.005.883 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:49.005.971 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:54.006.115 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:54.006.180 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:59.006.335 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:08:59.006.408 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:04.006.564 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:04.006.631 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:09.006.783 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:09.006.858 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:14.007.025 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:14.007.095 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:19.007.275 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:19.007.343 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:24.007.497 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:24.007.558 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:29.007.711 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:29.007.779 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:34.007.926 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:34.007.989 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:39.008.139 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:39.008.198 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:44.008.348 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:44.008.418 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:49.008.563 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:49.008.629 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:54.008.784 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:54.008.843 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:59.008.995 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:09:59.009.112 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:04.009.267 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:04.009.333 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:09.009.486 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:09.009.555 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:14.010.420 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:14.010.488 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:19.010.637 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:19.010.698 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:24.010.856 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:24.010.923 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:29.011.074 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:29.011.172 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:34.011.310 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:34.011.416 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:39.011.547 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:39.011.611 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:44.011.791 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:44.011.871 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:49.012.015 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:49.012.080 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:54.012.222 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:54.012.279 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:59.012.432 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:10:59.012.535 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:04.012.687 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:04.012.760 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:09.012.911 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:09.012.979 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:14.013.131 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:14.013.189 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:19.013.324 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:19.013.390 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:24.013.538 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:24.013.635 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:29.013.780 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:29.013.846 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:34.014.002 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:34.014.058 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:39.014.209 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:39.014.271 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:44.014.410 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:44.014.472 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:49.014.624 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:49.014.714 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:54.014.866 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:54.014.927 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:59.015.080 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:11:59.015.175 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:04.015.319 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:04.015.379 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:09.015.557 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:09.015.623 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:14.015.771 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:14.015.833 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:19.015.989 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:19.016.092 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:24.016.240 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:24.016.302 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:29.016.458 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:29.016.531 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:34.016.682 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:34.016.742 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:39.016.892 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:39.016.952 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:44.017.104 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:44.017.164 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:49.017.320 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:49.017.431 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:54.017.575 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:54.017.637 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:59.017.792 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:12:59.017.898 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:04.018.046 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:04.018.108 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:09.018.256 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:09.018.317 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:14.018.470 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:14.019.785 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:19.019.936 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:19.020.160 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:24.020.308 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:24.020.374 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:29.020.519 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:29.020.582 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:34.020.750 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:34.024.058 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:39.024.208 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:39.024.261 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:44.024.405 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:44.024.460 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:49.024.611 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:49.024.665 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:54.024.798 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:54.028.453 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:59.028.596 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:13:59.030.736 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:04.030.879 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:04.030.931 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:09.031.068 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:09.031.128 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:14.044.377 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:14.044.438 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:19.045.097 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:19.046.621 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:24.046.765 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:24.046.821 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:29.086.607 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:29.086.668 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:34.087.356 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:34.087.413 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:39.090.003 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:39.090.067 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:44.094.081 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:44.094.140 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:49.094.290 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:49.094.368 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:54.095.947 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:54.096.081 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:59.096.220 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:14:59.097.112 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:04.097.264 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:04.101.612 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:09.101.762 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:09.101.821 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:14.101.955 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:14.102.008 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:19.129.753 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:19.129.823 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:24.129.971 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:24.130.030 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:29.130.187 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:29.130.246 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:34.130.412 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:34.130.507 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:39.130.675 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:39.130.740 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:44.130.889 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:44.130.943 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:49.131.084 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:49.131.145 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:54.131.291 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:54.131.341 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:59.131.490 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:15:59.131.578 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:04.131.718 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:04.131.789 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:09.131.946 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:09.132.052 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:14.132.204 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:14.132.263 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:19.132.418 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:19.133.114 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:24.133.267 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:24.133.319 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:29.133.469 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:29.133.532 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:34.133.685 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:34.133.764 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:39.133.922 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:39.133.992 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:44.134.147 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:44.134.206 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:49.134.363 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:49.134.435 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:54.135.244 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:54.135.332 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:59.135.474 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:16:59.135.535 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:04.135.718 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:04.135.790 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:09.135.953 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:09.136.045 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:14.136.208 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:14.136.296 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:19.136.457 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:19.136.531 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:24.136.688 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:24.136.752 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:29.136.911 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:29.136.976 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:34.137.129 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:34.137.253 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:39.137.418 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:39.137.525 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:44.137.680 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:44.138.458 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:49.138.608 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:49.138.689 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:54.138.853 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:54.138.940 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:59.139.094 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:17:59.139.170 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:04.139.321 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:04.139.399 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:09.139.550 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:09.139.609 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:14.139.760 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:14.139.825 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:19.139.975 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:19.140.071 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:24.140.214 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:24.140.310 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:29.140.482 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:29.140.564 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:34.140.704 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:34.140.764 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:39.140.918 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:39.141.018 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:44.141.178 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:44.141.268 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:49.141.422 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:49.141.513 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:54.141.656 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:54.141.741 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:59.141.883 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:18:59.141.946 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:04.142.100 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:04.142.171 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:09.142.323 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:09.143.023 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:14.143.167 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:14.143.257 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:19.143.394 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:19.143.499 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:24.143.652 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:24.143.712 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:29.143.872 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:29.143.961 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:34.144.121 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:34.144.234 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:39.144.377 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:39.144.456 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:44.144.611 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:44.144.669 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:49.144.835 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:49.144.923 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:54.145.126 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:54.145.211 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:59.145.329 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:19:59.145.411 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:04.145.563 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:04.146.296 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:09.146.446 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:09.146.569 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:14.146.728 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:14.146.794 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:19.146.950 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:19.147.040 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:24.147.193 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:24.147.276 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:29.147.435 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:29.147.532 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:34.147.701 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:34.147.776 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:39.149.018 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:39.149.100 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:44.149.280 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:44.149.390 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:49.149.532 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:49.149.623 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:54.149.764 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:54.149.835 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:59.149.991 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:20:59.150.077 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:04.150.236 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:04.150.316 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:09.150.481 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:09.150.565 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:14.150.724 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:14.150.859 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:19.151.004 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:19.151.122 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:24.151.260 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:24.151.344 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:29.151.506 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:29.151.607 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:34.151.747 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:34.151.837 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:39.151.983 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:39.152.073 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:44.152.215 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:44.152.314 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:49.152.470 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:49.152.569 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:54.152.718 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:54.152.828 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:59.153.003 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:21:59.153.097 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:04.153.256 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:04.153.353 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:09.153.493 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:09.153.552 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:14.153.701 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:14.153.776 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:19.153.925 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:19.153.985 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:24.154.132 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:24.154.192 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:29.154.346 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:29.154.408 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:34.154.556 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:34.154.652 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:39.154.789 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:39.154.912 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:44.155.057 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:44.155.116 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:49.155.267 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:49.155.360 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:54.155.504 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:54.155.564 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:59.155.718 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:22:59.155.817 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:04.155.960 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:04.156.027 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:09.156.178 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:09.156.258 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:14.156.413 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:14.156.497 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:19.156.650 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:19.156.709 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:24.156.876 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:24.156.975 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:29.157.120 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:29.157.198 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:34.157.329 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:34.157.400 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:39.157.545 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:39.157.623 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:44.157.769 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:44.157.860 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:49.158.008 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:49.158.083 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:54.158.233 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:54.158.333 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:59.158.481 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:23:59.158.548 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:04.158.702 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:04.158.822 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:09.158.962 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:09.159.050 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:14.159.193 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:14.159.299 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:19.159.451 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:19.159.541 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:24.159.686 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:24.159.748 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:29.159.901 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:29.159.991 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:34.160.132 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:34.160.194 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:39.160.349 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:39.160.429 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:44.160.580 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:44.160.681 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:49.160.841 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:49.160.919 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:54.161.071 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:54.161.150 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:59.161.319 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:24:59.161.442 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:04.161.598 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:04.161.668 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:09.161.819 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:09.161.895 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:14.162.050 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:14.162.130 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:19.162.278 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:19.162.377 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:24.162.529 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:24.162.591 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:29.162.746 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:29.163.511 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:34.163.653 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:34.163.737 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:39.163.879 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:39.163.958 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:44.164.113 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:44.164.177 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:49.164.333 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:49.164.402 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:54.164.543 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:54.164.612 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:59.164.764 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:25:59.164.845 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:04.164.995 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:04.165.060 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:09.165.215 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:09.165.289 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:14.165.470 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:14.165.576 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:19.165.729 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:19.165.817 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:24.165.961 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:24.166.025 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:29.166.182 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:29.166.278 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:34.166.418 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:34.166.472 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:39.166.623 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:39.166.704 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:44.166.838 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:44.166.901 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:49.167.058 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:49.167.121 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:54.167.272 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:54.167.362 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:59.167.493 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:26:59.167.551 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:04.167.697 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:04.167.754 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:09.167.907 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:09.167.969 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:14.168.117 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:14.168.174 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:19.168.321 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:19.168.378 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:24.168.529 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:24.168.588 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:29.168.741 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:29.168.809 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:34.168.960 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:34.169.080 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:39.169.226 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:39.169.350 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:44.169.504 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:44.169.565 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:49.169.705 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:49.169.788 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:54.169.931 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:54.169.991 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:59.170.147 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:27:59.170.209 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:04.170.360 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:04.170.416 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:09.170.567 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:09.170.632 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:14.170.787 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:14.170.851 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:19.171.017 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:19.171.077 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:24.171.249 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:24.171.314 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:29.171.462 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:29.171.517 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:34.171.671 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:34.171.784 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:39.171.936 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:39.172.011 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:44.172.164 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:44.172.221 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:49.172.371 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:49.172.435 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:54.172.580 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:54.172.637 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:59.172.783 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:28:59.173.453 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:04.173.594 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:04.173.660 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:09.173.808 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:09.173.865 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:14.174.017 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:14.174.071 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:19.174.217 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:19.174.294 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:24.174.447 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:24.174.537 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:29.174.677 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:29.174.734 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:34.174.880 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:34.174.963 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:39.175.102 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:39.175.165 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:44.175.331 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:44.175.394 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:49.175.539 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:49.175.624 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:54.175.765 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:54.175.837 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:59.175.980 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:29:59.176.042 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:04.176.191 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:04.176.263 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:09.176.414 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:09.176.483 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:14.176.632 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:14.176.704 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:19.176.859 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:19.176.924 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:24.177.070 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:24.177.159 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:29.177.303 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:29.177.370 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:34.177.519 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:34.177.604 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:39.177.747 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:39.177.815 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:44.177.964 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:44.178.020 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:49.178.162 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:49.178.237 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:54.178.382 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:54.178.439 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:59.178.591 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:30:59.178.674 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:04.178.788 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:04.178.852 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:09.179.027 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:09.179.095 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:14.179.238 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:14.179.298 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:19.179.450 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:19.179.519 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:24.179.665 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:24.179.730 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:29.179.878 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:29.179.942 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:34.180.081 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:34.180.143 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:39.180.295 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:39.180.435 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:44.180.581 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:44.180.677 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:49.180.824 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:49.180.906 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:54.181.034 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:54.181.096 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:59.181.262 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:31:59.181.352 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:04.181.492 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:04.181.560 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:09.181.702 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:09.181.759 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:14.181.908 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:14.181.964 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:19.182.119 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:19.182.218 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:24.182.359 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:24.182.415 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:29.182.570 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:29.182.644 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:34.182.827 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:34.182.890 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:39.183.043 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:39.183.110 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:44.183.251 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:44.183.305 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:49.183.468 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:49.183.550 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:54.183.696 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:54.183.761 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:59.183.912 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:32:59.183.994 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:04.184.148 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:04.184.209 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:09.184.363 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:09.184.441 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:14.184.587 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:14.186.069 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:19.186.211 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:19.186.276 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:24.186.426 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:24.186.485 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:29.186.640 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:29.186.732 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:34.186.870 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:34.186.929 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:39.187.082 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:39.187.146 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:44.187.296 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:44.187.372 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:49.187.514 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:49.187.578 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:54.187.729 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:54.188.607 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:59.188.750 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:33:59.188.826 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:04.188.967 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:04.189.027 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:09.189.167 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:09.189.226 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:14.189.385 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:14.189.456 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:19.189.613 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:19.189.719 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:24.189.859 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:24.189.969 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:29.190.117 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:29.190.173 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:34.190.317 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:34.190.378 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:39.190.549 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:39.190.613 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:44.190.762 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:44.190.817 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:49.190.966 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:49.191.042 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:54.191.189 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:54.191.251 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:59.191.397 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:34:59.191.466 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:04.191.621 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:04.191.724 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:09.191.876 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:09.191.955 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:14.192.108 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:14.192.202 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:19.192.345 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:19.192.976 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:24.193.110 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:24.193.170 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:29.193.329 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:29.193.383 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:34.193.526 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:34.193.580 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:39.194.356 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:39.194.426 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:44.194.552 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:44.194.611 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:49.195.389 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:49.195.480 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:54.195.623 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:54.195.709 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:59.195.848 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:35:59.195.910 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:04.196.088 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:04.196.148 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:09.196.302 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:09.196.362 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:14.197.187 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:14.197.254 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:19.197.406 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:19.197.480 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:24.197.638 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:24.197.739 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:29.197.879 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:29.197.935 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:34.198.085 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:34.198.201 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:39.198.352 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:39.198.420 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:44.198.567 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:44.198.671 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:49.198.796 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:49.198.857 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:54.199.012 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:54.199.072 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:59.199.224 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:36:59.199.303 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:04.199.435 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:04.199.493 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:09.199.655 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:09.199.771 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:14.199.927 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:14.200.016 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:19.200.167 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:19.200.227 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:24.200.371 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:24.200.428 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:29.200.609 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:29.200.687 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:34.200.839 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:34.200.908 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:39.201.062 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:39.201.171 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:44.201.323 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:44.201.391 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:49.201.547 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:49.201.616 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:54.201.760 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:54.201.817 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:59.201.969 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:37:59.202.030 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:04.202.186 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:04.202.272 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:09.202.417 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:09.202.544 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:14.202.686 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:14.202.765 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:19.202.912 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:19.202.987 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:24.203.136 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:24.203.196 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:29.203.347 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:29.203.412 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:34.203.554 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:34.203.606 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:39.203.757 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:39.203.846 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:44.203.971 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:44.204.057 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:49.204.198 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:49.204.271 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:54.204.449 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:54.204.511 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:59.205.302 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:38:59.205.359 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:04.205.512 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:04.205.569 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:09.205.721 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:09.205.813 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:14.205.947 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:14.206.001 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:19.206.154 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:19.206.248 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:24.206.390 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:24.206.476 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:29.206.621 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:29.206.683 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:34.206.837 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:34.206.933 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:39.207.074 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:39.207.142 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:44.207.289 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:44.207.348 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:49.207.490 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:49.207.556 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:54.207.708 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:54.207.768 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:59.207.912 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:39:59.207.970 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:04.208.126 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:04.208.203 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:09.208.355 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:09.208.433 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:14.208.575 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:14.209.315 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:19.209.456 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:19.209.521 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:24.209.679 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:24.209.790 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:29.209.938 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:29.210.029 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:34.210.165 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:34.210.224 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:39.210.376 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:39.210.439 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:44.210.593 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:44.210.681 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:49.210.820 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:49.210.890 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:54.211.030 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:54.211.086 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:59.211.273 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:40:59.211.347 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:04.211.495 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:04.211.560 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:09.211.713 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:09.211.786 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:14.211.937 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:14.212.020 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:19.212.168 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:19.212.261 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:24.212.398 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:24.212.479 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:29.212.623 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:29.212.701 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:34.212.844 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:34.212.903 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:39.213.058 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:39.213.186 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:44.213.311 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:44.213.371 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:49.213.524 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:49.213.601 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:54.213.745 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:54.213.804 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:59.213.950 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:41:59.214.023 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:04.214.165 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:04.214.219 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:09.214.371 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:09.214.434 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:14.214.577 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:14.214.660 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:19.214.800 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:19.214.937 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:24.215.117 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:24.215.206 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:29.215.345 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:29.215.406 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:34.215.559 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:34.215.621 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:39.215.767 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:39.215.830 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:44.215.969 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:44.216.016 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:49.216.166 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:49.216.251 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:54.216.394 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:54.216.457 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:59.216.609 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:42:59.216.667 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:04.216.808 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:04.217.573 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:09.217.720 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:09.217.783 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:14.217.930 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:14.217.988 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:19.218.136 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:19.218.221 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:24.218.365 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:24.218.448 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:29.218.588 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:29.218.647 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:34.218.803 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:34.218.874 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:39.219.033 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:39.219.137 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:44.219.278 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:44.219.334 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:49.219.514 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:49.219.594 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:54.219.736 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:54.219.796 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:59.219.948 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:43:59.220.009 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:04.220.161 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:04.220.218 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:09.220.374 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:09.220.472 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:14.220.614 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:14.220.670 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:19.220.820 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:19.220.886 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:24.221.007 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:24.221.069 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:29.221.217 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:29.221.322 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:34.221.463 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:34.221.526 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:39.221.681 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:39.221.768 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:44.221.911 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:44.221.996 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:49.222.136 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:49.222.197 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:54.222.346 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:54.222.405 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:59.222.543 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:44:59.222.597 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:04.222.752 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:04.222.824 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:09.222.975 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:09.223.040 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:14.223.208 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:14.223.284 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:19.223.425 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:19.223.515 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:24.223.668 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:24.223.727 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:29.223.881 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:29.223.974 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:34.224.123 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:34.224.183 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:39.224.338 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:39.224.444 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:44.224.594 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:44.224.651 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:49.224.785 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:49.224.848 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:54.225.002 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:54.225.732 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:59.225.871 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:45:59.225.929 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:04.226.065 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:04.226.119 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:09.226.821 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:09.226.881 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:14.227.027 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:14.227.084 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:19.227.847 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:19.227.917 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:24.228.069 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:24.228.137 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:29.228.288 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:29.228.345 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:34.228.492 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:34.228.574 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:39.228.717 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:39.228.779 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:44.228.931 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:44.228.991 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:49.229.139 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:49.229.197 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:54.229.306 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:54.229.367 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:59.230.174 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:46:59.230.260 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:04.230.398 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:04.230.479 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:09.230.619 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:09.230.683 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:14.231.374 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:14.231.443 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:19.231.615 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:19.231.671 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:24.231.808 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:24.231.864 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:29.232.633 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:29.232.688 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:34.232.841 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:34.232.921 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:39.233.080 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:39.233.154 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:44.233.302 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:44.233.399 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:49.233.549 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:49.233.604 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:54.233.757 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:54.233.812 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:59.233.973 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:47:59.234.210 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:04.234.357 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:04.234.413 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:09.234.561 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:09.234.618 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:14.234.767 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:14.235.912 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:19.236.061 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:19.236.117 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:24.236.266 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:24.236.321 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:29.236.460 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:29.236.516 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:34.236.654 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:34.239.254 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:39.239.400 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:39.239.468 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:44.239.645 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:44.239.701 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:49.239.837 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:49.239.900 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:54.240.047 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:54.240.196 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:59.240.326 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:48:59.241.982 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:04.242.122 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:04.242.185 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:09.247.447 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:09.248.209 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:14.248.353 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:14.248.416 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:19.248.548 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:19.248.609 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:24.261.941 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:25.077.403 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:30.077.563 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:30.077.622 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:35.077.835 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:35.079.307 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:40.079.442 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:40.079.506 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:45.092.195 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:45.097.364 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:50.097.509 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:50.098.682 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:55.098.817 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:49:55.098.874 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:00.102.258 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:00.104.530 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:05.104.678 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:05.105.106 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:10.105.279 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:10.105.363 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:15.105.505 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:15.105.561 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:20.105.722 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:20.105.792 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:25.105.958 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:25.106.016 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:30.106.161 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:30.106.218 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:35.106.370 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:35.106.456 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:40.106.590 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:40.106.648 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:45.106.800 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:45.106.863 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:50.107.037 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:50.108.137 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:55.108.268 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:50:55.108.324 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:00.109.029 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:00.109.115 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:05.109.271 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:05.109.343 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:10.109.481 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:10.109.558 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:15.109.684 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:15.109.756 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:20.109.897 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:20.109.980 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:25.110.118 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:25.110.194 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:30.110.330 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:30.110.392 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:35.111.550 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:35.111.611 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:40.112.577 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:40.112.638 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:45.112.784 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:45.112.853 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:50.112.992 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:50.113.047 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:55.113.783 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:51:55.113.856 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:00.113.990 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:00.114.046 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:05.114.198 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:05.114.262 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:10.114.412 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:10.114.472 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:15.114.620 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:15.114.706 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:20.114.838 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:20.114.910 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:25.115.061 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:25.115.121 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:30.115.269 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:30.115.345 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:35.115.478 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:35.115.584 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:40.115.740 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:40.115.797 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:45.115.939 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:45.115.995 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:50.116.135 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:50.116.189 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:55.116.341 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:52:55.116.420 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:00.116.564 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:00.116.636 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:05.116.772 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:05.116.830 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:10.116.977 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:10.117.036 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:15.117.188 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:15.117.259 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:20.118.164 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:20.118.226 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:25.118.367 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:25.118.437 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:30.118.601 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:30.118.674 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:35.118.823 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:35.118.879 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:40.119.038 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:40.119.137 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:45.120.013 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:45.120.069 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:50.120.224 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:50.120.284 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:55.120.428 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:53:55.120.487 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:00.120.640 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:00.120.698 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:05.120.851 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:05.120.910 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:10.121.069 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:10.121.140 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:15.121.270 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:15.121.330 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:20.121.468 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:20.121.558 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:25.121.698 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:25.121.755 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:30.121.900 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:30.121.957 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:35.122.106 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:35.122.161 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:40.122.311 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:40.122.366 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:45.122.517 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:45.122.571 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:50.122.723 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:50.122.807 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:55.122.954 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:54:55.123.019 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:00.123.178 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:00.123.237 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:05.123.405 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:05.123.467 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:10.123.614 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:10.123.673 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:15.123.824 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:15.123.881 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:20.124.017 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:20.124.075 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:25.124.227 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:25.124.284 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:30.124.432 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:30.124.506 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:35.124.642 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:35.124.700 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:40.124.850 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:40.124.940 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:45.125.078 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:45.125.840 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:50.125.986 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:50.126.047 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:55.126.199 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:55:55.126.256 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:00.126.410 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:00.126.468 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:05.126.614 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:05.126.677 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:10.126.829 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:10.126.888 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:15.127.661 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:15.127.718 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:20.127.873 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:20.127.931 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:25.128.735 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:25.128.799 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:30.128.970 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:30.129.032 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:35.129.186 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:35.129.259 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:40.129.403 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:40.129.463 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:45.129.611 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:45.129.670 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:50.129.821 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:50.129.876 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:55.130.020 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:56:55.130.082 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:00.130.242 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:00.130.329 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:05.130.463 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:05.130.520 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:10.130.671 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:10.131.991 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:15.132.133 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:15.132.192 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:20.132.340 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:20.132.397 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:25.132.543 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:25.132.602 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:30.132.746 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:30.132.801 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:35.132.947 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:35.133.005 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:40.133.160 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:40.133.286 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:45.134.061 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:45.134.117 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:50.134.268 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:50.134.332 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:55.134.494 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:57:55.134.549 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:00.134.702 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:00.134.763 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:05.134.909 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:05.134.967 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:10.135.118 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:10.135.177 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:15.135.329 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:15.135.384 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:20.135.520 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:20.135.576 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:25.135.728 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:25.135.808 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:30.135.950 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:30.136.006 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:35.136.149 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:35.136.833 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:40.136.976 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:40.137.034 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:45.137.184 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:45.137.259 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:50.137.410 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:50.137.469 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:55.137.616 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:58:55.137.678 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:00.137.836 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:00.137.899 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:05.138.043 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:05.138.100 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:10.138.253 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:10.138.315 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:15.138.475 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:15.138.600 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:20.138.740 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:20.138.804 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:25.138.942 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:25.139.000 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:30.139.152 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:30.139.208 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:35.139.356 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:35.139.417 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:40.140.397 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:40.140.458 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:45.140.610 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:45.140.700 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:50.140.833 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:50.140.886 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:55.141.029 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-20:59:55.141.083 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:00.141.268 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:00.141.357 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:05.141.491 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:05.141.590 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:10.141.741 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:10.141.836 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:15.141.980 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:15.142.041 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:20.142.191 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:20.142.250 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:25.142.401 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:25.142.465 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:30.142.614 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:30.142.673 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:35.142.818 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:35.142.892 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:40.143.032 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:40.143.150 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:45.143.291 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:45.143.383 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:50.143.527 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:50.143.621 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:55.143.763 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:00:55.143.828 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:00.143.979 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:00.144.040 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:05.144.188 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:05.144.243 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:10.144.381 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:10.144.439 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:15.144.586 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:15.144.645 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:20.144.782 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:20.144.856 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:25.145.028 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:25.145.105 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:30.145.259 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:30.145.335 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:35.145.475 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:35.145.528 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:40.146.227 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:40.146.297 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:45.146.438 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:45.146.494 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:50.146.645 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:50.146.735 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:55.146.879 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:01:55.146.946 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:00.147.103 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:00.147.165 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:05.147.312 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:05.148.150 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:10.148.291 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:10.148.352 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:15.148.506 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:15.148.565 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:20.148.718 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:20.148.803 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:25.148.937 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:25.148.990 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:30.149.149 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:30.149.212 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:35.149.326 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:35.149.383 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:40.149.533 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:40.149.635 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:45.149.779 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:45.149.844 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:50.150.017 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:50.150.076 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:55.150.243 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:02:55.150.315 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:00.150.461 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:00.150.517 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:05.150.665 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:05.150.745 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:10.150.883 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:10.150.944 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:15.151.092 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:15.151.164 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:20.151.301 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:20.151.356 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:25.151.500 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:25.151.557 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:30.151.703 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:30.152.436 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:35.152.555 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:35.152.614 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:40.152.761 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:40.152.839 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:45.152.976 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:45.153.037 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:50.153.186 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:50.153.255 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:55.153.401 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:03:55.153.461 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:00.154.254 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:00.154.313 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:05.154.465 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:05.154.552 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:10.154.691 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:10.154.752 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:15.154.917 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:15.154.989 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:20.155.116 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:20.155.172 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:25.155.324 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:25.155.380 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:30.155.485 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:30.155.549 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:35.155.682 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:35.155.736 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:40.155.882 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:40.155.939 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:45.156.088 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:45.156.144 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:50.156.253 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:50.156.321 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:55.156.468 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:04:55.156.578 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:00.156.720 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:00.156.777 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:05.156.926 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:05.156.983 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:10.157.134 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:10.157.194 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:15.157.933 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:15.157.988 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:20.158.138 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:20.158.198 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:25.158.322 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:25.158.400 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:30.158.548 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:30.158.605 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:35.158.743 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:35.158.798 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:40.158.961 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:40.159.026 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:45.159.181 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:45.159.236 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:50.159.383 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:50.159.437 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:55.159.574 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:05:55.159.645 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:00.159.793 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:00.159.859 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:05.160.010 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:05.160.090 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:10.160.230 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:10.160.294 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:15.160.444 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:15.160.543 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:20.161.409 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:20.161.466 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:25.161.611 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:25.161.665 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:30.161.805 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:30.161.859 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:35.162.008 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:35.162.076 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:40.162.231 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:40.162.288 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:45.162.399 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:45.162.476 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:50.162.612 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:50.162.679 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:55.162.817 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:06:55.162.884 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:00.163.028 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:00.163.774 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:05.163.912 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:05.163.985 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:10.164.124 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:10.164.201 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:15.164.341 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:15.164.419 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:20.164.552 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:20.164.609 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:25.165.317 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:25.165.388 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:30.165.536 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:30.165.602 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:35.165.737 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:35.165.813 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:40.165.952 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:40.166.040 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:45.166.206 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:45.166.278 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:50.166.412 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:50.166.467 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:55.166.620 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:07:55.166.681 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:00.166.834 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:00.166.896 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:05.167.041 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:05.167.099 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:10.167.249 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:10.167.353 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:15.167.499 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:15.167.553 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:20.167.697 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:20.167.750 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:25.167.878 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:25.167.979 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:30.168.087 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:30.168.147 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:35.168.289 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:35.168.347 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:40.168.474 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:40.168.530 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:45.168.675 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:45.168.729 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:50.168.875 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:50.168.927 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:55.169.062 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:08:55.169.120 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:00.169.288 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:00.169.369 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:05.169.504 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:05.169.559 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:10.169.735 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:10.169.797 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:15.169.943 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:15.170.002 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:20.170.149 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:20.170.204 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:25.170.344 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:25.170.396 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:30.170.529 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:30.170.610 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:35.170.754 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:35.170.816 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:40.170.964 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:40.171.017 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:45.171.166 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:45.171.241 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:50.171.392 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:50.171.479 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:55.171.613 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:09:55.171.669 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:00.171.814 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:00.171.870 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:05.172.017 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:05.172.764 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:10.172.902 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:10.172.959 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:15.173.106 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:15.173.167 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:20.173.313 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:20.173.367 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:25.173.511 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:25.173.563 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:30.173.711 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:30.173.765 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:35.173.933 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:35.174.007 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:40.174.155 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:40.174.214 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:45.174.361 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:45.174.422 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:50.174.564 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:50.174.617 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:55.174.760 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:10:55.174.843 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:00.174.984 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:00.175.041 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:05.175.184 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:05.175.237 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:10.175.382 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:10.175.474 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:15.175.612 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:15.175.715 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:20.175.850 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:20.175.906 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:25.176.039 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:25.176.092 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:30.176.243 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:30.176.298 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:35.176.448 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:35.176.504 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:40.176.639 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:40.176.689 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:45.176.836 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:45.176.894 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:50.177.044 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:50.177.129 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:55.177.282 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:11:55.177.341 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:00.177.507 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:00.177.560 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:05.177.705 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:05.177.758 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:10.177.911 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:10.177.981 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:15.178.092 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:15.178.148 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:20.178.291 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:20.178.345 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:25.179.278 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:25.179.337 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:30.179.476 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:30.179.531 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:35.179.665 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:35.179.736 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:40.179.896 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:40.179.952 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:45.180.097 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:45.180.164 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:50.180.310 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:50.180.361 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:55.181.598 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:12:55.181.647 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:00.181.799 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:00.181.861 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:05.182.008 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:05.182.066 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:10.182.215 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:10.182.277 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:15.182.425 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:15.182.480 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:20.182.616 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:20.182.697 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:25.182.833 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:25.182.898 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:30.183.065 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:30.183.122 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:35.183.260 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:35.183.321 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:40.184.094 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:40.184.191 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:45.184.340 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:45.184.406 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:50.184.553 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:50.184.621 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:55.184.769 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:13:55.184.832 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:00.184.975 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:00.185.034 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:05.185.205 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:05.185.276 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:10.185.423 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:10.185.506 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:15.185.646 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:15.185.706 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:20.185.850 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:20.185.907 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:25.186.591 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:25.186.647 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:30.186.798 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:30.186.859 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:35.187.005 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:35.187.062 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:40.187.209 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:40.187.268 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:45.187.418 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:45.187.537 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:50.187.673 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:50.187.756 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:55.187.898 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:14:55.187.959 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:00.188.112 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:00.188.174 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:05.188.322 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:05.188.386 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:10.188.536 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:10.188.599 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:15.188.747 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:15.188.829 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:20.188.969 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:20.189.061 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:25.189.203 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:25.189.282 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:30.189.434 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:30.189.489 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:35.189.635 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:35.189.696 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:40.190.353 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:40.190.466 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:45.190.598 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:45.190.652 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:50.190.804 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:50.190.864 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:55.191.015 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:15:55.191.111 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:00.191.253 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:00.191.317 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:05.191.466 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:05.191.533 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:10.191.686 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:10.192.338 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:15.192.478 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:15.192.541 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:20.193.320 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:20.193.380 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:25.193.528 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:25.193.597 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:30.193.750 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:30.193.833 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:35.193.973 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:35.194.079 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:40.194.233 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:40.194.290 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:45.194.444 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:45.194.505 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:50.194.652 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:50.194.704 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:55.194.874 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:16:55.194.944 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:00.195.099 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:00.195.154 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:05.195.297 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:05.195.376 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:10.195.520 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:10.195.580 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:15.195.726 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:15.195.791 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:20.196.584 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:20.196.648 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:25.196.784 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:25.196.847 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:30.196.999 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:30.197.061 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:35.197.209 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:35.197.381 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:40.197.528 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:40.197.598 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:45.197.748 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:45.197.808 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:50.197.953 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:50.198.009 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:55.198.153 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:17:55.198.213 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:00.198.364 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:00.198.435 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:05.198.581 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:05.198.639 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:10.198.787 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:10.198.849 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:15.199.001 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:15.199.066 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:20.199.280 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:20.199.419 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:25.200.216 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:25.200.275 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:30.200.408 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:30.200.464 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:35.200.592 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:35.200.658 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:40.200.814 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:40.200.874 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:45.201.018 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:45.201.098 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:50.201.248 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:50.201.312 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:55.201.466 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:18:55.201.569 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:00.201.742 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:00.201.804 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:05.201.950 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:05.202.015 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:10.202.164 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:10.202.229 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:15.202.369 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:15.202.428 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:20.202.576 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:20.202.637 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:25.202.781 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:25.202.843 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:30.202.991 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:30.203.052 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:35.203.197 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:35.203.285 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:40.203.440 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:40.204.158 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:45.204.299 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:45.204.352 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:50.204.489 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:50.204.549 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:55.204.700 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:19:55.204.758 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:00.204.908 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:00.204.969 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:05.205.115 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:05.205.169 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:10.205.320 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:10.205.378 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:15.205.527 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:15.205.583 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:20.205.736 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:20.205.826 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:25.205.987 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:25.206.107 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:30.206.261 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:30.206.325 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:35.206.478 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:35.206.545 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:40.206.690 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:40.206.752 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:45.206.897 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:45.206.951 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:50.207.109 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:50.207.170 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:55.207.304 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:20:55.207.362 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:00.207.512 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:00.207.571 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:05.207.715 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:05.208.548 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:10.208.687 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:10.208.792 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:15.208.942 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:15.209.037 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:20.209.181 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:20.209.254 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:25.209.407 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:25.209.477 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:30.209.617 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:30.209.679 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:35.209.832 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:35.209.889 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:40.210.038 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:40.210.104 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:45.210.244 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:45.210.303 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:50.210.474 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:50.210.534 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:55.210.676 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:21:55.210.729 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:00.210.878 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:00.210.939 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:05.211.088 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:05.211.147 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:10.211.303 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:10.211.370 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:15.211.521 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:15.211.578 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:20.211.729 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:20.211.801 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:25.211.950 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:25.212.008 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:30.212.161 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:30.212.841 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:35.212.968 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:35.213.028 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:40.213.182 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:40.213.266 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:45.213.412 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:45.213.507 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:50.213.642 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:50.213.696 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:55.213.840 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:22:55.213.926 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:00.214.074 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:00.214.155 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:05.214.314 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:05.214.389 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:10.214.538 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:10.214.612 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:15.214.784 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:15.216.359 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:20.216.524 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:20.223.506 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:25.223.660 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:25.223.737 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:30.223.883 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:30.223.944 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:35.224.081 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:35.224.139 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:40.224.278 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:40.224.336 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:45.225.012 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:45.231.857 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:50.232.004 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:50.232.059 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:55.232.186 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:23:55.232.261 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:00.232.398 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:00.233.053 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:05.233.189 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:05.234.626 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:10.234.767 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:10.234.827 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:15.244.531 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:15.245.350 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:20.245.489 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:20.245.551 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:25.247.418 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:25.247.473 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:30.247.704 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:30.253.165 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:35.253.316 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:35.254.353 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:40.254.519 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:40.255.068 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:45.255.195 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:45.255.245 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:50.255.385 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:50.255.452 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:55.255.590 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:24:55.256.895 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:00.257.034 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:00.257.088 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:05.257.234 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:05.257.682 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:10.257.827 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:10.257.911 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:15.260.801 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:15.260.884 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:20.261.060 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:20.261.121 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:25.261.802 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:25.261.878 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:30.262.021 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:30.262.087 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:35.262.290 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:35.262.351 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:40.262.505 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:40.262.579 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:45.262.720 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:45.262.777 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:50.263.480 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:50.263.587 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:55.263.741 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:25:55.263.799 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:00.263.952 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:00.264.053 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:05.264.184 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:05.264.240 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:10.264.392 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:10.264.455 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:15.264.601 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:15.264.657 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:20.264.805 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:20.264.864 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:25.265.003 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:25.265.061 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:30.265.211 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:30.265.283 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:35.265.428 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:35.265.483 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:40.265.636 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:40.265.726 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:45.265.893 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:45.265.953 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:50.266.103 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:50.266.159 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:55.266.296 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:26:55.266.344 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:00.266.481 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:00.266.538 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:05.266.684 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:05.266.740 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:10.266.892 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:10.266.964 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:15.267.113 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:15.267.212 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:20.267.361 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:20.267.417 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:25.267.562 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:25.268.295 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:30.268.436 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:30.268.497 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:35.268.645 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:35.268.704 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:40.268.855 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:40.268.917 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:45.269.041 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:45.269.090 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:50.269.248 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:50.269.306 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:55.269.459 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:27:55.269.517 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:00.269.665 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:00.269.764 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:05.269.911 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:05.269.970 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:10.270.136 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:10.270.195 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:15.270.342 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:15.270.406 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:20.270.558 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:20.270.624 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:25.270.778 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:25.270.841 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:30.270.988 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:30.271.049 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:35.271.200 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:35.271.260 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:40.271.409 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:40.271.473 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:45.271.622 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:45.271.686 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:50.271.830 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:50.272.507 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:55.272.650 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:28:55.272.714 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:00.272.863 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:00.272.924 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:05.273.068 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:05.273.128 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:10.273.299 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:10.273.362 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:15.273.511 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:15.273.577 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:20.273.731 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:20.273.888 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:25.274.043 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:25.274.105 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:30.274.253 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:30.274.311 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:35.274.487 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:35.274.546 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:40.274.689 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:40.274.744 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:45.274.887 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:45.274.954 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:50.275.104 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:50.275.164 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:55.275.306 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:29:55.275.363 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:00.275.482 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:00.275.543 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:05.275.690 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:05.275.756 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:10.275.912 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:10.275.987 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:15.276.143 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:15.276.247 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:20.276.388 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:20.276.454 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:25.276.601 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:25.276.660 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:30.276.812 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:30.276.870 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:35.277.009 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:35.277.063 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:40.277.213 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:40.277.317 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:45.277.443 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:45.277.503 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:50.277.661 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:50.277.732 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:55.277.886 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:30:55.277.951 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:00.278.123 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:00.278.204 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:05.278.332 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:05.278.392 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:10.278.537 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:10.278.655 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:15.278.797 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:15.278.855 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:20.279.009 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:20.279.105 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:25.279.256 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:25.279.357 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:30.279.507 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:30.279.568 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:35.279.720 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:35.279.776 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:40.279.951 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:40.280.010 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:45.280.159 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:45.280.259 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:50.280.397 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:50.280.463 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:55.280.613 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:31:55.280.666 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:00.280.815 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:00.280.907 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:05.281.041 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:05.281.098 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:10.281.262 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:10.281.328 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:15.281.480 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:15.281.535 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:20.281.683 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:20.282.299 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:25.282.440 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:25.282.493 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:30.282.648 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:30.282.708 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:35.282.848 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:35.282.909 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:40.283.060 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:40.283.179 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:45.283.326 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:45.283.382 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:50.283.536 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:50.283.597 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:55.283.741 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:32:55.283.800 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:00.283.953 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:00.284.019 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:05.284.187 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:05.284.244 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:10.284.396 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:10.284.483 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:15.284.628 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:15.284.684 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:20.284.836 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:20.284.897 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:25.285.053 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:25.285.113 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:30.285.275 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:30.285.339 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:35.285.492 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:35.285.554 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:40.285.714 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:40.285.814 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:45.285.939 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:45.286.043 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:50.286.182 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:50.286.247 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:55.286.399 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:33:55.286.466 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:00.286.612 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:00.286.669 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:05.286.813 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:05.286.866 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:10.287.015 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:10.287.086 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:15.287.232 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:15.287.288 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:20.287.439 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:20.287.501 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:25.287.652 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:25.287.709 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:30.287.885 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:30.287.953 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:35.288.089 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:35.288.149 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:40.288.300 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:40.288.361 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:45.288.516 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:45.288.609 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:50.288.752 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:50.288.815 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:55.288.968 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:34:55.289.028 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:00.289.176 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:00.289.315 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:05.289.461 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:05.289.525 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:10.289.680 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:10.291.079 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:15.291.216 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:15.291.276 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:20.291.426 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:20.291.482 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:25.291.634 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:25.291.701 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:30.291.848 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:30.291.914 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:35.292.068 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:35.292.132 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:40.292.284 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:40.292.351 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:45.292.504 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:45.292.562 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:50.292.710 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:50.292.775 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:55.292.949 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:35:55.293.027 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:00.293.167 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:00.293.229 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:05.293.993 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:05.294.077 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:10.294.220 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:10.294.283 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:15.294.421 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:15.294.474 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:20.294.622 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:20.294.692 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:25.294.850 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:25.294.908 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:30.295.057 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:30.295.117 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:35.295.260 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:35.296.105 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:40.296.246 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:40.296.308 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:45.297.219 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:45.297.285 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:50.297.441 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:50.297.498 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:55.297.648 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:36:55.297.704 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:00.297.847 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:00.297.905 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:05.298.056 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:05.298.111 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:10.298.265 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:10.298.329 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:15.298.470 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:15.298.546 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:20.298.703 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:20.298.771 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:25.298.923 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:25.298.981 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:30.299.136 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:30.299.207 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:35.300.428 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:35.300.487 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:40.300.636 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:40.300.711 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:45.300.862 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:45.300.918 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:50.301.054 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:50.301.113 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:55.301.279 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:37:55.301.341 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:00.301.511 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:00.301.568 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:05.301.712 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:05.301.772 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:10.301.928 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:10.301.995 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:15.302.154 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:15.302.274 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:20.302.422 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:20.302.483 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:25.302.633 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:25.302.693 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:30.302.846 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:30.302.911 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:35.303.062 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:35.303.116 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:40.303.269 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:40.303.994 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:45.304.130 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:45.304.193 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:50.304.350 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:50.304.427 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:55.304.568 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:38:55.304.623 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:00.304.773 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:00.304.829 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:05.304.984 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:05.305.043 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:10.305.194 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:10.305.283 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:15.305.424 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:15.305.481 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:20.305.633 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:20.305.690 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:25.305.861 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:25.305.918 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:30.306.069 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:30.306.131 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:35.306.281 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:35.306.339 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:40.306.490 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:40.306.566 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:45.306.691 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:45.306.745 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:50.306.898 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:50.306.955 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:55.307.110 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:39:55.307.217 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:00.307.356 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:00.307.411 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:05.307.561 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:05.319.717 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:10.319.864 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:10.319.958 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:15.320.099 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:15.320.173 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:20.320.313 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:20.320.371 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:25.321.953 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:25.322.029 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:30.322.170 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:30.322.228 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:35.322.380 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:35.322.439 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:40.322.594 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:40.322.654 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:45.322.802 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:45.322.861 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:50.323.025 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:50.323.112 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:55.323.251 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:40:55.323.309 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:00.323.458 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:00.323.527 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:05.323.668 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:05.323.722 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:10.323.875 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:10.323.946 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:15.324.091 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:15.324.148 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:20.324.298 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:20.324.353 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:25.324.510 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:25.324.586 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:30.324.714 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:30.324.803 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:35.324.944 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:35.325.001 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:40.325.150 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:40.325.213 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:45.325.320 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:45.325.375 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:50.325.526 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:50.325.628 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:55.325.772 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:41:55.325.828 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:00.325.979 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:00.326.036 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:05.326.188 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:05.326.255 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:10.326.408 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:10.326.467 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:15.326.641 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:15.326.706 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:20.326.852 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:20.326.909 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:25.327.064 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:25.327.121 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:30.327.279 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:30.327.349 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:35.328.099 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:35.328.171 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:40.328.328 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:40.328.386 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:45.329.258 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:45.329.328 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:50.329.435 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:50.329.496 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:55.329.640 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:42:55.329.726 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:00.329.858 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:00.329.918 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:05.330.070 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:05.330.128 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:10.330.279 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:10.330.338 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:15.330.480 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:15.330.541 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:20.330.694 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:20.330.752 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:25.330.906 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:25.330.960 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:30.331.112 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:30.331.190 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:35.331.333 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:35.331.390 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:40.331.549 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:40.331.602 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:45.331.748 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:45.331.803 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:50.331.937 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:50.331.996 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:55.332.151 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:43:55.332.206 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:00.332.356 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:00.332.413 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:05.332.561 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:05.332.621 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:10.332.774 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:10.332.835 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:15.332.979 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:15.333.033 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:20.333.205 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:20.333.287 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:25.333.433 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:25.333.508 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:30.333.650 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:30.333.707 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:35.333.857 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:35.333.911 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:40.334.064 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:40.334.124 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:45.334.269 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:45.334.325 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:50.334.473 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:50.334.532 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:55.334.675 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:44:55.334.729 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:00.334.880 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:00.335.020 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:05.335.161 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:05.335.219 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:10.335.363 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:10.335.417 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:15.335.565 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:15.335.619 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:20.335.770 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:20.335.825 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:25.335.974 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:25.336.029 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:30.336.182 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:30.336.247 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:35.336.397 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:35.336.462 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:40.337.325 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:40.337.390 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:45.337.552 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:45.337.608 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:50.337.758 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:50.337.814 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:55.337.961 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:45:55.338.013 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:00.338.153 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:00.338.203 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:05.338.356 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:05.338.411 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:10.338.565 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:10.338.623 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:15.338.765 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:15.338.821 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:20.338.968 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:20.339.032 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:25.339.178 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:25.339.260 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:30.339.404 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:30.339.463 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:35.339.616 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:35.339.672 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:40.339.832 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:40.339.906 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:45.340.053 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:45.340.117 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:50.340.255 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:50.340.314 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:55.340.472 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:46:55.340.531 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:00.340.680 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:00.340.738 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:05.340.878 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:05.340.933 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:10.341.114 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:10.341.172 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:15.341.316 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:15.341.370 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:20.341.521 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:20.341.612 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:25.341.762 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:25.341.834 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:30.341.986 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:30.342.105 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:35.342.259 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:35.342.319 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:40.342.475 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:40.342.555 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:45.342.696 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:45.342.752 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:50.342.902 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:50.344.043 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:55.344.173 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:47:55.344.250 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:00.344.396 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:00.344.454 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:05.344.604 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:05.344.659 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:10.345.490 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:10.345.549 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:15.345.695 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:15.345.750 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:20.345.901 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:20.345.958 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:25.346.110 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:25.346.165 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:30.346.314 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:30.346.390 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:35.346.557 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:35.346.616 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:40.346.766 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:40.346.831 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:45.346.966 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:45.347.021 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:50.347.174 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:50.347.234 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:55.347.384 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:48:55.347.443 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:00.347.585 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:00.347.644 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:05.347.796 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:05.347.892 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:10.348.039 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:10.348.100 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:15.348.239 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:15.349.415 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:20.349.554 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:20.349.672 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:25.349.829 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:25.349.907 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:30.350.055 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:30.350.112 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:35.350.851 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:35.350.918 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:40.351.077 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:40.351.138 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:45.351.285 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:45.351.342 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:50.351.486 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:50.351.547 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:55.351.706 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:49:55.351.768 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:00.351.939 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:00.352.008 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:05.352.146 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:05.352.227 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:10.352.382 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:10.352.445 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:15.352.597 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:15.352.659 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:20.352.811 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:20.352.868 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:25.353.023 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:25.353.084 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:30.353.233 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:30.353.305 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:35.353.452 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:35.353.510 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:40.353.673 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:40.354.434 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:45.354.579 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:45.354.634 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:50.354.787 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:50.354.851 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:55.354.994 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:50:55.355.047 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:00.355.196 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:00.355.261 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:05.355.414 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:05.355.472 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:10.355.623 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:10.355.681 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:15.355.839 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:15.355.917 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:20.356.073 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:20.357.263 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:25.357.409 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:25.357.490 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:30.357.635 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:30.357.753 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:35.357.904 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:35.357.960 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:40.358.113 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:40.358.169 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:45.358.301 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:45.358.353 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:50.358.502 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:50.358.558 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:55.358.710 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:51:55.358.832 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:00.358.972 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:00.359.025 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:05.359.198 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:05.359.256 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:10.359.415 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:10.359.471 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:15.360.247 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:15.360.301 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:20.360.455 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:20.360.510 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:25.360.666 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:25.360.747 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:30.360.896 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:30.360.961 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:35.361.115 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:35.361.188 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:40.361.324 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:40.361.383 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:45.361.524 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:45.363.359 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:50.363.484 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:50.363.540 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:55.363.692 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:52:55.363.754 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:00.363.901 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:00.363.962 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:05.364.104 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:05.364.159 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:10.364.344 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:10.364.446 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:15.364.588 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:15.364.659 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:20.364.813 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:20.364.871 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:25.365.026 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:25.365.086 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:30.365.269 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:30.365.338 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:35.365.487 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:35.365.544 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:40.365.700 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:40.365.756 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:45.365.902 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:45.365.967 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:50.366.118 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:50.366.237 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:55.366.376 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:53:55.366.450 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:00.366.592 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:00.366.649 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:05.366.799 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:05.366.934 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:10.367.084 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:10.368.337 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:15.368.480 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:15.368.551 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:20.368.707 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:20.368.791 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:25.368.934 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:25.369.046 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:30.369.198 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:30.369.286 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:35.369.427 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:35.369.488 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:40.369.644 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:40.369.711 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:45.369.848 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:45.369.906 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:50.370.059 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:50.370.126 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:55.370.299 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:54:55.370.359 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:00.370.504 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:00.370.603 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:05.370.759 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:05.370.818 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:10.370.987 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:10.371.059 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:15.371.213 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:15.371.273 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:20.372.006 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:20.372.093 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:25.372.251 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:25.372.314 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:30.372.466 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:30.372.559 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:35.372.704 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:35.373.527 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:40.373.676 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:40.373.732 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:45.373.884 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:45.373.947 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:50.374.087 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:50.374.143 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:55.374.298 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:55:55.374.356 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:00.374.508 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:00.374.578 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:05.374.731 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:05.374.795 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:10.374.955 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:10.375.018 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:15.375.171 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:15.375.230 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:20.375.403 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:20.375.459 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:25.375.612 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:25.375.721 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:30.375.871 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:30.375.954 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:35.376.101 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:35.376.157 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:40.376.312 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:40.376.375 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:45.376.522 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:45.376.579 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:50.376.728 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:50.376.794 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:55.376.934 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:56:55.376.996 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:00.377.147 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:00.377.869 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:05.378.011 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:05.378.073 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:10.378.227 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:10.378.289 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:15.378.439 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:15.378.500 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:20.378.648 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:20.378.761 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:25.378.915 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:25.378.978 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:30.379.128 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:30.379.202 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:35.379.357 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:35.379.419 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:40.379.575 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:40.380.856 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:45.380.981 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:45.381.042 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:50.381.731 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:50.381.794 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:55.381.995 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:57:55.382.139 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:00.382.285 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:00.382.344 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:05.382.489 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:05.382.546 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:10.382.692 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:10.382.993 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:15.383.142 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:15.384.057 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:20.384.205 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:20.384.263 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:25.384.435 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:25.384.506 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:30.384.643 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:30.384.700 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:35.384.950 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:36.196.077 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:41.196.242 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:41.200.999 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:46.201.146 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:46.202.221 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:51.202.349 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:51.202.403 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:56.217.676 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:58:56.217.736 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:01.219.122 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:01.219.187 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:06.219.801 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:06.220.584 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:11.220.719 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:11.225.429 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:16.225.578 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:16.227.190 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:21.227.327 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:21.227.385 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:26.273.422 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:26.273.478 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:31.278.305 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:31.280.700 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:36.280.842 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:36.280.897 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:41.281.277 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:41.283.276 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:46.283.420 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:46.283.469 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:51.283.633 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:51.285.453 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:56.285.597 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-21:59:56.286.488 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:01.286.633 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:01.286.693 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:06.288.679 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:06.288.741 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:11.299.173 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:11.299.242 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:16.328.574 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:16.328.690 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:21.328.827 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:21.328.882 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:26.329.068 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:26.329.138 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:31.329.288 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:31.329.984 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:36.330.123 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:36.330.178 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:41.330.324 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:41.330.379 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:46.330.514 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:46.330.573 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:51.330.725 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:51.330.810 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:56.330.943 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:00:56.331.000 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:01.331.145 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:01.331.263 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:06.331.413 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:06.331.467 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:11.331.609 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:11.331.669 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:16.331.850 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:16.331.906 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:21.332.056 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:21.332.116 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:26.332.266 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:26.332.337 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:31.332.491 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:31.332.547 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:36.332.683 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:36.332.743 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:41.332.894 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:41.332.977 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:46.333.119 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:46.333.179 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:51.333.320 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:51.333.419 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:56.333.574 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:01:56.334.352 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:01.334.498 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:01.334.575 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:06.334.724 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:06.334.781 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:11.334.931 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:11.334.992 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:16.335.146 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:16.335.205 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:21.335.343 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:21.335.403 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:26.335.561 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:26.335.615 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:31.335.773 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:31.335.846 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:36.335.994 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:36.336.072 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:41.336.217 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:41.336.272 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:46.336.429 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:46.336.484 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:51.336.628 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:51.336.684 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:56.336.826 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:02:56.336.885 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:01.337.035 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:01.337.092 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:06.337.255 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:06.337.315 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:11.337.470 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:11.337.573 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:16.337.714 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:16.337.771 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:21.337.922 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:21.338.053 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:26.338.196 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:26.338.260 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:31.338.394 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:31.338.449 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:36.338.595 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:36.338.648 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:41.338.800 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:41.338.861 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:46.339.002 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:46.339.083 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:51.339.220 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:51.339.295 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:56.339.439 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:03:56.339.500 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:01.339.643 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:01.340.419 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:06.340.563 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:06.340.618 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:11.340.767 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:11.340.832 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:16.340.979 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:16.341.033 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:21.341.180 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:21.341.249 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:26.341.402 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:26.341.460 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:31.341.608 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:31.341.669 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:36.341.803 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:36.341.865 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:41.342.016 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:41.342.082 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:46.342.260 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:46.342.315 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:51.342.454 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:51.342.515 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:56.342.662 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:04:56.342.735 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:01.342.876 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:01.342.942 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:06.343.083 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:06.343.139 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:11.343.290 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:11.343.355 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:16.343.508 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:16.343.566 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:21.343.715 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:21.343.784 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:26.343.939 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:26.344.693 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:31.344.833 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:31.344.912 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:36.345.049 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:36.345.109 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:41.345.263 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:41.345.326 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:46.345.483 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:46.345.579 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:51.345.730 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:51.345.793 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:56.345.942 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:05:56.346.001 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:01.346.155 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:01.346.218 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:06.346.368 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:06.346.446 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:11.346.612 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:11.346.702 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:16.346.846 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:16.346.901 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:21.347.046 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:21.347.106 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:26.347.260 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:26.347.320 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:31.347.471 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:31.347.534 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:36.347.690 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:36.347.762 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:41.347.911 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:41.347.987 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:46.348.117 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:46.348.174 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:51.348.319 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:51.349.146 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:56.349.301 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:06:56.349.356 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:01.349.500 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:01.349.555 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:06.349.709 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:06.349.780 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:11.349.931 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:11.349.991 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:16.350.144 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:16.350.206 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:21.350.354 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:21.350.412 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:26.350.563 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:26.350.620 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:31.350.769 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:31.350.855 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:36.351.006 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:36.351.063 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:41.351.213 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:41.351.268 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:46.351.418 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:46.351.472 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:51.351.618 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:51.351.680 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:56.351.831 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:07:56.351.887 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:01.352.032 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:01.352.096 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:06.352.239 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:06.352.292 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:11.352.440 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:11.352.500 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:16.352.641 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:16.352.729 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:21.352.873 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:21.352.931 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:26.353.080 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:26.353.145 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:31.353.311 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:31.353.410 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:36.353.548 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:36.353.607 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:41.353.745 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:41.353.804 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:46.353.979 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:46.354.137 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:51.354.287 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:51.354.355 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:56.354.499 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:08:56.354.554 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:01.354.733 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:01.354.816 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:06.354.957 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:06.355.043 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:11.355.184 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:11.355.243 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:16.355.398 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:16.355.450 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:21.355.597 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:21.355.658 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:26.355.805 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:26.355.863 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:31.356.015 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:31.356.071 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:36.356.219 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:36.356.279 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:41.356.434 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:41.356.551 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:46.356.685 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:46.356.746 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:51.356.896 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:51.356.952 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:56.357.100 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:09:56.357.158 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:01.357.330 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:01.357.429 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:06.357.565 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:06.357.622 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:11.357.773 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:11.357.843 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:16.357.992 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:16.358.052 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:21.358.198 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:21.359.034 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:26.359.180 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:26.359.246 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:31.359.390 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:31.359.458 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:36.359.597 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:36.359.662 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:41.359.819 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:41.359.884 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:46.360.035 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:46.360.118 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:51.360.247 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:51.360.310 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:56.360.461 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:10:56.360.521 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:01.360.680 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:01.360.745 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:06.360.919 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:06.360.986 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:11.361.139 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:11.361.199 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:16.361.322 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:16.361.381 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:21.361.536 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:21.361.627 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:26.361.770 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:26.361.849 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:31.361.992 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:31.362.074 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:36.362.213 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:36.362.276 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:41.363.004 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:41.363.069 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:46.363.828 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:46.363.923 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:51.364.064 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:51.364.126 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:56.364.271 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:11:56.364.336 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:01.364.488 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:01.364.555 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:06.364.709 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:06.364.774 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:11.364.915 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:11.364.993 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:16.365.135 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:16.365.194 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:21.365.314 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:21.365.373 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:26.365.522 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:26.365.583 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:31.365.813 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:31.365.944 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:36.366.081 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:36.366.139 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:41.366.287 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:41.366.347 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:46.366.535 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:46.366.724 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:51.366.886 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:51.366.942 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:56.367.095 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:12:56.367.151 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:01.367.302 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:01.367.362 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:06.367.471 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:06.367.605 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:11.367.761 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:11.368.582 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:16.368.728 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:16.368.802 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:21.368.959 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:21.369.018 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:26.369.168 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:26.369.233 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:31.369.397 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:31.369.470 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:36.369.607 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:36.369.665 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:41.369.815 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:41.369.876 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:46.370.024 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:46.370.083 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:51.370.230 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:51.370.296 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:56.370.478 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:13:56.370.537 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:01.370.690 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:01.370.754 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:06.370.898 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:06.370.954 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:11.371.106 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:11.371.168 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:16.371.321 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:16.371.381 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:21.371.529 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:21.371.584 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:26.371.740 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:26.371.806 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:31.371.965 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:31.372.022 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:36.372.162 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:36.372.241 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:41.372.373 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:41.372.430 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:46.372.580 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:46.372.635 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:51.372.784 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:51.372.851 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:56.372.999 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:14:56.373.053 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:01.373.210 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:01.373.336 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:06.373.487 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:06.373.545 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:11.374.281 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:11.374.341 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:16.375.060 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:16.375.121 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:21.375.838 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:21.375.902 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:26.376.043 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:26.376.100 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:31.376.975 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:31.377.035 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:36.377.182 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:36.377.259 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:41.378.273 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:41.378.350 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:46.378.498 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:46.378.569 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:51.378.725 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:51.378.783 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:56.380.127 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:15:56.380.181 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:01.380.991 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:01.381.116 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:06.381.275 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:06.381.399 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:11.381.551 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:11.381.611 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:16.381.758 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:16.381.813 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:21.381.963 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:21.382.022 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:26.382.175 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:26.382.230 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:31.382.383 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:31.382.445 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:36.382.581 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:36.382.645 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:41.382.798 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:41.382.880 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:46.383.019 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:46.383.075 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:51.383.211 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:51.383.270 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:56.383.422 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:16:56.383.491 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:01.383.643 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:01.383.739 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:06.383.887 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:06.383.945 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:11.384.093 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:11.384.209 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:16.384.359 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:16.384.423 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:21.384.567 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:21.384.622 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:26.384.782 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:26.384.842 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:31.384.991 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:31.385.051 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:36.385.196 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:36.385.277 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:41.385.410 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:41.385.467 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:46.385.616 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:46.385.694 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:51.385.837 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:51.385.919 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:56.386.064 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:17:56.386.125 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:01.386.285 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:01.386.345 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:06.386.481 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:06.387.190 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:11.387.330 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:11.387.386 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:16.387.537 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:16.387.600 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:21.387.747 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:21.387.806 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:26.387.955 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:26.388.018 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:31.388.179 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:31.388.255 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:36.388.405 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:36.388.460 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:41.388.613 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:41.388.674 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:46.388.811 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:46.388.865 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:51.389.042 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:51.389.096 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:56.389.265 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:18:56.389.354 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:01.389.490 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:01.389.578 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:06.389.730 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:06.389.796 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:11.389.947 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:11.390.009 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:16.390.171 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:16.390.230 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:21.390.378 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:21.390.437 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:26.390.590 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:26.390.647 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:31.390.800 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:31.390.922 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:36.391.046 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:36.391.104 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:41.391.246 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:41.391.299 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:46.391.440 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:46.391.497 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:51.391.635 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:51.391.689 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:56.391.831 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:19:56.391.883 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:01.392.020 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:01.392.074 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:06.392.217 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:06.392.282 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:11.392.421 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:11.392.480 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:16.392.685 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:16.392.806 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:21.392.955 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:21.393.013 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:26.393.661 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:26.393.740 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:31.393.891 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:31.393.960 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:36.394.108 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:36.394.176 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:41.394.318 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:41.394.411 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:46.394.559 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:46.394.638 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:51.394.781 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:51.394.846 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:56.394.976 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:20:56.395.055 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:01.395.198 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:01.395.263 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:06.395.420 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:06.395.493 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:11.395.636 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:11.395.693 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:16.395.838 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:16.395.942 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:21.396.087 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:21.396.165 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:26.396.331 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:26.396.427 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:31.396.570 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:31.396.635 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:36.396.795 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:36.396.859 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:41.397.051 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:41.397.157 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:46.397.317 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:46.397.420 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:51.397.563 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:51.397.656 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:56.397.806 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:21:56.397.921 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:01.398.069 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:01.398.189 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:06.398.350 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:06.398.442 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:11.398.604 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:11.398.690 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:16.398.849 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:16.398.947 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:21.399.096 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:21.399.232 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:26.399.379 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:26.399.488 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:31.399.637 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:31.399.710 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:36.399.839 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:36.399.902 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:41.400.050 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:41.400.129 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:46.400.281 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:46.400.367 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:51.400.505 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:51.400.570 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:56.400.712 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:22:56.400.768 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:01.400.927 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:01.401.059 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:06.401.207 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:06.401.325 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:11.401.473 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:11.401.579 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:16.401.726 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:16.401.821 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:21.401.962 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:21.402.058 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:26.402.199 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:26.402.284 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:31.402.427 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:31.402.526 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:36.402.670 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:36.402.782 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:41.402.916 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:41.402.979 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:46.403.153 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:46.403.244 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:51.403.411 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:51.403.496 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:56.403.639 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:23:56.403.705 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:01.403.863 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:01.403.951 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:06.404.089 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:06.404.158 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:11.404.313 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:11.404.409 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:16.404.556 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:16.404.623 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:21.404.778 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:21.404.865 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:26.405.009 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:26.405.672 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:31.405.820 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:31.405.890 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:36.406.043 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:36.406.133 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:41.406.286 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:41.406.418 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:46.406.576 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:46.406.680 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:51.406.822 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:51.406.926 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:56.407.075 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:24:56.407.136 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:01.407.290 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:01.407.393 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:06.407.533 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:06.407.600 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:11.407.781 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:11.407.854 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:16.408.012 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:16.408.084 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:21.408.237 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:21.408.331 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:26.408.481 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:26.408.551 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:31.408.707 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:31.408.768 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:36.408.908 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:36.408.970 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:41.409.130 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:41.409.196 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:46.409.326 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:46.409.405 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:51.409.541 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:51.410.244 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:56.410.395 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:25:56.410.496 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:01.410.642 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:01.410.748 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:06.410.891 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:06.410.978 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:11.411.137 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:11.411.241 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:16.411.388 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:16.411.452 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:21.411.607 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:21.411.699 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:26.411.847 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:26.411.939 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:31.412.094 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:31.412.206 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:36.412.373 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:36.412.435 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:41.412.583 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:41.412.652 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:46.412.806 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:46.412.902 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:51.413.042 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:51.413.114 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:56.413.285 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:26:56.413.349 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:01.413.503 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:01.413.572 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:06.413.726 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:06.413.837 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:11.413.986 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:11.414.066 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:16.414.218 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:16.414.332 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:21.414.475 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:21.414.568 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:26.414.712 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:26.414.772 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:31.414.939 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:31.415.091 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:36.415.245 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:36.415.307 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:41.415.465 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:41.415.550 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:46.415.695 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:46.415.788 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:51.415.930 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:51.415.998 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:56.416.152 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:27:56.416.232 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:01.416.385 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:01.416.447 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:06.416.605 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:06.416.697 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:11.416.847 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:11.416.930 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:16.417.144 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:16.417.303 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:21.417.448 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:21.417.543 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:26.417.698 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:26.417.810 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:31.417.950 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:31.418.037 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:36.418.165 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:36.418.228 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:41.418.385 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:41.418.498 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:46.418.649 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:46.418.744 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:51.418.881 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:51.418.975 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:56.419.125 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:28:56.419.225 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:01.419.375 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:01.419.483 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:06.419.623 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:06.419.714 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:11.419.860 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:11.419.950 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:16.420.095 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:16.420.163 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:21.420.311 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:21.420.404 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:26.420.586 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:26.420.679 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:31.420.833 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:31.420.941 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:36.421.085 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:36.421.187 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:41.421.316 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:41.421.389 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:46.421.542 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:46.421.640 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:51.421.791 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:51.421.863 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:56.422.029 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:29:56.422.138 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:01.422.288 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:01.422.377 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:06.422.541 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:06.422.633 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:11.422.767 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:11.422.849 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:16.422.999 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:16.423.091 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:21.423.236 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:21.423.338 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:26.423.484 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:26.423.585 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:31.423.735 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:31.423.803 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:36.424.486 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:36.424.568 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:41.424.725 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:41.424.821 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:46.424.968 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:46.425.716 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:51.425.864 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:51.425.950 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:56.426.085 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:30:56.426.178 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:01.426.308 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:01.426.364 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:06.426.503 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:06.426.574 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:11.426.725 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:11.426.792 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:16.426.937 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:16.427.045 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:21.427.190 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:21.427.251 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:26.427.393 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:26.427.482 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:31.427.654 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:31.427.729 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:36.427.867 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:36.427.925 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:41.428.069 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:41.428.150 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:46.428.283 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:46.428.348 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:51.428.486 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:51.428.553 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:56.428.709 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:31:56.428.818 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:01.428.950 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:01.429.043 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:06.429.169 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:06.429.252 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:11.429.412 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:11.430.808 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:16.430.939 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:16.430.999 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:21.431.135 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:21.431.194 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:26.431.337 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:26.431.442 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:31.431.563 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:31.431.627 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:36.431.761 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:36.431.826 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:41.431.923 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:41.431.987 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:46.432.118 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:46.432.194 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:51.432.337 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:51.432.410 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:56.432.592 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:32:56.432.656 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:01.432.786 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:01.432.852 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:06.432.976 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:06.433.041 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:11.433.166 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:11.433.256 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:16.433.409 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:16.433.487 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:21.433.633 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:21.433.697 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:26.433.838 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:26.433.902 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:31.441.676 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:31.441.739 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:36.444.409 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:36.445.763 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:41.445.898 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:41.445.955 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:46.457.622 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:46.457.684 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:51.458.814 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:51.459.518 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:56.459.653 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:33:56.459.708 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:01.477.526 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:01.477.584 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:06.478.957 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:06.481.974 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:11.482.119 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:11.483.904 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:16.484.041 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:17.311.039 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:22.311.211 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:22.311.259 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:27.311.385 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:27.311.434 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:32.311.560 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:32.311.614 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:37.311.754 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:37.316.605 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:42.316.748 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:42.316.802 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:47.316.942 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:47.318.138 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:52.318.274 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:52.318.344 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:57.318.488 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:34:57.318.546 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:02.322.065 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:02.324.373 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:07.324.518 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:07.324.584 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:12.343.501 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:12.343.561 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:17.343.706 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:17.343.762 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:22.344.808 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:22.344.887 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:27.345.028 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:27.345.106 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:32.345.264 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:32.345.318 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:37.345.504 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:37.345.562 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:42.345.704 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:42.345.765 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:47.345.934 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:47.345.993 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:52.346.148 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:52.346.205 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:57.346.350 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:35:57.346.407 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:02.346.559 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:02.346.631 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:07.346.783 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:07.346.843 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:12.346.981 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:12.347.041 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:17.347.193 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:17.347.254 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:22.347.408 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:22.347.465 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:27.347.647 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:27.347.707 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:32.347.863 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:32.347.925 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:37.348.085 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:37.348.180 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:42.348.315 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:42.348.369 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:47.348.508 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:47.348.564 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:52.348.720 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:52.348.776 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:57.348.927 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:36:57.348.998 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:02.349.128 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:02.349.190 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:07.349.330 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:07.349.417 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:12.349.554 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:12.349.613 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:17.349.763 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:17.349.828 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:22.349.978 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:22.350.034 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:27.350.176 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:27.350.235 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:32.350.388 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:32.350.455 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:37.350.596 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:37.350.659 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:42.350.808 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:42.350.868 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:47.351.018 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:47.351.083 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:52.351.244 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:52.351.299 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:57.352.178 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:37:57.352.236 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:02.352.382 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:02.352.452 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:07.352.603 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:07.352.657 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:12.352.805 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:12.352.866 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:17.353.018 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:17.353.080 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:22.353.248 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:22.353.334 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:27.353.470 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:27.353.533 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:32.353.689 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:32.354.387 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:37.354.532 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:37.354.590 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:42.354.733 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:42.354.787 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:47.354.941 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:47.355.009 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:52.355.159 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:52.355.219 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:57.355.366 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:38:57.355.431 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:02.355.582 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:02.355.641 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:07.355.801 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:07.355.858 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:12.356.012 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:12.356.090 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:17.356.262 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:17.356.315 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:22.356.529 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:22.356.677 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:27.356.828 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:27.356.904 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:32.357.047 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:32.357.117 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:37.357.290 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:37.357.358 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:42.357.499 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:42.357.558 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:47.357.699 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:47.357.763 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:52.357.909 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:52.357.969 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:57.358.112 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:39:57.358.787 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:02.358.931 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:02.358.997 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:07.359.150 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:07.359.252 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:12.359.390 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:12.359.452 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:17.359.599 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:17.359.657 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:22.359.809 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:22.359.866 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:27.360.017 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:27.360.083 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:32.360.233 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:32.360.319 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:37.360.469 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:37.360.537 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:42.360.705 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:42.360.769 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:47.360.923 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:47.360.987 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:52.361.125 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:52.361.181 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:57.361.313 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:40:57.361.381 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:02.361.527 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:02.361.581 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:07.361.726 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:07.361.786 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:12.361.934 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:12.361.993 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:17.362.143 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:17.362.227 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:22.362.372 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:22.363.047 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:27.363.193 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:27.363.290 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:32.363.428 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:32.363.480 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:37.363.634 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:37.363.699 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:42.363.840 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:42.363.900 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:47.364.038 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:47.364.093 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:52.364.250 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:52.364.312 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:57.364.461 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:41:57.364.517 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:02.364.671 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:02.364.732 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:07.364.913 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:07.364.971 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:12.365.104 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:12.365.168 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:17.365.322 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:17.365.378 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:22.365.532 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:22.365.588 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:27.365.737 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:27.365.801 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:32.365.950 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:32.366.008 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:37.366.150 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:37.366.276 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:42.366.431 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:42.366.487 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:47.366.650 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:47.366.704 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:52.366.859 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:52.366.919 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:57.367.733 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:42:57.367.808 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:02.367.944 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:02.368.007 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:07.368.165 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:07.368.225 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:12.368.366 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:12.368.428 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:17.368.578 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:17.368.635 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:22.368.790 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:22.368.848 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:27.368.996 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:27.370.331 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:32.370.475 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:32.370.541 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:37.370.696 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:37.370.786 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:42.370.928 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:42.370.988 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:47.371.134 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:47.371.191 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:52.371.343 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:52.371.400 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:57.371.540 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:43:57.371.596 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:02.372.306 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:02.372.375 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:07.372.515 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:07.372.568 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:12.372.740 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:12.372.835 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:17.372.972 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:17.373.030 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:22.373.180 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:22.373.235 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:27.373.388 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:27.373.447 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:32.373.598 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:32.373.657 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:37.373.799 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:37.373.855 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:42.374.005 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:42.374.064 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:47.375.688 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:47.375.760 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:52.375.903 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:52.376.000 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:57.376.132 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:44:57.376.187 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:02.376.336 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:02.376.398 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:07.376.616 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:07.376.718 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:12.376.873 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:12.376.932 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:17.377.073 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:17.377.133 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:22.377.301 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:22.377.367 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:27.377.515 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:27.377.571 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:32.377.723 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:32.377.788 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:37.378.679 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:37.378.737 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:42.378.873 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:42.378.931 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:47.379.069 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:47.379.127 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:52.379.276 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:52.379.334 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:57.379.485 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:45:57.379.583 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:02.379.729 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:02.379.788 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:07.379.931 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:07.379.989 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:12.380.138 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:12.380.197 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:17.380.340 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:17.381.772 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:22.381.919 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:22.381.978 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:27.382.127 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:27.382.185 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:32.382.325 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:32.382.389 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:37.383.200 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:37.383.258 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:42.383.403 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:42.383.469 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:47.383.612 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:47.383.667 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:52.383.826 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:52.383.886 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:57.384.035 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:46:57.384.105 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:02.384.282 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:02.384.339 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:07.384.492 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:07.384.555 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:12.384.705 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:12.384.767 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:17.384.904 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:17.384.960 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:22.385.123 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:22.385.231 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:27.385.386 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:27.385.442 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:32.385.597 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:32.385.726 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:37.385.885 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:37.385.951 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:42.386.089 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:42.386.797 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:47.386.924 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:47.386.987 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:52.387.141 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:52.387.198 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:57.387.337 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:47:57.387.402 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:02.387.555 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:02.387.613 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:07.387.778 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:07.387.895 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:12.388.044 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:12.388.106 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:17.388.253 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:17.388.308 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:22.388.456 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:22.388.523 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:27.388.704 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:27.388.772 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:32.388.880 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:32.388.956 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:37.389.100 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:37.389.157 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:42.389.316 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:42.389.374 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:47.390.278 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:47.390.338 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:52.390.488 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:52.390.578 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:57.390.719 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:48:57.390.776 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:02.390.917 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:02.390.976 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:07.391.152 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:07.391.215 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:12.391.359 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:12.391.420 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:17.391.565 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:17.391.626 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:22.391.775 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:22.391.870 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:27.392.018 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:27.392.075 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:32.392.906 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:32.392.970 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:37.393.124 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:37.393.192 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:42.393.326 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:42.393.387 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:47.393.539 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:47.394.362 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:52.394.513 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:52.394.618 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:57.394.771 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:49:57.394.841 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:02.395.004 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:02.395.069 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:07.395.228 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:07.395.333 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:12.395.485 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:12.395.566 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:17.395.729 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:17.395.808 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:22.395.973 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:22.396.081 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:27.396.234 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:27.396.312 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:32.396.494 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:32.396.564 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:37.396.725 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:37.396.831 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:42.396.984 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:42.397.085 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:47.397.254 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:47.397.339 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:52.397.532 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:52.397.642 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:57.397.792 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:50:57.397.894 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:02.398.122 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:02.398.253 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:07.398.392 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:07.398.452 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:12.398.604 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:12.399.351 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:17.399.491 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:17.399.548 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:22.399.695 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:22.399.787 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:27.399.927 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:27.399.992 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:32.400.140 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:32.400.194 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:37.401.021 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:37.401.086 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:42.401.235 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:42.401.304 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:47.401.441 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:47.401.506 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:52.402.211 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:52.402.277 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:57.402.451 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:51:57.402.515 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:02.402.664 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:02.402.728 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:07.402.885 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:07.402.978 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:12.403.122 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:12.403.215 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:17.403.358 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:17.403.416 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:22.403.572 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:22.403.630 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:27.403.783 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:27.403.844 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:32.404.677 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:32.404.743 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:37.404.894 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:37.405.559 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:42.405.699 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:42.405.753 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:47.405.894 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:47.405.949 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:52.406.093 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:52.406.157 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:57.406.299 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:52:57.406.355 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:02.406.494 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:02.406.549 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:07.406.694 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:07.406.756 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:12.406.900 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:12.406.960 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:17.407.114 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:17.407.178 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:22.407.349 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:22.407.403 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:27.407.550 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:27.407.605 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:32.407.750 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:32.407.830 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:37.407.968 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:37.408.029 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:42.408.190 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:42.408.268 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:47.408.433 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:47.408.509 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:52.408.670 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:52.408.767 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:57.408.917 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:53:57.408.998 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:02.409.148 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:02.409.915 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:07.410.049 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:07.410.106 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:12.410.855 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:12.411.017 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:17.411.174 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:17.411.254 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:22.411.391 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:22.411.447 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:27.411.585 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:27.411.643 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:32.411.802 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:32.411.861 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:37.412.016 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:37.412.072 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:42.412.243 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:42.412.301 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:47.412.455 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:47.412.513 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:52.412.657 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:52.412.718 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:57.412.855 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:54:57.412.907 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:02.413.056 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:02.413.117 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:07.413.278 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:07.413.354 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:12.413.506 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:12.413.568 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:17.413.709 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:17.413.778 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:22.413.919 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:22.413.974 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:27.414.148 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:27.414.205 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:32.414.352 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:32.414.415 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:37.414.565 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:37.414.626 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:42.414.767 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:42.414.823 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:47.414.968 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:47.415.025 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:52.415.169 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:52.415.231 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:57.415.379 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:55:57.415.446 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:02.415.592 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:02.415.647 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:07.415.793 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:07.415.916 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:12.416.048 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:12.416.105 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:17.416.250 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:17.416.317 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:22.416.462 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:22.416.525 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:27.416.664 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:27.416.717 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:32.416.865 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:32.416.934 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:37.417.090 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:37.417.180 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:42.417.322 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:42.417.416 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:47.417.553 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:47.417.613 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:52.417.783 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:52.417.851 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:57.417.989 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:56:57.418.048 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:02.418.204 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:02.418.259 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:07.418.410 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:07.418.477 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:12.418.617 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:12.418.674 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:17.418.815 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:17.418.870 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:22.419.005 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:22.419.064 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:27.419.211 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:27.419.265 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:32.419.488 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:32.420.465 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:37.420.607 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:37.420.664 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:42.420.810 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:42.420.869 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:47.421.003 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:47.421.062 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:52.421.207 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:52.421.281 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:57.421.420 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:57:57.421.476 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:02.421.623 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:02.421.686 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:07.421.831 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:07.421.891 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:12.422.080 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:12.422.177 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:17.422.341 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:17.422.394 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:22.422.542 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:22.422.600 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:27.422.734 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:27.422.790 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:32.422.940 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:32.423.001 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:37.423.146 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:37.423.203 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:42.423.349 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:42.423.408 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:47.423.549 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:47.423.605 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:52.423.755 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:52.423.853 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:57.423.991 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:58:57.424.100 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:02.424.235 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:02.424.287 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:07.424.433 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:07.424.497 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:12.424.649 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:12.424.716 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:17.424.862 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:17.424.918 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:22.425.130 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:22.425.349 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:27.426.182 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:27.426.235 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:32.426.382 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:32.426.441 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:37.426.581 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:37.426.639 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:42.426.806 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:42.426.860 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:47.427.015 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:47.427.083 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:52.427.228 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:52.427.286 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:57.427.415 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-22:59:57.427.474 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:02.427.626 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:02.427.686 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:07.427.836 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:07.427.917 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:12.428.051 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:12.428.117 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:17.428.262 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:17.428.317 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:22.428.467 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:22.429.772 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:27.429.895 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:27.429.949 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:32.430.101 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:32.430.185 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:37.430.324 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:37.430.382 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:42.430.535 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:42.430.619 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:47.430.749 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:47.430.810 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:52.431.009 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:52.431.141 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:57.431.277 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:00:57.431.359 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:02.431.493 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:02.431.549 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:07.431.720 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:07.431.783 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:12.431.932 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:12.431.998 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:17.432.129 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:17.432.201 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:22.432.400 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:22.432.493 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:27.432.631 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:27.432.698 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:32.432.837 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:32.432.897 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:37.433.033 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:37.433.088 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:42.433.214 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:42.433.284 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:47.433.443 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:47.433.503 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:52.433.700 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:52.433.797 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:57.433.931 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:01:57.433.985 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:02.434.152 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:02.434.223 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:07.434.387 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:07.434.450 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:12.434.603 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:12.434.657 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:17.434.805 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:17.434.864 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:22.435.015 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:22.435.074 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:27.435.226 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:27.435.340 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:32.435.469 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:32.435.526 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:37.435.687 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:37.435.745 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:42.435.895 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:42.435.954 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:47.436.103 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:47.436.155 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:52.436.307 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:52.436.364 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:57.436.490 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:02:57.436.550 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:02.436.697 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:02.436.756 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:07.436.901 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:07.436.966 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:12.437.147 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:12.437.230 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:17.437.386 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:17.437.444 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:22.437.583 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:22.437.642 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:27.437.790 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:27.437.854 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:32.437.999 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:32.438.068 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:37.438.220 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:37.438.297 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:42.438.439 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:42.438.537 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:47.438.661 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:47.438.714 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:52.438.860 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:52.439.594 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:57.439.732 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:03:57.439.809 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:02.439.949 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:02.440.011 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:07.440.166 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:07.440.225 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:12.440.375 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:12.440.434 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:17.440.572 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:17.440.672 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:22.440.827 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:22.440.945 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:27.441.103 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:27.441.183 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:32.441.319 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:32.441.375 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:37.441.556 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:37.441.668 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:42.441.814 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:42.441.873 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:47.442.015 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:47.442.090 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:52.442.236 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:52.442.299 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:57.442.449 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:04:57.442.509 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:02.442.657 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:02.442.718 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:07.442.863 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:07.442.921 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:12.443.063 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:12.443.166 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:17.443.316 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:17.443.417 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:22.443.552 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:22.443.609 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:27.444.374 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:27.444.429 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:32.444.581 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:32.444.667 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:37.444.800 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:37.444.864 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:42.445.015 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:42.445.077 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:47.445.228 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:47.445.303 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:52.445.451 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:52.445.570 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:57.445.708 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:05:57.445.784 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:02.445.942 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:02.446.005 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:07.446.159 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:07.446.228 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:12.446.375 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:12.446.430 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:17.446.574 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:17.446.689 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:22.446.840 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:22.446.924 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:27.447.057 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:27.447.174 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:32.447.325 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:32.447.408 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:37.447.556 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:37.447.624 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:42.447.774 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:42.449.114 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:47.449.269 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:47.449.364 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:52.449.510 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:52.449.665 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:57.449.828 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:06:57.449.894 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:02.450.035 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:02.450.104 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:07.450.268 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:07.450.329 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:12.450.480 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:12.450.547 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:17.450.694 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:17.450.757 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:22.450.915 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:22.451.080 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:27.451.283 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:27.451.352 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:32.451.514 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:32.451.596 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:37.451.756 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:37.451.837 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:42.451.988 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:42.452.059 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:47.452.218 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:47.452.288 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:52.452.453 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:52.452.624 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:57.452.781 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:07:57.452.856 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:02.453.009 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:02.456.973 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:07.457.158 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:07.457.216 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:12.457.346 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:12.457.445 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:17.457.596 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:17.457.663 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:22.457.816 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:22.457.884 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:27.458.030 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:27.458.088 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:32.458.236 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:32.458.296 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:37.458.445 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:37.459.761 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:42.459.905 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:42.461.035 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:47.461.175 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:47.466.922 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:52.467.048 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:52.467.096 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:57.467.238 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:08:57.471.082 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:02.471.224 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:02.471.282 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:07.471.428 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:07.471.502 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:12.471.651 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:12.474.677 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:17.474.813 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:17.475.479 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:22.475.613 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:22.475.670 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:27.481.459 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:27.481.516 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:32.484.516 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:32.487.724 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:37.487.856 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:37.487.911 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:42.488.041 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:42.489.955 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:47.490.094 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:47.492.490 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:52.492.622 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:52.492.678 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:57.492.840 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:09:57.492.899 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:02.493.044 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:02.493.102 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:07.493.274 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:07.493.349 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:12.493.501 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:12.493.593 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:17.493.735 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:17.493.800 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:22.493.942 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:22.494.000 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:27.494.146 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:27.494.207 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:32.494.353 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:32.494.415 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:37.494.562 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:37.494.621 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:42.494.763 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:42.494.824 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:47.494.977 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:47.495.069 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:52.495.211 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:52.495.267 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:57.495.442 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:10:57.495.499 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:02.495.645 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:02.495.710 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:07.495.857 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:07.495.919 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:12.496.073 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:12.496.144 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:17.496.289 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:17.496.344 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:22.496.490 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:22.496.548 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:27.496.691 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:27.496.748 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:32.496.892 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:32.496.970 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:37.497.109 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:37.497.835 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:42.497.972 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:42.498.030 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:47.498.180 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:47.498.238 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:52.498.377 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:52.498.438 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:57.498.576 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:11:57.498.632 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:02.498.777 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:02.498.832 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:07.498.979 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:07.499.065 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:12.499.210 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:12.499.269 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:17.499.414 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:17.499.472 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:22.499.636 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:22.499.699 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:27.499.847 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:27.499.905 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:32.500.060 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:32.500.121 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:37.500.272 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:37.500.345 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:42.500.495 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:42.500.562 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:47.500.705 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:47.500.772 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:52.500.922 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:52.500.979 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:57.501.114 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:12:57.501.172 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:02.501.318 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:02.501.415 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:07.501.557 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:07.501.618 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:12.501.755 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:12.501.882 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:17.502.031 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:17.502.093 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:22.502.245 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:22.502.301 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:27.502.452 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:27.502.508 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:32.502.657 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:32.502.713 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:37.502.850 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:37.502.912 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:42.503.059 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:42.503.115 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:47.503.277 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:47.503.335 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:52.503.481 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:52.503.563 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:57.503.695 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:13:57.503.750 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:02.503.886 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:02.503.945 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:07.504.096 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:07.504.157 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:12.504.299 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:12.504.359 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:17.504.506 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:17.504.575 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:22.504.721 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:22.504.777 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:27.504.942 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:27.505.019 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:32.505.168 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:32.505.255 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:37.505.403 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:37.505.485 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:42.505.632 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:42.505.712 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:47.505.854 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:47.505.907 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:52.506.048 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:52.506.133 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:57.506.275 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:14:57.506.336 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:02.506.484 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:02.507.152 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:07.507.285 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:07.507.382 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:12.507.521 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:12.507.577 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:17.507.715 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:17.507.777 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:22.507.923 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:22.507.976 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:27.508.120 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:27.508.175 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:32.508.323 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:32.508.382 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:37.508.526 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:37.508.587 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:42.508.727 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:42.508.817 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:47.508.966 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:47.509.031 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:52.509.206 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:52.509.277 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:57.509.418 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:15:57.509.479 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:02.509.628 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:02.509.683 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:07.509.834 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:07.509.894 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:12.510.038 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:12.510.118 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:17.510.253 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:17.510.344 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:22.510.485 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:22.510.561 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:27.510.708 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:27.510.769 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:32.510.924 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:32.511.015 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:37.511.162 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:37.511.229 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:42.511.372 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:42.511.435 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:47.511.590 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:47.511.677 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:52.511.822 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:52.511.883 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:57.512.040 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:16:57.512.162 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:02.512.320 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:02.512.382 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:07.512.532 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:07.512.606 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:12.512.771 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:12.512.868 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:17.513.041 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:17.513.100 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:22.513.267 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:22.513.333 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:27.513.484 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:27.513.539 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:32.513.683 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:32.513.743 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:37.513.898 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:37.513.964 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:42.514.114 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:42.514.173 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:47.514.321 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:47.514.377 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:52.514.519 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:52.514.576 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:57.514.718 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:17:57.514.815 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:02.514.954 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:02.515.017 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:07.515.174 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:07.515.249 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:12.515.962 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:12.516.027 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:17.516.184 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:17.516.247 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:22.516.398 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:22.516.475 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:27.516.624 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:27.516.683 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:32.516.832 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:32.516.899 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:37.517.048 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:37.517.111 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:42.517.292 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:42.517.344 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:47.517.497 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:47.517.575 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:52.517.727 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:52.517.813 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:57.517.945 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:18:57.518.000 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:02.518.148 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:02.518.206 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:07.518.354 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:07.518.441 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:12.518.579 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:12.518.650 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:17.518.799 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:17.518.853 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:22.518.994 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:22.519.829 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:27.519.963 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:27.520.019 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:32.520.170 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:32.520.274 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:37.520.424 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:37.520.483 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:42.520.635 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:42.520.728 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:47.520.872 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:47.520.939 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:52.521.092 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:52.521.164 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:57.521.316 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:19:57.521.373 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:02.521.513 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:02.521.602 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:07.521.776 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:07.521.892 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:12.522.038 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:12.522.105 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:17.522.248 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:17.522.310 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:22.522.459 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:22.522.532 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:27.522.674 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:27.522.731 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:32.522.873 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:32.522.955 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:37.523.097 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:37.523.157 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:42.523.309 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:42.523.367 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:47.523.514 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:47.524.261 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:52.524.400 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:52.524.494 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:57.524.635 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:20:57.524.693 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:02.524.840 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:02.524.933 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:07.525.078 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:07.525.146 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:12.525.313 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:12.525.385 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:17.525.532 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:17.525.599 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:22.525.755 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:22.525.834 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:27.525.981 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:27.526.078 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:32.526.220 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:32.526.277 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:37.526.429 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:37.526.487 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:42.526.631 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:42.526.728 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:47.526.886 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:47.526.979 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:52.527.118 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:52.527.179 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:57.527.315 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:21:57.527.374 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:02.527.525 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:02.527.589 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:07.527.731 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:07.527.793 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:12.527.964 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:12.528.043 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:17.528.189 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:17.528.258 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:22.528.408 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:22.528.482 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:27.528.631 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:27.528.694 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:32.528.838 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:32.528.900 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:37.529.041 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:37.529.104 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:42.529.256 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:42.529.317 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:47.529.465 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:47.529.525 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:52.529.678 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:52.530.585 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:57.530.717 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:22:57.530.775 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:02.530.918 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:02.530.978 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:07.531.127 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:07.531.205 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:12.531.356 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:12.531.453 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:17.531.591 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:17.531.653 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:22.531.804 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:22.531.870 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:27.532.009 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:27.532.096 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:32.532.248 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:32.532.323 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:37.532.508 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:37.532.628 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:42.532.777 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:42.532.844 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:47.532.991 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:47.533.052 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:52.533.200 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:52.533.291 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:57.533.439 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:23:57.533.516 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:02.533.661 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:02.533.726 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:07.533.866 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:07.533.923 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:12.534.074 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:12.534.137 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:17.534.286 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:17.534.380 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:22.534.518 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:22.534.611 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:27.534.750 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:27.534.804 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:32.534.955 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:32.535.016 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:37.535.166 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:37.535.263 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:42.535.422 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:42.535.500 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:47.535.653 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:47.535.726 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:52.535.880 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:52.535.937 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:57.536.091 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:24:57.536.193 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:02.536.367 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:02.536.452 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:07.536.617 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:07.536.723 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:12.536.873 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:12.536.959 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:17.537.127 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:17.537.211 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:22.537.332 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:22.537.414 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:27.537.566 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:27.537.627 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:32.537.786 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:32.537.847 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:37.538.004 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:37.538.084 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:42.538.245 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:42.538.364 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:47.538.521 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:47.538.593 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:52.538.753 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:52.538.853 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:57.538.999 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:25:57.539.095 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:02.539.249 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:02.539.348 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:07.539.500 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:07.539.605 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:12.539.759 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:12.539.830 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:17.539.979 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:17.540.047 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:22.540.198 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:22.540.265 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:27.540.425 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:27.540.485 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:32.540.646 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:32.540.725 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:37.540.834 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:37.540.911 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:42.541.055 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:42.541.147 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:47.541.299 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:47.541.360 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:52.541.497 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:52.541.561 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:57.541.721 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:26:57.541.784 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:02.541.937 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:02.541.993 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:07.542.131 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:07.543.344 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:12.543.489 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:12.543.566 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:17.543.716 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:17.543.803 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:22.543.949 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:22.544.007 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:27.544.145 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:27.544.198 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:32.544.329 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:32.544.387 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:37.544.550 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:37.544.606 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:42.544.744 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:42.544.802 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:47.544.948 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:47.545.618 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:52.545.762 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:52.545.857 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:57.545.985 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:27:57.546.041 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:02.546.197 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:02.546.265 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:07.546.407 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:07.546.467 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:12.546.621 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:12.546.731 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:17.546.875 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:17.546.933 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:22.547.085 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:22.547.164 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:27.547.321 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:27.547.394 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:32.547.556 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:32.547.610 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:37.547.760 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:37.547.828 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:42.547.981 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:42.548.046 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:47.548.196 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:47.548.269 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:52.548.419 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:52.548.489 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:57.548.640 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:28:57.548.697 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:02.548.844 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:02.548.908 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:07.549.053 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:07.549.160 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:12.549.327 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:12.550.019 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:17.550.154 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:17.550.211 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:22.550.365 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:22.550.435 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:27.550.584 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:27.550.639 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:32.550.778 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:32.550.836 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:37.550.987 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:37.551.050 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:42.551.197 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:42.551.253 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:47.551.407 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:47.551.508 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:52.551.647 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:52.551.725 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:57.551.883 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:29:57.551.940 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:02.552.092 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:02.552.159 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:07.552.305 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:07.552.366 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:12.552.523 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:12.552.586 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:17.553.436 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:17.553.504 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:22.553.652 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:22.553.732 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:27.553.872 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:27.553.929 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:32.554.069 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:32.554.124 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:37.554.278 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:37.555.839 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:42.555.984 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:42.556.053 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:47.556.195 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:47.556.257 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:52.556.411 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:52.556.485 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:57.556.622 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:30:57.556.677 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:02.556.827 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:02.556.884 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:07.557.032 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:07.557.099 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:12.557.250 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:12.557.315 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:17.557.464 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:17.557.535 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:22.557.713 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:22.557.798 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:27.557.940 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:27.558.003 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:32.558.156 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:32.558.216 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:37.558.354 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:37.558.415 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:42.558.555 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:42.558.609 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:47.558.754 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:47.558.808 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:52.558.959 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:52.559.020 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:57.559.167 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:31:57.559.223 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:02.559.364 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:02.559.464 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:07.559.597 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:07.559.656 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:12.559.804 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:12.559.863 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:17.560.016 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:17.560.141 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:22.560.304 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:22.560.391 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:27.560.522 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:27.560.586 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:32.560.739 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:32.560.837 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:37.560.986 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:37.561.084 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:42.561.229 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:42.561.335 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:47.561.493 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:47.561.549 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:52.561.684 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:52.561.743 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:57.561.893 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:32:57.561.948 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:02.562.098 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:02.562.180 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:07.562.322 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:07.562.396 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:12.562.554 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:12.562.630 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:17.562.765 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:17.562.824 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:22.562.978 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:22.563.043 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:27.563.187 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:27.563.931 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:32.564.071 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:32.564.130 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:37.564.274 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:37.564.333 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:42.564.473 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:42.564.531 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:47.564.685 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:47.564.755 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:52.564.904 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:52.564.963 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:57.565.105 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:33:57.565.169 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:02.565.329 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:02.565.395 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:07.565.533 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:07.565.621 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:12.565.792 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:12.565.864 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:17.566.015 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:17.566.076 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:22.566.233 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:22.566.294 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:27.566.396 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:27.566.457 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:32.566.611 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:32.566.670 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:37.566.818 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:37.566.875 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:42.567.032 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:42.567.108 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:47.567.249 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:47.567.308 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:52.567.486 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:52.567.561 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:57.567.702 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:34:57.567.763 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:02.567.920 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:02.567.983 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:07.568.130 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:07.568.192 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:12.568.340 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:12.568.412 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:17.568.557 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:17.568.615 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:22.568.770 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:22.568.831 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:27.568.980 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:27.569.040 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:32.569.184 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:32.569.318 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:37.569.462 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:37.569.530 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:42.569.679 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:42.569.778 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:47.569.929 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:47.569.998 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:52.570.134 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:52.570.196 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:57.570.332 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:35:57.570.390 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:02.570.541 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:02.570.597 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:07.570.740 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:07.570.804 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:12.570.953 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:12.571.015 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:17.571.193 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:17.571.261 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:22.571.405 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:22.571.462 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:27.571.609 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:27.571.665 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:32.573.049 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:32.573.115 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:37.573.277 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:37.573.340 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:42.573.491 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:42.573.582 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:47.573.708 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:47.573.764 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:52.573.916 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:52.574.009 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:57.574.146 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:36:57.574.899 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:02.575.041 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:02.575.129 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:07.575.269 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:07.575.330 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:12.575.470 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:12.575.529 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:17.575.676 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:17.575.737 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:22.575.891 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:22.575.951 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:27.576.101 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:27.576.163 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:32.576.318 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:32.576.393 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:37.576.533 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:37.576.592 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:42.576.770 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:42.576.830 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:47.576.978 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:47.577.040 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:52.577.193 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:52.577.308 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:57.577.448 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:37:57.577.506 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:02.577.640 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:02.577.703 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:07.578.449 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:07.578.514 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:12.578.661 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:12.578.712 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:17.578.861 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:17.578.923 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:22.579.073 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:22.579.761 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:27.579.889 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:27.579.956 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:32.580.107 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:32.580.185 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:37.580.334 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:37.580.395 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:42.580.542 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:42.580.598 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:47.580.737 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:47.580.792 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:52.580.926 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:52.580.987 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:57.581.646 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:38:57.581.705 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:02.581.855 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:02.581.956 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:07.582.127 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:07.582.190 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:12.582.332 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:12.582.389 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:17.582.526 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:17.582.631 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:22.582.779 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:22.582.866 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:27.583.006 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:27.583.067 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:32.583.220 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:32.583.279 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:37.583.433 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:37.583.498 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:42.583.656 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:42.583.735 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:47.583.886 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:47.584.651 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:52.584.790 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:52.584.849 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:57.584.986 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:39:57.585.045 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:02.585.188 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:02.585.257 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:07.585.410 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:07.585.478 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:12.585.617 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:12.585.682 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:17.585.835 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:17.585.934 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:22.586.077 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:22.586.137 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:27.586.281 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:27.587.534 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:32.587.682 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:32.587.748 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:37.587.893 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:37.587.957 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:42.588.103 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:42.588.167 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:47.588.323 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:47.588.388 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:52.589.201 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:52.589.288 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:57.589.428 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:40:57.589.491 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:02.589.639 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:02.589.715 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:07.589.859 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:07.589.922 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:12.590.098 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:12.590.177 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:17.590.326 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:17.590.393 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:22.590.544 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:22.590.602 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:27.590.748 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:27.590.819 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:32.590.969 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:32.591.027 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:37.591.187 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:37.591.283 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:42.591.431 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:42.591.495 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:47.591.645 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:47.591.704 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:52.591.841 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:52.592.424 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:57.592.551 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:41:57.592.609 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:02.592.755 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:02.592.821 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:07.592.966 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:07.593.063 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:12.593.215 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:12.593.284 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:17.593.430 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:17.593.489 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:22.593.635 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:22.593.695 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:27.593.845 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:27.593.909 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:32.594.066 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:32.594.154 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:37.594.341 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:37.594.425 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:42.594.585 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:42.594.656 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:47.594.817 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:47.594.940 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:52.595.110 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:52.595.199 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:57.595.359 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:42:57.595.418 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:02.595.567 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:02.595.621 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:07.595.778 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:07.595.847 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:12.596.002 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:12.596.819 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:17.596.977 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:17.597.063 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:22.597.216 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:22.597.292 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:27.597.435 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:27.598.436 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:32.598.588 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:32.598.658 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:37.601.446 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:37.601.528 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:42.601.679 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:42.610.257 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:47.610.424 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:47.610.491 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:52.612.430 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:52.612.498 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:57.638.777 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:43:57.638.832 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:02.647.463 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:02.647.526 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:07.647.674 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:07.647.735 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:12.649.713 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:12.649.820 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:17.649.970 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:17.650.031 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:22.652.540 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:22.652.595 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:27.663.856 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:27.663.920 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:32.664.650 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:32.664.708 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:37.664.844 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:37.664.936 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:42.665.089 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:42.667.040 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:47.667.179 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:47.667.232 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:52.679.391 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:52.679.450 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:57.679.629 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:44:57.679.687 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:02.679.835 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:02.679.900 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:07.680.077 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:07.680.154 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:12.680.296 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:12.680.350 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:17.680.500 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:17.680.559 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:22.680.708 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:22.680.763 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:27.680.940 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:27.680.998 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:32.681.141 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:32.681.199 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:37.681.321 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:37.681.384 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:42.681.540 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:42.681.602 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:47.681.756 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:47.681.815 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:52.681.961 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:52.682.045 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:57.682.183 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:45:57.682.242 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:02.682.398 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:02.682.461 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:07.682.610 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:07.682.728 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:12.682.872 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:12.682.933 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:17.683.086 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:17.683.174 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:22.683.326 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:22.683.372 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:27.683.510 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:27.683.565 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:32.683.717 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:32.683.810 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:37.683.961 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:37.684.065 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:42.684.216 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:42.684.302 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:47.684.450 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:47.685.177 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:52.685.320 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:52.685.393 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:57.685.537 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:46:57.685.593 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:02.686.447 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:02.686.527 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:07.686.685 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:07.686.768 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:12.686.919 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:12.686.977 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:17.687.127 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:17.687.190 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:22.687.344 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:22.687.410 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:27.687.565 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:27.687.635 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:32.687.807 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:32.687.869 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:37.688.002 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:37.688.065 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:42.688.226 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:42.688.306 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:47.688.447 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:47.688.502 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:52.688.654 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:52.688.738 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:57.688.879 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:47:57.688.935 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:02.689.075 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:02.689.131 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:07.689.284 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:07.689.342 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:12.689.477 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:12.690.856 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:17.690.992 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:17.691.048 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:22.691.195 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:22.691.266 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:27.691.410 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:27.691.491 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:32.691.637 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:32.691.710 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:37.691.855 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:37.691.915 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:42.692.064 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:42.692.124 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:47.692.271 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:47.692.328 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:52.692.468 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:52.692.530 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:57.692.703 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:48:57.692.766 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:02.692.904 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:02.692.957 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:07.693.098 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:07.693.155 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:12.693.315 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:12.693.374 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:17.693.520 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:17.693.630 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:22.693.779 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:22.693.840 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:27.693.985 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:27.694.039 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:32.694.188 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:32.694.244 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:37.694.392 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:37.694.485 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:42.694.627 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:42.694.697 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:47.694.847 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:47.694.902 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:52.695.057 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:52.695.124 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:57.695.260 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:49:57.695.318 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:02.695.468 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:02.695.526 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:07.695.672 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:07.695.739 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:12.695.883 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:12.695.948 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:17.696.096 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:17.696.156 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:22.696.328 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:22.696.395 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:27.696.537 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:27.696.596 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:32.696.758 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:32.696.840 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:37.696.989 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:37.697.043 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:42.697.195 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:42.697.287 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:47.697.425 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:47.697.491 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:52.697.644 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:52.697.707 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:57.697.856 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:50:57.697.916 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:02.698.055 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:02.698.660 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:07.698.801 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:07.698.873 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:12.699.022 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:12.699.088 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:17.699.233 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:17.699.286 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:22.699.433 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:22.699.508 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:27.699.679 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:27.699.752 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:32.699.891 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:32.699.950 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:37.700.099 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:37.700.227 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:42.700.379 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:42.700.438 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:47.700.610 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:47.700.674 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:52.700.810 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:52.700.870 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:57.701.015 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:51:57.701.111 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:02.701.281 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:02.701.354 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:07.701.493 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:07.701.622 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:12.701.777 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:12.701.833 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:17.701.981 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:17.702.042 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:22.702.180 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:22.702.250 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:27.702.391 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:27.703.341 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:32.703.478 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:32.703.537 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:37.703.682 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:37.703.746 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:42.703.900 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:42.703.962 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:47.704.110 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:47.704.169 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:52.704.324 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:52.704.419 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:57.704.548 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:52:57.704.605 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:02.704.749 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:02.704.805 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:07.704.961 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:07.705.072 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:12.705.223 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:12.705.294 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:17.706.067 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:17.706.126 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:22.706.287 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:22.706.410 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:27.706.567 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:27.706.640 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:32.706.794 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:32.706.881 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:37.707.010 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:37.707.073 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:42.707.226 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:42.707.291 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:47.707.436 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:47.707.499 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:52.707.676 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:52.707.737 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:57.707.889 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:53:57.707.955 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:02.708.094 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:02.708.167 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:07.708.311 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:07.708.376 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:12.708.520 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:12.708.583 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:17.708.729 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:17.708.798 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:22.708.949 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:22.709.009 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:27.709.150 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:27.709.214 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:32.709.373 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:32.710.068 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:37.710.203 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:37.710.259 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:42.710.411 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:42.710.490 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:47.710.627 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:47.710.685 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:52.710.823 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:52.710.904 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:57.711.043 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:54:57.711.102 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:02.711.252 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:02.711.350 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:07.711.477 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:07.711.544 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:12.711.696 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:12.711.754 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:17.711.918 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:17.711.968 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:22.712.116 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:22.712.172 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:27.712.313 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:27.712.373 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:32.712.525 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:32.712.594 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:37.712.742 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:37.712.802 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:42.712.954 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:42.713.015 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:47.713.165 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:47.713.229 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:52.713.964 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:52.714.022 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:57.714.869 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:55:57.715.648 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:02.715.791 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:02.715.874 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:07.716.015 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:07.716.077 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:12.716.219 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:12.716.271 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:17.716.417 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:17.716.472 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:22.716.626 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:22.716.689 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:27.716.832 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:27.716.893 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:32.717.047 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:32.717.105 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:37.717.269 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:37.717.355 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:42.717.505 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:42.717.572 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:47.717.726 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:47.717.786 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:52.717.939 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:52.717.997 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:57.718.145 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:56:57.718.203 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:02.718.349 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:02.718.439 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:07.718.576 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:07.718.642 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:12.718.784 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:12.718.841 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:17.718.990 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:17.719.056 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:22.719.213 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:22.719.950 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:27.720.097 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:27.720.175 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:32.720.300 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:32.720.358 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:37.720.515 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:37.720.608 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:42.720.754 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:42.720.843 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:47.720.989 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:47.721.053 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:52.721.206 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:52.721.276 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:57.721.417 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:57:57.721.477 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:02.721.628 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:02.721.688 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:07.721.841 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:07.721.902 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:12.722.056 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:12.722.179 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:17.722.329 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:17.722.395 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:22.722.534 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:22.722.600 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:27.722.752 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:27.722.823 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:32.722.973 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:32.723.047 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:37.723.199 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:37.723.259 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:42.723.409 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:42.723.488 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:47.723.623 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:47.724.398 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:52.724.540 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:52.724.622 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:57.724.747 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:58:57.724.824 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:02.724.967 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:02.725.069 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:07.725.210 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:07.725.287 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:12.725.422 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:12.725.482 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:17.725.623 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:17.725.678 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:22.725.828 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:22.725.897 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:27.726.040 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:27.726.096 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:32.726.259 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:32.726.319 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:37.726.458 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:37.726.518 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:42.726.666 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:42.726.769 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:47.726.916 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:47.726.976 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:52.727.125 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:52.727.181 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:57.727.326 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-25-23:59:57.727.379 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:02.727.510 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:02.727.566 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:07.727.730 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:07.727.815 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:12.728.002 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:12.728.086 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:17.728.245 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:17.728.311 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:22.728.474 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:22.728.572 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:27.728.720 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:27.728.788 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:32.728.949 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:32.729.020 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:37.729.820 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:37.729.891 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:42.730.048 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:42.730.121 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:47.730.276 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:47.730.350 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:52.730.514 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:52.731.287 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:57.731.436 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:00:57.731.513 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:02.731.675 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:02.731.758 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:07.731.922 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:07.731.997 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:12.732.159 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:12.732.231 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:17.732.390 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:17.732.492 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:22.732.662 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:22.732.748 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:27.732.902 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:27.732.969 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:32.733.114 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:32.733.183 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:37.733.335 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:37.733.395 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:42.733.542 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:42.733.634 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:47.733.779 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:47.733.851 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:52.734.006 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:52.734.096 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:57.734.227 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:01:57.734.297 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:02.734.450 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:02.734.525 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:07.734.674 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:07.734.735 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:12.734.873 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:12.734.929 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:17.735.080 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:17.735.172 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:22.735.312 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:22.735.370 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:27.735.518 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:27.735.584 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:32.735.740 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:32.735.840 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:37.735.986 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:37.736.048 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:42.736.206 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:42.736.318 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:47.736.459 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:47.736.527 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:52.737.327 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:52.737.390 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:57.737.538 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:02:57.737.594 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:02.737.742 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:02.737.793 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:07.737.948 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:07.738.012 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:12.738.153 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:12.738.260 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:17.738.398 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:17.738.459 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:22.738.606 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:22.738.669 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:27.738.820 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:27.738.883 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:32.739.037 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:32.739.107 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:37.739.253 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:37.739.312 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:42.739.460 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:42.739.558 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:47.739.700 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:47.739.771 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:52.739.924 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:52.739.994 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:57.740.143 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:03:57.740.197 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:02.740.956 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:02.741.036 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:07.741.165 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:07.741.214 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:12.741.312 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:12.741.427 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:17.741.578 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:17.741.636 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:22.741.786 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:22.741.852 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:27.742.027 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:27.742.087 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:32.742.240 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:32.742.311 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:37.742.459 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:37.742.515 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:42.742.655 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:42.742.711 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:47.742.862 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:47.742.954 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:52.743.110 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:52.743.198 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:57.743.340 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:04:57.743.403 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:02.743.563 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:02.743.640 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:07.743.799 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:07.744.696 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:12.744.822 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:12.744.885 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:17.745.038 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:17.745.097 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:22.745.268 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:22.745.324 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:27.745.465 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:27.745.539 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:32.745.691 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:32.745.752 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:37.745.898 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:37.745.954 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:42.746.107 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:42.746.185 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:47.746.337 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:47.746.408 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:52.746.587 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:52.746.658 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:57.746.811 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:05:57.746.866 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:02.747.012 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:02.747.099 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:07.747.242 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:07.747.305 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:12.747.454 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:12.747.518 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:17.747.667 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:17.747.727 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:22.747.879 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:22.747.951 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:27.748.097 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:27.748.155 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:32.748.331 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:32.748.387 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:37.748.536 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:37.748.597 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:42.748.741 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:42.748.807 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:47.748.953 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:47.749.010 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:52.749.162 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:52.749.264 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:57.749.404 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:06:57.749.465 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:02.749.618 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:02.749.678 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:07.749.816 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:07.749.881 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:12.750.698 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:12.750.824 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:17.750.973 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:17.751.035 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:22.751.184 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:22.751.241 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:27.751.404 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:27.751.593 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:32.751.739 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:32.751.800 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:37.751.941 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:37.751.995 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:42.752.138 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:42.752.199 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:47.752.354 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:47.752.423 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:52.752.574 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:52.752.640 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:57.752.808 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:07:57.752.934 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:02.753.092 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:02.753.162 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:07.753.321 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:07.753.382 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:12.753.518 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:12.753.574 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:17.753.723 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:17.753.798 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:22.753.945 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:22.754.008 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:27.754.157 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:27.754.222 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:32.754.374 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:32.754.444 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:37.754.599 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:37.755.328 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:42.755.470 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:42.755.530 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:47.755.688 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:47.755.749 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:52.755.902 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:52.755.967 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:57.756.112 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:08:57.756.170 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:02.756.315 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:02.756.372 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:07.756.525 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:07.756.602 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:12.756.754 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:12.756.842 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:17.756.974 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:17.757.029 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:22.757.219 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:22.757.304 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:27.757.461 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:27.757.519 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:32.757.673 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:32.757.734 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:37.757.888 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:37.757.955 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:42.758.106 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:42.758.164 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:47.758.314 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:47.758.385 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:52.758.543 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:52.758.604 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:57.758.749 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:09:57.758.808 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:02.758.957 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:02.760.115 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:07.760.245 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:07.760.306 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:12.760.456 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:12.760.557 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:17.760.700 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:17.760.758 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:22.760.908 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:22.760.968 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:27.761.122 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:27.761.182 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:32.761.323 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:32.761.385 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:37.761.519 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:37.761.576 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:42.762.320 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:42.762.381 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:47.762.563 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:47.762.634 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:52.762.787 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:52.762.846 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:57.762.998 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:10:57.763.083 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:02.763.216 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:02.763.269 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:07.763.423 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:07.763.493 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:12.763.632 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:12.763.746 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:17.763.903 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:17.763.959 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:22.764.112 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:22.764.207 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:27.764.334 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:27.765.026 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:32.765.172 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:32.765.229 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:37.766.027 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:37.766.091 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:42.766.241 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:42.766.293 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:47.766.440 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:47.766.498 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:52.766.638 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:52.766.697 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:57.766.843 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:11:57.766.902 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:02.767.054 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:02.767.111 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:07.767.268 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:07.767.329 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:12.767.496 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:12.767.553 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:17.767.697 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:17.767.766 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:22.767.921 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:22.767.979 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:27.768.121 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:27.768.177 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:32.768.327 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:32.768.396 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:37.768.549 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:37.768.606 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:42.768.757 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:42.768.860 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:47.769.013 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:47.769.081 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:52.769.253 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:52.769.318 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:57.769.467 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:12:57.769.522 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:02.769.668 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:02.769.723 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:07.769.857 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:07.769.917 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:12.770.881 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:12.770.950 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:17.771.088 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:17.771.146 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:22.771.293 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:22.771.348 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:27.771.500 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:27.771.570 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:32.771.718 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:32.772.445 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:37.772.589 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:37.772.670 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:42.772.798 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:42.772.864 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:47.773.011 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:47.773.085 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:52.773.250 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:52.773.335 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:57.773.476 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:13:57.773.559 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:02.773.701 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:02.773.835 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:07.773.985 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:07.774.061 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:12.774.203 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:12.774.265 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:17.774.437 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:17.774.529 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:22.774.670 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:22.774.726 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:27.774.867 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:27.774.924 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:32.775.076 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:32.775.136 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:37.775.286 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:37.775.382 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:42.775.538 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:42.775.644 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:47.775.797 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:47.775.858 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:52.776.011 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:52.776.084 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:57.776.229 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:14:57.776.354 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:02.776.503 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:02.776.568 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:07.776.716 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:07.776.776 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:12.776.923 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:12.776.975 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:17.777.121 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:17.777.186 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:22.777.325 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:22.777.398 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:27.777.548 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:27.777.610 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:32.777.758 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:32.777.824 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:37.777.976 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:37.778.037 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:42.778.219 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:42.778.287 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:47.778.423 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:47.778.483 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:52.778.639 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:52.778.734 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:57.778.874 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:15:57.778.958 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:02.779.102 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:02.779.158 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:07.779.298 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:07.779.359 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:12.779.498 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:12.779.596 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:17.779.744 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:17.779.836 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:22.779.982 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:22.780.737 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:27.780.876 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:27.780.933 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:32.781.081 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:32.781.139 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:37.782.351 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:37.782.450 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:42.782.600 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:42.782.717 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:47.782.857 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:47.782.916 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:52.783.062 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:52.783.119 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:57.783.257 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:16:57.783.314 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:02.783.451 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:02.783.515 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:07.783.694 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:07.783.753 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:12.783.890 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:12.783.946 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:17.784.093 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:17.784.182 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:22.784.324 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:22.784.381 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:27.784.517 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:27.784.574 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:32.784.724 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:32.784.785 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:37.784.930 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:37.784.995 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:42.785.155 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:42.785.229 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:47.785.402 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:47.785.537 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:52.785.690 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:52.788.799 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:57.788.954 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:17:57.789.012 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:02.789.159 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:02.789.272 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:07.789.418 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:07.789.470 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:12.789.613 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:12.789.673 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:17.789.817 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:17.789.878 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:22.790.017 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:23.592.849 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:28.593.019 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:28.593.120 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:33.593.299 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:33.595.433 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:38.595.579 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:38.596.908 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:43.597.057 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:43.599.919 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:48.600.073 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:48.602.229 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:53.602.373 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:53.604.091 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:58.604.253 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:18:58.604.324 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:03.604.476 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:03.604.551 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:08.604.690 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:08.604.756 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:13.621.722 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:13.621.792 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:18.621.933 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:18.621.990 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:23.626.224 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:23.626.277 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:28.646.460 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:28.646.528 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:33.647.073 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:33.653.323 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:38.653.464 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:38.653.526 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:43.674.292 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:43.674.358 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:48.677.796 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:48.677.857 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:53.678.057 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:53.684.063 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:58.684.200 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:19:58.686.609 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:03.686.753 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:03.688.222 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:08.688.373 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:08.688.452 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:13.688.606 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:13.688.666 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:18.688.824 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:18.688.915 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:23.689.060 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:23.689.117 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:28.689.328 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:28.689.393 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:33.689.540 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:33.689.601 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:38.689.786 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:38.689.854 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:43.690.006 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:43.690.071 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:48.690.227 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:48.690.285 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:53.690.439 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:53.690.501 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:58.690.643 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:20:58.690.706 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:03.690.845 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:03.690.900 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:08.691.050 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:08.691.116 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:13.691.269 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:13.691.342 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:18.691.486 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:18.692.377 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:23.692.509 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:23.692.567 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:28.692.741 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:28.692.811 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:33.692.959 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:33.693.012 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:38.693.166 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:38.693.266 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:43.693.406 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:43.693.463 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:48.693.601 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:48.693.661 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:53.693.798 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:53.693.856 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:58.694.010 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:21:58.694.107 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:03.694.266 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:03.694.325 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:08.694.466 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:08.694.590 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:13.694.745 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:13.694.829 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:18.694.969 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:18.695.041 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:23.695.190 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:23.695.255 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:28.695.414 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:28.695.547 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:33.695.692 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:33.695.750 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:38.695.906 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:38.696.007 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:43.696.145 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:43.696.830 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:48.696.967 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:48.697.040 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:53.697.194 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:53.697.256 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:58.698.126 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:22:58.698.207 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:03.698.358 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:03.698.415 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:08.699.166 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:08.699.235 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:13.699.381 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:13.699.442 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:18.699.593 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:18.699.668 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:23.699.812 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:23.699.867 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:28.700.051 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:28.700.151 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:33.700.299 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:33.700.361 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:38.700.508 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:38.700.596 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:43.700.741 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:43.700.825 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:48.700.965 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:48.701.051 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:53.701.193 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:53.701.263 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:58.701.431 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:23:58.701.494 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:03.701.634 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:03.701.696 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:08.701.848 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:08.702.643 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:13.702.789 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:13.702.896 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:18.703.048 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:18.703.125 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:23.703.281 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:23.703.342 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:28.703.489 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:28.703.548 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:33.703.699 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:33.703.752 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:38.703.901 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:38.703.957 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:43.704.104 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:43.704.156 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:48.704.306 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:48.704.376 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:53.704.541 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:53.704.596 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:58.704.755 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:24:58.704.848 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:03.704.977 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:03.705.043 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:08.705.191 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:08.705.274 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:13.705.433 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:13.705.491 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:18.705.642 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:18.705.711 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:23.705.862 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:23.705.944 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:28.706.096 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:28.706.158 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:33.706.329 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:33.706.398 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:38.707.365 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:38.707.424 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:43.707.572 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:43.707.637 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:48.707.786 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:48.707.843 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:53.707.985 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:53.708.040 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:58.708.183 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:25:58.708.247 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:03.708.394 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:03.708.451 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:08.708.587 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:08.708.649 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:13.708.794 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:13.709.478 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:18.709.614 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:18.709.671 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:23.709.822 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:23.709.877 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:28.710.026 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:28.710.086 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:33.710.225 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:33.710.285 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:38.710.947 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:38.711.011 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:43.711.163 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:43.711.263 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:48.711.407 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:48.711.462 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:53.711.604 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:53.711.664 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:58.712.407 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:26:58.712.466 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:03.712.614 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:03.712.664 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:08.712.812 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:08.712.878 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:13.713.023 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:13.713.082 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:18.713.232 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:18.713.313 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:23.713.457 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:23.713.516 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:28.713.663 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:28.713.731 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:33.713.882 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:33.713.947 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:38.714.096 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:38.714.980 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:43.715.118 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:43.715.179 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:48.715.333 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:48.715.394 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:53.715.541 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:53.715.602 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:58.715.745 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:27:58.715.807 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:03.715.957 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:03.716.013 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:08.716.155 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:08.716.220 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:13.716.373 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:13.716.429 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:18.716.597 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:18.716.700 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:23.716.866 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:23.716.920 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:28.717.076 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:28.717.169 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:33.717.317 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:33.717.372 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:38.717.541 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:38.717.622 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:43.717.777 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:43.717.835 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:48.717.986 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:48.718.057 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:53.718.205 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:53.718.262 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:58.718.400 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:28:58.718.460 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:03.718.610 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:03.718.716 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:08.718.857 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:08.718.929 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:13.719.066 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:13.719.120 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:18.719.274 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:18.719.326 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:23.719.475 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:23.719.534 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:28.719.682 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:28.719.742 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:33.719.890 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:33.719.952 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:38.720.092 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:38.720.176 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:43.720.315 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:43.720.370 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:48.720.543 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:48.720.611 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:53.720.761 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:53.720.817 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:58.720.965 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:29:58.721.022 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:03.721.161 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:03.721.227 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:08.721.387 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:08.721.446 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:13.721.593 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:13.721.654 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:18.721.801 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:18.721.867 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:23.722.017 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:23.722.087 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:28.722.247 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:28.722.367 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:33.722.509 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:33.722.564 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:38.722.707 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:38.722.763 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:43.722.909 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:43.722.993 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:48.723.132 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:48.723.194 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:53.723.339 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:53.723.397 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:58.723.547 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:30:58.723.618 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:03.723.758 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:03.723.816 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:08.723.958 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:08.724.026 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:13.724.195 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:13.724.255 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:18.724.382 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:18.724.442 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:23.724.591 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:23.724.651 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:28.724.809 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:28.724.910 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:33.725.063 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:33.725.187 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:38.725.315 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:38.725.372 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:43.725.509 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:43.725.571 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:48.725.720 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:48.725.782 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:53.725.954 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:53.726.022 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:58.726.170 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:31:58.726.264 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:03.726.410 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:03.726.466 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:08.726.604 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:08.726.667 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:13.726.808 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:13.726.873 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:18.727.027 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:18.727.104 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:23.727.258 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:23.727.310 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:28.728.063 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:28.728.118 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:33.728.255 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:33.728.359 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:38.728.500 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:38.728.560 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:43.728.702 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:43.728.766 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:48.728.914 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:48.728.988 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:53.729.133 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:53.729.187 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:58.729.329 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:32:58.729.398 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:03.729.534 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:03.729.585 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:08.729.724 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:08.729.790 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:13.729.934 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:13.729.992 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:18.730.167 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:18.730.225 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:23.730.375 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:23.730.431 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:28.730.579 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:28.730.644 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:33.730.787 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:33.730.843 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:38.730.989 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:38.731.090 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:43.731.239 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:43.731.304 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:48.731.463 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:48.731.541 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:53.731.693 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:53.731.754 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:58.731.891 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:33:58.732.610 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:03.732.750 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:03.732.810 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:08.732.949 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:08.733.019 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:13.733.169 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:13.733.229 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:18.733.392 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:18.733.451 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:23.733.591 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:23.733.647 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:28.733.803 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:28.733.878 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:33.734.029 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:33.734.095 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:38.734.245 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:38.734.304 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:43.734.474 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:43.734.531 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:48.734.685 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:48.734.789 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:53.734.937 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:53.735.009 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:58.735.145 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:34:58.735.203 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:03.735.352 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:03.735.410 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:08.735.563 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:08.735.623 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:13.735.768 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:13.735.824 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:18.735.980 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:18.736.075 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:23.736.231 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:23.737.063 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:28.737.216 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:28.737.307 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:33.737.465 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:33.737.565 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:38.737.714 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:38.737.813 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:43.737.962 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:43.738.027 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:48.738.193 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:48.738.258 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:53.738.424 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:53.738.527 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:58.738.677 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:35:58.738.773 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:03.738.920 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:03.739.051 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:08.739.232 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:08.739.322 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:13.739.486 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:13.739.563 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:18.739.724 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:18.739.793 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:23.739.948 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:23.740.014 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:28.740.177 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:28.740.244 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:33.740.399 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:33.740.506 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:38.740.657 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:38.740.734 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:43.740.891 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:43.740.947 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:48.741.102 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:48.741.810 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:53.741.956 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:53.742.021 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:58.742.156 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:36:58.742.207 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:03.742.355 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:03.742.412 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:08.742.552 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:08.742.616 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:13.742.769 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:13.742.850 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:18.742.996 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:18.743.067 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:23.743.213 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:23.743.270 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:28.743.424 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:28.743.530 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:33.743.712 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:33.743.788 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:38.743.950 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:38.744.048 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:43.744.192 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:43.744.284 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:48.744.417 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:48.744.486 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:53.744.638 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:53.744.695 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:58.744.851 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:37:58.744.943 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:03.745.086 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:03.745.148 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:08.745.303 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:08.745.371 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:13.745.534 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:13.745.593 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:18.747.323 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:18.747.383 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:23.747.526 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:23.747.624 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:28.747.776 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:28.747.847 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:33.747.994 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:33.748.051 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:38.748.192 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:38.748.253 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:43.748.404 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:43.748.461 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:48.748.611 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:48.748.666 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:53.748.816 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:53.749.619 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:58.749.762 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:38:58.749.861 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:03.749.998 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:03.750.052 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:08.750.203 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:08.750.272 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:13.750.421 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:13.750.522 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:18.750.677 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:18.750.733 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:23.750.881 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:23.750.938 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:28.751.085 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:28.751.151 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:33.751.295 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:33.751.352 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:38.751.535 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:38.751.595 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:43.751.729 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:43.751.781 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:48.751.929 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:48.751.985 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:53.752.132 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:53.752.202 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:58.752.331 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:39:58.752.379 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:03.752.533 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:03.752.592 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:08.752.747 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:08.752.815 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:13.752.961 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:13.753.024 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:18.753.178 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:18.753.863 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:23.754.001 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:23.754.060 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:28.754.206 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:28.754.260 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:33.754.410 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:33.754.471 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:38.754.616 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:38.754.670 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:43.754.815 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:43.754.879 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:48.755.034 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:48.755.093 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:53.755.236 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:53.755.294 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:58.755.430 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:40:58.755.490 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:03.756.241 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:03.756.315 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:08.756.466 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:08.756.531 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:13.756.670 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:13.756.731 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:18.756.892 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:18.756.995 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:23.757.128 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:23.757.180 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:28.757.322 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:28.757.384 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:33.757.527 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:33.757.585 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:38.757.736 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:38.757.794 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:43.757.926 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:43.759.759 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:48.759.897 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:48.759.959 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:53.760.107 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:53.760.197 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:58.760.342 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:41:58.760.458 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:03.760.598 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:03.760.657 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:08.760.801 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:08.760.872 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:13.761.019 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:13.761.085 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:18.761.228 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:18.761.297 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:23.761.454 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:23.761.515 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:28.761.687 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:28.761.770 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:33.761.902 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:33.761.974 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:38.762.122 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:38.762.181 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:43.762.330 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:43.762.387 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:48.762.536 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:48.762.613 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:53.762.769 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:53.762.825 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:58.762.964 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:42:58.763.026 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:03.763.181 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:03.763.239 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:08.763.386 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:08.763.486 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:13.763.629 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:13.763.690 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:18.763.840 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:18.763.897 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:23.764.037 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:23.764.097 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:28.764.258 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:28.764.357 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:33.764.503 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:33.764.559 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:38.764.704 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:38.764.768 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:43.764.920 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:43.764.978 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:48.765.117 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:48.765.182 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:53.765.325 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:53.765.383 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:58.765.521 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:43:58.765.581 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:03.765.733 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:03.765.788 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:08.765.939 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:08.766.003 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:13.766.142 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:13.766.203 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:18.766.352 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:18.766.407 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:23.766.568 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:23.766.715 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:28.766.882 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:28.766.953 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:33.767.102 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:33.767.854 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:38.767.981 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:38.768.040 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:43.768.186 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:43.768.244 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:48.768.386 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:48.768.447 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:53.768.595 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:53.768.651 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:58.768.799 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:44:58.768.904 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:03.769.039 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:03.769.099 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:08.769.835 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:08.769.898 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:13.770.040 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:13.770.132 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:18.770.269 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:18.770.335 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:23.770.485 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:23.770.545 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:28.770.681 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:28.770.735 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:33.770.885 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:33.770.946 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:38.771.090 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:38.771.149 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:43.771.300 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:43.771.364 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:48.771.522 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:48.771.580 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:53.771.731 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:53.771.795 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:58.771.970 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:45:58.772.036 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:03.772.140 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:03.772.195 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:08.772.334 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:08.772.397 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:13.772.548 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:13.772.618 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:18.772.769 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:18.772.848 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:23.773.002 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:23.773.061 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:28.773.210 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:28.773.337 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:33.773.491 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:33.773.549 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:38.773.700 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:38.773.803 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:43.773.943 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:43.773.997 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:48.774.148 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:48.774.217 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:53.774.365 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:53.774.426 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:58.774.564 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:46:58.774.624 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:03.774.771 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:03.774.832 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:08.774.982 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:08.775.047 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:13.775.186 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:13.775.265 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:18.775.411 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:18.775.486 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:23.775.666 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:23.775.724 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:28.775.875 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:28.775.943 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:33.776.093 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:33.776.152 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:38.776.292 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:38.776.347 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:43.776.482 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:43.776.539 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:48.776.700 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:48.776.807 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:53.776.961 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:53.777.021 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:58.777.178 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:47:58.777.269 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:03.777.428 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:03.778.183 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:08.778.334 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:08.778.412 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:13.778.575 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:13.778.649 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:18.778.805 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:18.778.874 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:23.779.038 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:23.779.129 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:28.779.283 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:28.779.343 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:33.779.506 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:33.779.571 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:38.779.732 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:38.779.806 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:43.779.960 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:43.780.019 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:48.780.196 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:48.780.277 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:53.780.440 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:53.780.518 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:58.780.670 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:48:58.780.766 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:03.780.911 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:03.781.008 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:08.781.149 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:08.781.250 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:13.781.402 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:13.781.473 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:18.781.631 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:18.781.772 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:23.781.909 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:23.781.965 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:28.782.114 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:28.783.248 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:33.783.388 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:33.783.451 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:38.783.604 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:38.783.706 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:43.783.851 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:43.783.915 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:48.784.844 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:48.784.925 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:53.785.067 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:53.785.121 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:58.786.119 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:49:58.786.197 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:03.786.356 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:03.786.432 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:08.786.574 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:08.786.640 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:13.786.793 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:13.786.860 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:18.787.012 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:18.787.088 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:23.787.242 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:23.787.310 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:28.787.462 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:28.787.524 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:33.787.675 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:33.787.766 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:38.787.922 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:38.787.985 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:43.788.133 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:43.788.190 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:48.788.337 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:48.788.400 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:53.788.552 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:53.789.381 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:58.789.521 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:50:58.789.583 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:03.789.723 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:03.789.782 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:08.789.937 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:08.790.003 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:13.790.152 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:13.790.213 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:18.790.371 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:18.790.434 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:23.790.589 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:23.790.680 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:28.790.824 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:28.790.886 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:33.791.029 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:33.792.375 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:38.792.517 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:38.792.575 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:43.792.729 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:43.792.794 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:48.792.943 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:48.793.049 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:53.793.208 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:53.793.282 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:58.793.434 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:51:58.793.531 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:03.793.668 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:03.793.722 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:08.793.865 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:08.793.925 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:13.794.077 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:13.794.144 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:18.794.330 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:18.794.441 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:23.794.590 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:23.794.643 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:28.794.795 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:28.794.908 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:33.795.066 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:33.795.130 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:38.795.277 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:38.795.344 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:43.795.495 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:43.795.566 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:48.795.716 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:48.795.772 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:53.795.930 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:53.796.095 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:58.796.246 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:52:58.796.338 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:03.796.481 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:03.796.538 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:08.796.684 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:08.796.754 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:13.796.899 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:13.796.963 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:18.797.115 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:18.797.174 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:23.797.327 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:23.797.376 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:28.797.520 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:28.799.991 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:33.800.136 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:33.801.571 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:38.801.718 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:38.801.769 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:43.801.933 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:43.801.985 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:48.802.129 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:48.802.189 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:53.802.337 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:53.804.695 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:58.804.835 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:53:58.804.899 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:03.809.827 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:03.809.888 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:08.813.424 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:08.813.491 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:13.814.785 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:13.814.847 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:18.831.208 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:18.831.271 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:23.832.741 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:23.835.753 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:28.835.888 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:28.835.946 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:33.840.678 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:33.842.244 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:38.842.391 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:38.845.487 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:43.845.632 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:43.847.067 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:48.847.205 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:48.847.252 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:53.847.399 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:53.849.155 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:58.849.311 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:54:58.851.630 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:03.851.764 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:03.851.822 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:08.855.742 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:08.855.796 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:13.855.944 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:13.856.003 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:18.857.428 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:18.857.500 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:23.857.651 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:23.857.709 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:28.857.858 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:28.857.915 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:33.858.067 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:33.858.142 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:38.858.277 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:38.858.342 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:43.858.502 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:43.858.559 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:48.858.709 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:48.860.205 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:53.860.345 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:53.860.399 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:58.860.547 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:55:58.860.627 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:03.860.769 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:03.860.828 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:08.860.979 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:08.861.042 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:13.861.912 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:13.861.971 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:18.862.125 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:18.862.180 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:23.862.331 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:23.862.455 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:28.862.612 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:28.862.690 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:33.862.867 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:33.862.932 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:38.863.091 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:38.863.214 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:43.863.350 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:43.863.415 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:48.863.569 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:48.863.622 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:53.863.774 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:53.863.827 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:58.863.972 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:56:58.864.034 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:03.864.190 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:03.864.297 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:08.864.451 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:08.864.513 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:13.864.663 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:13.865.497 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:18.865.643 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:18.865.704 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:23.865.855 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:23.865.907 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:28.866.057 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:28.866.115 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:33.866.254 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:33.866.316 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:38.866.471 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:38.866.541 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:43.866.688 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:43.866.744 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:48.866.892 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:48.866.986 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:53.867.125 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:53.867.249 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:58.867.387 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:57:58.867.473 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:03.867.605 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:03.867.665 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:08.867.820 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:08.867.877 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:13.868.026 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:13.868.082 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:18.868.230 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:18.868.287 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:23.868.436 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:23.868.497 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:28.868.647 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:28.868.715 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:33.868.868 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:33.868.928 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:38.869.093 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:38.869.160 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:43.869.322 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:43.869.398 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:48.869.538 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:48.869.596 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:53.869.743 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:53.869.795 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:58.869.948 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:58:58.870.060 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:03.870.217 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:03.870.305 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:08.870.447 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:08.870.507 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:13.870.654 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:13.870.708 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:18.870.858 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:18.872.240 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:23.872.384 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:23.872.440 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:28.872.586 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:28.872.648 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:33.872.805 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:33.872.864 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:38.873.016 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:38.873.111 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:43.873.263 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:43.873.317 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:48.873.469 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:48.873.537 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:53.873.689 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:53.873.749 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:58.873.895 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-00:59:58.873.953 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:03.874.140 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:03.874.202 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:08.874.349 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:08.874.412 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:13.875.189 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:13.875.284 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:18.875.433 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:18.875.504 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:23.875.657 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:23.875.716 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:28.875.868 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:28.875.945 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:33.876.084 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:33.876.145 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:38.876.305 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:38.876.376 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:43.876.525 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:43.877.188 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:48.877.314 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:48.877.379 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:53.877.527 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:53.877.583 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:58.877.733 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:00:58.877.789 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:03.877.950 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:03.878.014 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:08.878.177 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:08.878.255 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:13.878.409 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:13.878.472 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:18.878.633 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:18.878.754 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:23.878.906 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:23.878.968 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:28.879.137 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:28.879.201 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:33.879.351 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:33.879.411 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:38.879.549 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:38.879.611 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:43.880.773 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:43.880.855 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:48.880.998 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:48.881.074 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:53.881.224 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:53.881.305 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:58.881.461 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:01:58.881.526 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:03.881.682 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:03.881.760 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:08.881.913 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:08.882.631 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:13.882.776 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:13.882.835 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:18.882.995 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:18.883.069 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:23.883.222 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:23.883.281 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:28.883.433 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:28.883.498 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:33.883.644 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:33.883.710 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:38.883.863 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:38.883.964 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:43.884.105 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:43.884.166 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:48.884.321 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:48.884.379 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:53.884.544 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:53.884.602 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:58.884.748 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:02:58.884.809 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:03.884.958 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:03.885.017 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:08.885.171 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:08.885.252 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:13.886.204 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:13.886.277 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:18.886.437 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:18.886.528 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:23.886.672 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:23.886.738 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:28.886.891 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:28.886.948 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:33.887.090 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:33.887.760 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:38.887.903 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:38.887.955 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:43.888.107 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:43.888.184 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:48.888.340 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:48.888.420 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:53.888.579 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:53.888.638 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:58.888.801 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:03:58.888.876 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:03.889.027 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:03.889.082 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:08.889.252 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:08.889.336 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:13.889.487 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:13.890.898 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:18.891.052 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:18.891.159 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:23.891.304 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:23.891.377 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:28.891.537 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:28.891.617 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:33.891.782 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:33.891.842 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:38.891.981 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:38.892.042 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:43.892.197 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:43.892.256 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:48.892.404 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:48.892.463 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:53.892.607 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:53.892.673 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:58.892.848 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:04:58.892.914 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:03.893.063 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:03.893.120 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:08.893.287 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:08.893.360 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:13.893.512 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:13.893.570 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:18.893.724 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:18.893.795 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:23.893.946 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:23.894.002 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:28.894.160 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:28.894.269 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:33.894.411 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:33.894.510 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:38.894.663 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:38.895.329 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:43.895.458 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:43.895.512 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:48.895.659 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:48.895.723 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:53.895.878 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:53.895.938 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:58.896.098 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:05:58.896.176 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:03.896.334 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:03.896.396 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:08.896.559 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:08.896.631 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:13.896.789 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:13.896.882 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:18.897.030 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:18.897.104 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:23.897.304 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:23.897.379 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:28.897.540 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:28.897.630 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:33.897.775 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:33.897.853 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:38.898.008 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:38.898.111 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:43.898.258 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:43.898.367 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:48.898.529 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:48.898.587 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:53.898.738 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:53.898.796 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:58.898.948 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:06:58.899.006 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:03.899.153 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:03.899.952 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:08.900.104 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:08.900.180 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:13.900.327 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:13.900.389 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:18.900.536 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:18.900.600 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:23.900.759 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:23.900.819 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:28.900.967 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:28.901.039 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:33.901.190 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:33.901.264 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:38.901.403 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:38.901.509 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:43.901.660 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:43.901.719 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:48.901.890 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:48.901.950 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:53.902.093 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:53.902.154 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:58.902.303 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:07:58.902.403 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:03.902.544 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:03.902.599 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:08.902.754 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:08.902.832 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:13.902.983 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:13.903.041 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:18.903.200 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:18.903.275 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:23.903.427 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:23.903.528 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:28.903.667 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:28.904.426 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:33.904.567 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:33.904.625 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:38.904.780 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:38.904.837 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:43.904.980 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:43.905.040 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:48.905.195 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:48.905.282 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:53.905.392 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:53.905.453 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:58.906.222 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:08:58.906.286 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:03.906.437 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:03.906.497 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:08.906.650 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:08.906.708 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:13.906.881 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:13.906.937 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:18.907.088 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:18.907.153 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:23.907.305 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:23.907.359 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:28.907.505 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:28.907.557 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:33.907.697 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:33.907.755 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:38.907.916 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:38.907.995 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:43.908.143 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:43.908.205 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:48.908.357 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:48.908.416 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:53.909.249 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:53.910.135 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:58.910.273 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:09:58.910.375 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:03.910.519 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:03.910.574 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:08.911.393 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:08.911.467 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:13.912.187 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:13.912.270 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:18.912.410 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:18.912.468 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:23.912.622 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:23.912.683 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:28.912.834 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:28.912.892 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:33.913.036 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:33.913.117 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:38.913.261 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:38.913.327 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:43.913.478 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:43.913.536 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:48.913.683 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:48.913.745 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:53.913.890 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:53.913.949 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:58.914.095 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:10:58.914.153 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:03.914.303 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:03.914.358 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:08.914.505 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:08.914.569 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:13.914.718 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:13.914.776 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:18.914.954 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:18.915.036 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:23.915.173 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:23.915.253 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:28.915.392 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:28.915.449 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:33.915.600 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:33.915.665 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:38.915.817 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:38.915.879 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:43.916.017 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:43.916.075 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:48.916.225 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:48.916.279 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:53.916.433 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:53.916.494 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:58.916.643 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:11:58.916.735 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:03.916.881 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:03.916.939 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:08.917.798 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:08.917.891 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:13.918.039 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:13.918.098 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:18.918.242 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:18.918.295 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:23.918.447 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:23.918.507 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:28.918.665 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:28.918.747 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:33.918.892 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:33.918.959 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:38.919.116 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:38.919.205 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:43.919.368 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:43.919.430 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:48.919.575 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:48.919.630 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:53.919.785 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:53.919.850 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:58.920.000 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:12:58.920.058 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:03.920.209 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:03.920.277 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:08.920.432 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:08.920.498 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:13.920.644 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:13.920.710 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:18.920.860 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:18.920.915 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:23.921.071 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:23.921.839 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:28.921.986 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:28.922.059 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:33.922.212 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:33.922.268 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:38.922.412 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:38.922.470 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:43.922.620 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:43.922.674 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:48.922.825 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:48.922.889 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:53.923.039 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:53.923.099 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:58.923.251 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:13:58.923.322 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:03.923.471 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:03.923.527 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:08.923.693 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:08.923.748 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:13.923.899 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:13.923.962 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:18.924.118 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:18.924.203 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:23.924.349 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:23.924.416 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:28.924.565 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:28.924.630 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:33.924.777 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:33.924.855 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:38.925.016 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:38.925.073 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:43.925.215 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 4 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:43.925.281 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,fffd8a5bf1e0,python):2024-07-26-01:14:48.565.201 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:295] ProcessUnregister] Node 2 has unregistered. 
+[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:48.925.420 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:85] Finalize] The meta server node can not be finalized because there are still 3 alive nodes. +[WARNING] DISTRIBUTED(62168,ffff8786a010,python):2024-07-26-01:14:48.925.481 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:113] Finalize] This log means the cluster is successfully created. Retry to finalize the node and exit cluster... +[WARNING] DISTRIBUTED(62168,fffd8a5bf1e0,python):2024-07-26-01:14:50.076.292 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:295] ProcessUnregister] Node 0 has unregistered. +[WARNING] DISTRIBUTED(62168,fffd8a5bf1e0,python):2024-07-26-01:14:50.229.915 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:295] ProcessUnregister] Node 3 has unregistered. +[WARNING] DISTRIBUTED(62168,fffd8a5bf1e0,python):2024-07-26-01:14:53.756.485 [mindspore/ccsrc/distributed/cluster/topology/meta_server_node.cc:295] ProcessUnregister] Node 1 has unregistered. +/arrow/cpp/src/arrow/filesystem/s3fs.cc:2598: arrow::fs::FinalizeS3 was not called even though S3 was initialized. 
This could lead to a segmentation fault at exit diff --git "a/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\346\227\245\345\277\227\346\226\207\344\273\266/worker_0.log" "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\346\227\245\345\277\227\346\226\207\344\273\266/worker_0.log" new file mode 100644 index 00000000..84e657a9 --- /dev/null +++ "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\346\227\245\345\277\227\346\226\207\344\273\266/worker_0.log" @@ -0,0 +1,17099 @@ +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. + return self._float_to_str(self.smallest_subnormal) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. 
+ return self._float_to_str(self.smallest_subnormal) +[WARNING] DISTRIBUTED(62173,ffffa5590010,python):2024-07-25-18:09:19.322.068 [mindspore/ccsrc/distributed/rpc/tcp/tcp_comm.cc:464] Connect] Waiting for the state of the connection to 127.0.0.1:8118 to be connected...Retry number: 1 +[WARNING] DISTRIBUTED(62173,ffffa5590010,python):2024-07-25-18:09:20.323.096 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:194] BuildCluster] Topology build timed out., retry(1/200). +[WARNING] DISTRIBUTED(62173,ffffa5590010,python):2024-07-25-18:09:23.323.274 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:194] BuildCluster] Topology build timed out., retry(2/200). +[WARNING] DISTRIBUTED(62173,ffffa5590010,python):2024-07-25-18:09:26.323.451 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:196] BuildCluster] Cluster is successfully initialized. +[WARNING] DISTRIBUTED(62173,ffffa5590010,python):2024-07-25-18:09:26.323.872 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:260] PostProcess] This node 0 rank id: 0 +[WARNING] DISTRIBUTED(62173,ffffa5590010,python):2024-07-25-18:09:51.655.388 [mindspore/ccsrc/distributed/collective/collective_manager.cc:259] CreateCommunicationGroup] Start to create communication group: hccl_world_group [const vector]{0, 1, 2, 3} +[WARNING] DISTRIBUTED(62173,ffffa5590010,python):2024-07-25-18:09:51.658.571 [mindspore/ccsrc/distributed/collective/collective_manager.cc:335] CreateCommunicationGroup] Begin initialize communication group on the device side: hccl_world_group +[WARNING] DISTRIBUTED(62173,ffffa5590010,python):2024-07-25-18:09:53.366.475 [mindspore/ccsrc/distributed/collective/collective_manager.cc:345] CreateCommunicationGroup] End initialize communication group on the device side: hccl_world_group +2024-07-25 18:09:53,369 - mindformers[mindformers/tools/utils.py:168] - INFO - set strategy path to './output/strategy/ckpt_strategy_rank_0.ckpt' +2024-07-25 18:09:53,405 - 
mindformers[mindformers/trainer/trainer.py:919] - INFO - Load configs in /home/ma-user/work/MindFormers/mindformers/configs/gpt2/run_gpt2.yaml to build trainer. +2024-07-25 18:09:53,405 - mindformers[mindformers/trainer/trainer.py:949] - INFO - ..........Init Config.......... +2024-07-25 18:09:53,405 - mindformers[mindformers/core/parallel_config.py:45] - INFO - initial recompute_config from dict: {'recompute': True, 'select_recompute': False, 'parallel_optimizer_comm_recompute': False, 'mp_comm_recompute': True, 'recompute_slice_activation': True} +2024-07-25 18:09:53,405 - mindformers[mindformers/core/parallel_config.py:51] - INFO - initial parallel_config from dict: {'data_parallel': 1, 'model_parallel': 4, 'pipeline_stage': 1, 'use_seq_parallel': False, 'micro_batch_num': 1, 'vocab_emb_dp': True, 'gradient_aggregation_group': 4} +2024-07-25 18:09:53,406 - mindformers[mindformers/tools/utils.py:153] - INFO - set output path to '/home/ma-user/work/MindFormers/mindformers/research/output' +2024-07-25 18:09:53,407 - mindformers[mindformers/trainer/base_trainer.py:85] - INFO - Now Running Task is: text_generation, Model is: llama3_8b +2024-07-25 18:09:53,407 - mindformers[mindformers/trainer/base_trainer.py:111] - WARNING - Input model name is not in the supported list or unspecified. 
+2024-07-25 18:09:53,407 - mindformers[mindformers/trainer/base_trainer.py:112] - WARNING - See the list of supported task and model name: ['baichuan2_13b', 'baichuan2_7b', 'baichuan_7b', 'bloom_176b', 'bloom_560m', 'bloom_65b', 'bloom_7.1b', 'codegeex2_6b', 'codellama_34b', 'common', 'deepseek_33b', 'glm2_6b', 'glm2_6b_lora', 'glm2_6b_ptuning2', 'glm3_6b', 'glm_6b', 'glm_6b_chat', 'glm_6b_lora', 'glm_6b_lora_chat', 'gpt2', 'gpt2_13b', 'gpt2_52b', 'gpt2_lora', 'gpt2_xl', 'gpt2_xl_lora', 'internlm_7b', 'internlm_7b_lora', 'llama2_13b', 'llama2_70b', 'llama2_7b', 'llama_13b', 'llama_65b', 'llama_7b', 'llama_7b_lora', 'pangualpha_13b', 'pangualpha_2_6b', 'qwen_7b', 'qwen_7b_lora', 'skywork_13b', 'yi_34b', 'yi_6b', 'ziya_13b'] +2024-07-25 18:09:53,408 - mindformers[mindformers/trainer/base_trainer.py:113] - WARNING - The default model config: /home/ma-user/work/MindFormers/mindformers/configs/gpt2/run_gpt2.yaml will now be used for the text_generation task +2024-07-25 18:09:53,408 - mindformers[mindformers/trainer/trainer.py:1004] - INFO - ..........Init Model.......... +2024-07-25 18:09:53,408 - mindformers[mindformers/trainer/trainer.py:1027] - INFO - ..........Init Train Dataset.......... +2024-07-25 18:09:53,408 - mindformers[mindformers/trainer/trainer.py:335] - INFO - ==========Trainer Init Success!========== +2024-07-25 18:09:53,408 - mindformers[mindformers/trainer/trainer.py:476] - WARNING - The `finetune_checkpoint` will be deprecated. Please use `resume_from_checkpoint` instead. +2024-07-25 18:09:53,409 - mindformers[mindformers/trainer/trainer.py:1004] - INFO - ..........Init Model.......... 
+2024-07-25 18:09:53,409 - mindformers[mindformers/trainer/base_trainer.py:176] - INFO - The current parallel mode is semi_auto_parallel, full batch is True,so global batch size will be changed: global_batch_size = batch_size * data_parallel * micro_batch_interleave_num * gradient_accumulation_steps = 32 = 32 * 1 * 1 * 1 +2024-07-25 18:09:53,409 - mindformers[mindformers/trainer/base_trainer.py:624] - INFO - .........Build Dataset For Train.......... +2024-07-25 18:09:53,409 - mindformers[mindformers/trainer/base_trainer.py:353] - INFO - .........Build Dataset From Config.......... +2024-07-25 18:09:53,409 - mindformers[mindformers/dataset/causal_language_model_dataset.py:166] - INFO - Now Create Causal Language Model Dataset. +2024-07-25 18:09:53,416 - mindformers[mindformers/trainer/base_trainer.py:626] - INFO - Create train dataset finish, dataset size:1625 +2024-07-25 18:09:53,417 - mindformers[mindformers/trainer/utils.py:171] - INFO - Will be Training epochs:10, sink_size:2 +2024-07-25 18:09:53,417 - mindformers[mindformers/trainer/utils.py:173] - INFO - Create training dataset finish, dataset size:1625 +2024-07-25 18:09:53,417 - mindformers[mindformers/trainer/base_trainer.py:656] - INFO - .........Build Net For Train.......... +2024-07-25 18:09:53,418 - mindformers[mindformers/trainer/base_trainer.py:387] - INFO - .........Build Network From Config.......... +2024-07-25 18:09:53,418 - mindformers[mindformers/version_control.py:61] - INFO - The Cell Reuse compilation acceleration feature is not supported when the environment variable ENABLE_CELL_REUSE is 0 or MindSpore version is earlier than 2.1.0 or stand_alone mode or pipeline_stages <= 1 +2024-07-25 18:09:53,419 - mindformers[mindformers/version_control.py:65] - INFO - +The current ENABLE_CELL_REUSE=0, please set the environment variable as follows: +export ENABLE_CELL_REUSE=1 to enable the Cell Reuse compilation acceleration feature. 
+2024-07-25 18:09:53,419 - mindformers[mindformers/version_control.py:74] - INFO - The Cell Reuse compilation acceleration feature only works in pipeline parallel mode(pipeline_stage>1).Current pipeline stage=1, the feature is disabled by default. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:09:53.420.994 [/home/ma-user/work/MindFormers/mindformers/mindformers/modules/transformer/op_parallel_config.py:244] The optimizer shard True in auto_parallel_context is not equal to the optimizer_shard None in the OpParallelConfig. Please check the optimizer_shard to make them consistent. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:09:53.423.669 [/home/ma-user/work/MindFormers/mindformers/mindformers/modules/transformer/op_parallel_config.py:244] The optimizer shard True in auto_parallel_context is not equal to the optimizer_shard None in the OpParallelConfig. Please check the optimizer_shard to make them consistent. +2024-07-25 18:09:53,530 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:09:53.532.122 [mindspore/common/_decorator.py:40] 'Parameter' is deprecated from version 2.3 and will be removed in a future version, use 'add_pipeline_stage' instead. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:09:53.532.252 [mindspore/common/parameter.py:806] This interface may be deleted in the future. 
+2024-07-25 18:09:53,552 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,572 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,593 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,613 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,634 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,654 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,675 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,695 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,715 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:54,183 - mindformers[mindformers/models/modeling_utils.py:1438] - INFO - model built, but weights is unloaded, since the config has no checkpoint_name_or_path attribute or checkpoint_name_or_path is None. +2024-07-25 18:09:54,378 - mindformers[mindformers/models/modeling_utils.py:1438] - INFO - model built, but weights is unloaded, since the config has no checkpoint_name_or_path attribute or checkpoint_name_or_path is None. +[INFO] 2024-07-25 18:09:54,379 [62173] [SDK] : Start to freeze model for delta, mode: lora, include list: None, exclude list: None +[INFO] 2024-07-25 18:09:54,380 [62173] [SDK] : Start to freeze model, include list: ['*'], exclude list: ['*mindpet_delta_lora*'] +[INFO] 2024-07-25 18:09:54,386 [62173] [SDK] : End to freeze model. 
+[INFO] 2024-07-25 18:09:54,386 [62173] [SDK] : End to freeze model for delta. +2024-07-25 18:09:54,400 - mindformers[mindformers/trainer/base_trainer.py:543] - INFO - Network Parameters: 3407872. +2024-07-25 18:09:54,401 - mindformers[mindformers/trainer/base_trainer.py:678] - INFO - .........Build Optimizer For Train.......... +2024-07-25 18:09:54,401 - mindformers[mindformers/trainer/base_trainer.py:426] - INFO - .........Build Optimizer From Config.......... +2024-07-25 18:09:54,401 - mindformers[mindformers/trainer/base_trainer.py:459] - INFO - .........Build LR Schedule From Config.......... +2024-07-25 18:09:54,406 - mindformers[mindformers/trainer/optimizer_grouped_parameters.py:74] - WARNING - dynamic_lr_schedule will be reset and invalid when layer_scale is False. +2024-07-25 18:09:54,410 - mindformers[mindformers/trainer/optimizer_grouped_parameters.py:113] - INFO - Param groups = { + "decay": { + "weight_decay": 0.0, + "params": [ + "model.layers.0.attention.wq.mindpet_delta_lora_a", + "model.layers.0.attention.wq.mindpet_delta_lora_b", + "model.layers.0.attention.wv.mindpet_delta_lora_a", + "model.layers.0.attention.wv.mindpet_delta_lora_b", + "model.layers.1.attention.wq.mindpet_delta_lora_a", + "model.layers.1.attention.wq.mindpet_delta_lora_b", + "model.layers.1.attention.wv.mindpet_delta_lora_a", + "model.layers.1.attention.wv.mindpet_delta_lora_b", + "model.layers.2.attention.wq.mindpet_delta_lora_a", + "model.layers.2.attention.wq.mindpet_delta_lora_b", + "model.layers.2.attention.wv.mindpet_delta_lora_a", + "model.layers.2.attention.wv.mindpet_delta_lora_b", + "model.layers.3.attention.wq.mindpet_delta_lora_a", + "model.layers.3.attention.wq.mindpet_delta_lora_b", + "model.layers.3.attention.wv.mindpet_delta_lora_a", + "model.layers.3.attention.wv.mindpet_delta_lora_b", + "model.layers.4.attention.wq.mindpet_delta_lora_a", + "model.layers.4.attention.wq.mindpet_delta_lora_b", + "model.layers.4.attention.wv.mindpet_delta_lora_a", + 
"model.layers.4.attention.wv.mindpet_delta_lora_b", + "model.layers.5.attention.wq.mindpet_delta_lora_a", + "model.layers.5.attention.wq.mindpet_delta_lora_b", + "model.layers.5.attention.wv.mindpet_delta_lora_a", + "model.layers.5.attention.wv.mindpet_delta_lora_b", + "model.layers.6.attention.wq.mindpet_delta_lora_a", + "model.layers.6.attention.wq.mindpet_delta_lora_b", + "model.layers.6.attention.wv.mindpet_delta_lora_a", + "model.layers.6.attention.wv.mindpet_delta_lora_b", + "model.layers.7.attention.wq.mindpet_delta_lora_a", + "model.layers.7.attention.wq.mindpet_delta_lora_b", + "model.layers.7.attention.wv.mindpet_delta_lora_a", + "model.layers.7.attention.wv.mindpet_delta_lora_b", + "model.layers.8.attention.wq.mindpet_delta_lora_a", + "model.layers.8.attention.wq.mindpet_delta_lora_b", + "model.layers.8.attention.wv.mindpet_delta_lora_a", + "model.layers.8.attention.wv.mindpet_delta_lora_b", + "model.layers.9.attention.wq.mindpet_delta_lora_a", + "model.layers.9.attention.wq.mindpet_delta_lora_b", + "model.layers.9.attention.wv.mindpet_delta_lora_a", + "model.layers.9.attention.wv.mindpet_delta_lora_b", + "model.layers.10.attention.wq.mindpet_delta_lora_a", + "model.layers.10.attention.wq.mindpet_delta_lora_b", + "model.layers.10.attention.wv.mindpet_delta_lora_a", + "model.layers.10.attention.wv.mindpet_delta_lora_b", + "model.layers.11.attention.wq.mindpet_delta_lora_a", + "model.layers.11.attention.wq.mindpet_delta_lora_b", + "model.layers.11.attention.wv.mindpet_delta_lora_a", + "model.layers.11.attention.wv.mindpet_delta_lora_b", + "model.layers.12.attention.wq.mindpet_delta_lora_a", + "model.layers.12.attention.wq.mindpet_delta_lora_b", + "model.layers.12.attention.wv.mindpet_delta_lora_a", + "model.layers.12.attention.wv.mindpet_delta_lora_b", + "model.layers.13.attention.wq.mindpet_delta_lora_a", + "model.layers.13.attention.wq.mindpet_delta_lora_b", + "model.layers.13.attention.wv.mindpet_delta_lora_a", + 
"model.layers.13.attention.wv.mindpet_delta_lora_b", + "model.layers.14.attention.wq.mindpet_delta_lora_a", + "model.layers.14.attention.wq.mindpet_delta_lora_b", + "model.layers.14.attention.wv.mindpet_delta_lora_a", + "model.layers.14.attention.wv.mindpet_delta_lora_b", + "model.layers.15.attention.wq.mindpet_delta_lora_a", + "model.layers.15.attention.wq.mindpet_delta_lora_b", + "model.layers.15.attention.wv.mindpet_delta_lora_a", + "model.layers.15.attention.wv.mindpet_delta_lora_b", + "model.layers.16.attention.wq.mindpet_delta_lora_a", + "model.layers.16.attention.wq.mindpet_delta_lora_b", + "model.layers.16.attention.wv.mindpet_delta_lora_a", + "model.layers.16.attention.wv.mindpet_delta_lora_b", + "model.layers.17.attention.wq.mindpet_delta_lora_a", + "model.layers.17.attention.wq.mindpet_delta_lora_b", + "model.layers.17.attention.wv.mindpet_delta_lora_a", + "model.layers.17.attention.wv.mindpet_delta_lora_b", + "model.layers.18.attention.wq.mindpet_delta_lora_a", + "model.layers.18.attention.wq.mindpet_delta_lora_b", + "model.layers.18.attention.wv.mindpet_delta_lora_a", + "model.layers.18.attention.wv.mindpet_delta_lora_b", + "model.layers.19.attention.wq.mindpet_delta_lora_a", + "model.layers.19.attention.wq.mindpet_delta_lora_b", + "model.layers.19.attention.wv.mindpet_delta_lora_a", + "model.layers.19.attention.wv.mindpet_delta_lora_b", + "model.layers.20.attention.wq.mindpet_delta_lora_a", + "model.layers.20.attention.wq.mindpet_delta_lora_b", + "model.layers.20.attention.wv.mindpet_delta_lora_a", + "model.layers.20.attention.wv.mindpet_delta_lora_b", + "model.layers.21.attention.wq.mindpet_delta_lora_a", + "model.layers.21.attention.wq.mindpet_delta_lora_b", + "model.layers.21.attention.wv.mindpet_delta_lora_a", + "model.layers.21.attention.wv.mindpet_delta_lora_b", + "model.layers.22.attention.wq.mindpet_delta_lora_a", + "model.layers.22.attention.wq.mindpet_delta_lora_b", + "model.layers.22.attention.wv.mindpet_delta_lora_a", + 
"model.layers.22.attention.wv.mindpet_delta_lora_b", + "model.layers.23.attention.wq.mindpet_delta_lora_a", + "model.layers.23.attention.wq.mindpet_delta_lora_b", + "model.layers.23.attention.wv.mindpet_delta_lora_a", + "model.layers.23.attention.wv.mindpet_delta_lora_b", + "model.layers.24.attention.wq.mindpet_delta_lora_a", + "model.layers.24.attention.wq.mindpet_delta_lora_b", + "model.layers.24.attention.wv.mindpet_delta_lora_a", + "model.layers.24.attention.wv.mindpet_delta_lora_b", + "model.layers.25.attention.wq.mindpet_delta_lora_a", + "model.layers.25.attention.wq.mindpet_delta_lora_b", + "model.layers.25.attention.wv.mindpet_delta_lora_a", + "model.layers.25.attention.wv.mindpet_delta_lora_b", + "model.layers.26.attention.wq.mindpet_delta_lora_a", + "model.layers.26.attention.wq.mindpet_delta_lora_b", + "model.layers.26.attention.wv.mindpet_delta_lora_a", + "model.layers.26.attention.wv.mindpet_delta_lora_b", + "model.layers.27.attention.wq.mindpet_delta_lora_a", + "model.layers.27.attention.wq.mindpet_delta_lora_b", + "model.layers.27.attention.wv.mindpet_delta_lora_a", + "model.layers.27.attention.wv.mindpet_delta_lora_b", + "model.layers.28.attention.wq.mindpet_delta_lora_a", + "model.layers.28.attention.wq.mindpet_delta_lora_b", + "model.layers.28.attention.wv.mindpet_delta_lora_a", + "model.layers.28.attention.wv.mindpet_delta_lora_b", + "model.layers.29.attention.wq.mindpet_delta_lora_a", + "model.layers.29.attention.wq.mindpet_delta_lora_b", + "model.layers.29.attention.wv.mindpet_delta_lora_a", + "model.layers.29.attention.wv.mindpet_delta_lora_b", + "model.layers.30.attention.wq.mindpet_delta_lora_a", + "model.layers.30.attention.wq.mindpet_delta_lora_b", + "model.layers.30.attention.wv.mindpet_delta_lora_a", + "model.layers.30.attention.wv.mindpet_delta_lora_b", + "model.layers.31.attention.wq.mindpet_delta_lora_a", + "model.layers.31.attention.wq.mindpet_delta_lora_b", + "model.layers.31.attention.wv.mindpet_delta_lora_a", + 
"model.layers.31.attention.wv.mindpet_delta_lora_b" + ] + } +} +2024-07-25 18:09:54,509 - mindformers[mindformers/trainer/base_trainer.py:683] - INFO - .........Build Running Wrapper From Config For Train.......... +2024-07-25 18:09:54,509 - mindformers[mindformers/trainer/base_trainer.py:496] - INFO - .........Build Model Wrapper for Train From Config.......... +2024-07-25 18:09:54,515 - mindformers[mindformers/trainer/base_trainer.py:687] - INFO - .........Build Callbacks For Train.......... +2024-07-25 18:09:54,517 - mindformers[mindformers/core/callback/callback.py:533] - INFO - Integrated_save is changed to False when using auto_parallel. +2024-07-25 18:09:54,518 - mindformers[mindformers/trainer/base_trainer.py:721] - INFO - .........Starting Init Train Model.......... +2024-07-25 18:09:54,519 - mindformers[mindformers/trainer/utils.py:736] - INFO - ............Start load checkpoint from checkpoint............ +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:29.191.906 [mindspore/train/serialization.py:1369] model.tok_embeddings.embedding_weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:35.356.784 [mindspore/train/serialization.py:1369] model.layers.0.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:35.358.757 [mindspore/train/serialization.py:1369] model.layers.0.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:35.359.285 [mindspore/train/serialization.py:1369] model.layers.0.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:35.511.926 [mindspore/train/serialization.py:1369] model.layers.0.attention.wk.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:35.572.835 [mindspore/train/serialization.py:1369] model.layers.0.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:35.647.999 [mindspore/train/serialization.py:1369] model.layers.0.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:35.911.345 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:36.494.469 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:37.682.60 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:37.748.406 [mindspore/train/serialization.py:1369] model.layers.1.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:37.749.346 [mindspore/train/serialization.py:1369] model.layers.1.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:37.749.819 [mindspore/train/serialization.py:1369] model.layers.1.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:37.928.058 [mindspore/train/serialization.py:1369] model.layers.1.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:37.998.895 [mindspore/train/serialization.py:1369] model.layers.1.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:38.628.98 [mindspore/train/serialization.py:1369] model.layers.1.attention.wo.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:38.243.809 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:38.835.638 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:39.458.054 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:40.355.33 [mindspore/train/serialization.py:1369] model.layers.2.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:40.365.10 [mindspore/train/serialization.py:1369] model.layers.2.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:40.369.90 [mindspore/train/serialization.py:1369] model.layers.2.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:40.185.555 [mindspore/train/serialization.py:1369] model.layers.2.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:40.248.163 [mindspore/train/serialization.py:1369] model.layers.2.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:40.307.997 [mindspore/train/serialization.py:1369] model.layers.2.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:40.463.810 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:41.387.37 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w2.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:41.639.323 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:42.232.163 [mindspore/train/serialization.py:1369] model.layers.3.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:42.233.116 [mindspore/train/serialization.py:1369] model.layers.3.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:42.233.596 [mindspore/train/serialization.py:1369] model.layers.3.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:42.417.732 [mindspore/train/serialization.py:1369] model.layers.3.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:42.488.095 [mindspore/train/serialization.py:1369] model.layers.3.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:42.575.464 [mindspore/train/serialization.py:1369] model.layers.3.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:42.794.329 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:43.392.228 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:44.832. [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:44.603.613 [mindspore/train/serialization.py:1369] model.layers.4.ffn_norm.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:44.604.811 [mindspore/train/serialization.py:1369] model.layers.4.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:44.605.451 [mindspore/train/serialization.py:1369] model.layers.4.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:44.781.484 [mindspore/train/serialization.py:1369] model.layers.4.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:44.850.407 [mindspore/train/serialization.py:1369] model.layers.4.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:44.906.274 [mindspore/train/serialization.py:1369] model.layers.4.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:45.691.60 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:45.644.703 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:46.245.395 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:46.866.334 [mindspore/train/serialization.py:1369] model.layers.5.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:46.867.371 [mindspore/train/serialization.py:1369] model.layers.5.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:46.868.027 [mindspore/train/serialization.py:1369] model.layers.5.attention.wq.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:47.137.029 [mindspore/train/serialization.py:1369] model.layers.5.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:47.245.875 [mindspore/train/serialization.py:1369] model.layers.5.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:47.324.960 [mindspore/train/serialization.py:1369] model.layers.5.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:47.537.968 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:48.498.854 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:49.134.440 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:49.836.864 [mindspore/train/serialization.py:1369] model.layers.6.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:49.837.811 [mindspore/train/serialization.py:1369] model.layers.6.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:49.838.335 [mindspore/train/serialization.py:1369] model.layers.6.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:50.821.0 [mindspore/train/serialization.py:1369] model.layers.6.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:50.729.18 [mindspore/train/serialization.py:1369] model.layers.6.attention.wv.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:50.153.986 [mindspore/train/serialization.py:1369] model.layers.6.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:50.375.278 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:50.986.763 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:51.681.525 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:52.266.825 [mindspore/train/serialization.py:1369] model.layers.7.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:52.268.026 [mindspore/train/serialization.py:1369] model.layers.7.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:52.268.585 [mindspore/train/serialization.py:1369] model.layers.7.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:52.463.704 [mindspore/train/serialization.py:1369] model.layers.7.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:52.531.856 [mindspore/train/serialization.py:1369] model.layers.7.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:52.600.650 [mindspore/train/serialization.py:1369] model.layers.7.attention.wo.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:52.787.373 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:53.377.581 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:54.752.4 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:54.642.970 [mindspore/train/serialization.py:1369] model.layers.8.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:54.643.937 [mindspore/train/serialization.py:1369] model.layers.8.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:54.644.502 [mindspore/train/serialization.py:1369] model.layers.8.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:54.815.569 [mindspore/train/serialization.py:1369] model.layers.8.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:54.870.999 [mindspore/train/serialization.py:1369] model.layers.8.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:54.921.646 [mindspore/train/serialization.py:1369] model.layers.8.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:55.100.245 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w1.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:55.729.322 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:56.564.428 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:57.146.034 [mindspore/train/serialization.py:1369] model.layers.9.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:57.146.943 [mindspore/train/serialization.py:1369] model.layers.9.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:57.147.477 [mindspore/train/serialization.py:1369] model.layers.9.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:57.411.804 [mindspore/train/serialization.py:1369] model.layers.9.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:57.529.016 [mindspore/train/serialization.py:1369] model.layers.9.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:57.602.721 [mindspore/train/serialization.py:1369] model.layers.9.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:57.776.576 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:58.681.858 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w2.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:59.320.704 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:59.903.708 [mindspore/train/serialization.py:1369] model.layers.10.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:59.904.876 [mindspore/train/serialization.py:1369] model.layers.10.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:11:59.905.437 [mindspore/train/serialization.py:1369] model.layers.10.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:00.757.65 [mindspore/train/serialization.py:1369] model.layers.10.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:00.147.260 [mindspore/train/serialization.py:1369] model.layers.10.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:00.222.872 [mindspore/train/serialization.py:1369] model.layers.10.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:00.447.496 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:01.310.80 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:01.699.682 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w3.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:02.302.264 [mindspore/train/serialization.py:1369] model.layers.11.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:02.303.727 [mindspore/train/serialization.py:1369] model.layers.11.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:02.304.452 [mindspore/train/serialization.py:1369] model.layers.11.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:02.484.167 [mindspore/train/serialization.py:1369] model.layers.11.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:02.563.079 [mindspore/train/serialization.py:1369] model.layers.11.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:02.609.790 [mindspore/train/serialization.py:1369] model.layers.11.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:02.785.600 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:03.369.640 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:04.542.68 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:04.659.388 [mindspore/train/serialization.py:1369] model.layers.12.ffn_norm.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:04.660.408 [mindspore/train/serialization.py:1369] model.layers.12.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:04.660.893 [mindspore/train/serialization.py:1369] model.layers.12.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:04.884.347 [mindspore/train/serialization.py:1369] model.layers.12.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:04.935.823 [mindspore/train/serialization.py:1369] model.layers.12.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:05.303.33 [mindspore/train/serialization.py:1369] model.layers.12.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:05.212.179 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:06.353.96 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:06.614.679 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:07.197.893 [mindspore/train/serialization.py:1369] model.layers.13.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:07.198.815 [mindspore/train/serialization.py:1369] model.layers.13.attention_norm.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:07.199.376 [mindspore/train/serialization.py:1369] model.layers.13.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:07.369.934 [mindspore/train/serialization.py:1369] model.layers.13.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:07.449.212 [mindspore/train/serialization.py:1369] model.layers.13.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:07.513.174 [mindspore/train/serialization.py:1369] model.layers.13.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:07.687.792 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:08.264.344 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:08.852.119 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:09.459.095 [mindspore/train/serialization.py:1369] model.layers.14.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:09.460.140 [mindspore/train/serialization.py:1369] model.layers.14.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:09.460.717 [mindspore/train/serialization.py:1369] model.layers.14.attention.wq.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:09.655.895 [mindspore/train/serialization.py:1369] model.layers.14.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:09.730.922 [mindspore/train/serialization.py:1369] model.layers.14.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:09.794.386 [mindspore/train/serialization.py:1369] model.layers.14.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:09.971.092 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:10.570.680 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:11.163.753 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:11.748.038 [mindspore/train/serialization.py:1369] model.layers.15.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:11.748.888 [mindspore/train/serialization.py:1369] model.layers.15.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:11.749.505 [mindspore/train/serialization.py:1369] model.layers.15.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:11.960.112 [mindspore/train/serialization.py:1369] model.layers.15.attention.wk.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:12.287.10 [mindspore/train/serialization.py:1369] model.layers.15.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:12.920.05 [mindspore/train/serialization.py:1369] model.layers.15.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:12.261.849 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:12.888.961 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:13.473.519 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:14.888.76 [mindspore/train/serialization.py:1369] model.layers.16.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:14.898.23 [mindspore/train/serialization.py:1369] model.layers.16.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:14.903.54 [mindspore/train/serialization.py:1369] model.layers.16.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:14.362.168 [mindspore/train/serialization.py:1369] model.layers.16.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:14.478.353 [mindspore/train/serialization.py:1369] model.layers.16.attention.wv.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:14.590.323 [mindspore/train/serialization.py:1369] model.layers.16.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:14.803.358 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:15.367.143 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:15.931.617 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:16.518.785 [mindspore/train/serialization.py:1369] model.layers.17.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:16.520.020 [mindspore/train/serialization.py:1369] model.layers.17.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:16.520.637 [mindspore/train/serialization.py:1369] model.layers.17.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:16.688.604 [mindspore/train/serialization.py:1369] model.layers.17.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:16.752.595 [mindspore/train/serialization.py:1369] model.layers.17.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:16.832.635 [mindspore/train/serialization.py:1369] model.layers.17.attention.wo.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:17.211.27 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:17.592.715 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:18.194.778 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:18.763.387 [mindspore/train/serialization.py:1369] model.layers.18.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:18.764.265 [mindspore/train/serialization.py:1369] model.layers.18.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:18.764.820 [mindspore/train/serialization.py:1369] model.layers.18.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:18.946.295 [mindspore/train/serialization.py:1369] model.layers.18.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:19.236.99 [mindspore/train/serialization.py:1369] model.layers.18.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:19.757.94 [mindspore/train/serialization.py:1369] model.layers.18.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:19.259.142 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w1.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:19.843.982 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:20.434.256 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:21.536.42 [mindspore/train/serialization.py:1369] model.layers.19.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:21.545.98 [mindspore/train/serialization.py:1369] model.layers.19.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:21.551.44 [mindspore/train/serialization.py:1369] model.layers.19.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:21.231.849 [mindspore/train/serialization.py:1369] model.layers.19.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:21.294.829 [mindspore/train/serialization.py:1369] model.layers.19.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:21.365.952 [mindspore/train/serialization.py:1369] model.layers.19.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:21.539.473 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:22.119.457 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w2.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:23.151.88 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:23.593.058 [mindspore/train/serialization.py:1369] model.layers.20.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:23.593.983 [mindspore/train/serialization.py:1369] model.layers.20.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:23.594.525 [mindspore/train/serialization.py:1369] model.layers.20.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:23.850.719 [mindspore/train/serialization.py:1369] model.layers.20.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:23.899.523 [mindspore/train/serialization.py:1369] model.layers.20.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:23.948.097 [mindspore/train/serialization.py:1369] model.layers.20.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:24.163.903 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:24.748.449 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:25.349.556 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w3.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:25.950.975 [mindspore/train/serialization.py:1369] model.layers.21.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:25.951.891 [mindspore/train/serialization.py:1369] model.layers.21.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:25.952.388 [mindspore/train/serialization.py:1369] model.layers.21.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:26.123.151 [mindspore/train/serialization.py:1369] model.layers.21.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:26.187.311 [mindspore/train/serialization.py:1369] model.layers.21.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:26.274.570 [mindspore/train/serialization.py:1369] model.layers.21.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:26.448.708 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:27.435.64 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:27.639.662 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:28.219.833 [mindspore/train/serialization.py:1369] model.layers.22.ffn_norm.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:28.220.890 [mindspore/train/serialization.py:1369] model.layers.22.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:28.221.416 [mindspore/train/serialization.py:1369] model.layers.22.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:28.423.830 [mindspore/train/serialization.py:1369] model.layers.22.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:28.519.337 [mindspore/train/serialization.py:1369] model.layers.22.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:28.602.433 [mindspore/train/serialization.py:1369] model.layers.22.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:28.773.083 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:29.357.999 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:29.953.773 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:30.543.202 [mindspore/train/serialization.py:1369] model.layers.23.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:30.544.227 [mindspore/train/serialization.py:1369] model.layers.23.attention_norm.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:30.544.711 [mindspore/train/serialization.py:1369] model.layers.23.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:30.713.609 [mindspore/train/serialization.py:1369] model.layers.23.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:30.807.804 [mindspore/train/serialization.py:1369] model.layers.23.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:30.876.397 [mindspore/train/serialization.py:1369] model.layers.23.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:31.483.28 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:31.680.349 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:32.518.049 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:33.118.666 [mindspore/train/serialization.py:1369] model.layers.24.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:33.119.709 [mindspore/train/serialization.py:1369] model.layers.24.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:33.120.362 [mindspore/train/serialization.py:1369] model.layers.24.attention.wq.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:33.299.074 [mindspore/train/serialization.py:1369] model.layers.24.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:33.390.394 [mindspore/train/serialization.py:1369] model.layers.24.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:33.435.775 [mindspore/train/serialization.py:1369] model.layers.24.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:33.619.654 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:34.235.228 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:34.906.978 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:35.515.435 [mindspore/train/serialization.py:1369] model.layers.25.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:35.516.367 [mindspore/train/serialization.py:1369] model.layers.25.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:35.516.872 [mindspore/train/serialization.py:1369] model.layers.25.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:35.723.841 [mindspore/train/serialization.py:1369] model.layers.25.attention.wk.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:35.845.735 [mindspore/train/serialization.py:1369] model.layers.25.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:35.917.410 [mindspore/train/serialization.py:1369] model.layers.25.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:36.835.19 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:36.909.859 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:37.514.056 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:38.138.579 [mindspore/train/serialization.py:1369] model.layers.26.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:38.140.218 [mindspore/train/serialization.py:1369] model.layers.26.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:38.140.787 [mindspore/train/serialization.py:1369] model.layers.26.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:38.305.265 [mindspore/train/serialization.py:1369] model.layers.26.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:38.372.511 [mindspore/train/serialization.py:1369] model.layers.26.attention.wv.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:38.457.016 [mindspore/train/serialization.py:1369] model.layers.26.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:38.630.885 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:39.234.267 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:39.833.966 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:40.416.926 [mindspore/train/serialization.py:1369] model.layers.27.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:40.417.778 [mindspore/train/serialization.py:1369] model.layers.27.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:40.418.318 [mindspore/train/serialization.py:1369] model.layers.27.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:40.583.884 [mindspore/train/serialization.py:1369] model.layers.27.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:40.630.303 [mindspore/train/serialization.py:1369] model.layers.27.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:40.675.813 [mindspore/train/serialization.py:1369] model.layers.27.attention.wo.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:40.847.114 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:41.447.151 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:42.255.98 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:42.623.443 [mindspore/train/serialization.py:1369] model.layers.28.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:42.624.351 [mindspore/train/serialization.py:1369] model.layers.28.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:42.624.855 [mindspore/train/serialization.py:1369] model.layers.28.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:42.790.290 [mindspore/train/serialization.py:1369] model.layers.28.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:42.837.662 [mindspore/train/serialization.py:1369] model.layers.28.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:42.881.942 [mindspore/train/serialization.py:1369] model.layers.28.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:43.578.06 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w1.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:43.680.842 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:44.250.320 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:44.840.414 [mindspore/train/serialization.py:1369] model.layers.29.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:44.841.359 [mindspore/train/serialization.py:1369] model.layers.29.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:44.841.819 [mindspore/train/serialization.py:1369] model.layers.29.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:45.950.9 [mindspore/train/serialization.py:1369] model.layers.29.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:45.620.30 [mindspore/train/serialization.py:1369] model.layers.29.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:45.109.401 [mindspore/train/serialization.py:1369] model.layers.29.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:45.278.854 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:45.897.084 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w2.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:46.475.705 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:47.144.292 [mindspore/train/serialization.py:1369] model.layers.30.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:47.145.220 [mindspore/train/serialization.py:1369] model.layers.30.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:47.145.715 [mindspore/train/serialization.py:1369] model.layers.30.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:47.328.055 [mindspore/train/serialization.py:1369] model.layers.30.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:47.378.883 [mindspore/train/serialization.py:1369] model.layers.30.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:47.421.820 [mindspore/train/serialization.py:1369] model.layers.30.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:47.591.588 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:48.160.971 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:48.965.566 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w3.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:49.537.064 [mindspore/train/serialization.py:1369] model.layers.31.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:49.538.080 [mindspore/train/serialization.py:1369] model.layers.31.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:49.538.627 [mindspore/train/serialization.py:1369] model.layers.31.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:49.711.399 [mindspore/train/serialization.py:1369] model.layers.31.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:49.781.671 [mindspore/train/serialization.py:1369] model.layers.31.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:49.852.585 [mindspore/train/serialization.py:1369] model.layers.31.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:50.282.01 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:50.610.415 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:51.197.755 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:51.831.708 [mindspore/train/serialization.py:1369] model.norm_out.weight is not init while load ckpt. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:12:51.832.731 [mindspore/train/serialization.py:1369] lm_head.weight is not init while load ckpt. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:13:18.704.329 [mindspore/train/serialization.py:195] The type of model.layers.0.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:13:18.709.477 [mindspore/train/serialization.py:195] The type of model.layers.0.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:13:26.996.49 [mindspore/train/serialization.py:195] The type of model.layers.1.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:13:26.103.526 [mindspore/train/serialization.py:195] The type of model.layers.1.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:13:33.485.727 [mindspore/train/serialization.py:195] The type of model.layers.2.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:13:33.489.526 [mindspore/train/serialization.py:195] The type of model.layers.2.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:13:40.803.247 [mindspore/train/serialization.py:195] The type of model.layers.3.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:13:40.807.137 [mindspore/train/serialization.py:195] The type of model.layers.3.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:13:47.962.901 [mindspore/train/serialization.py:195] The type of model.layers.4.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:13:47.967.114 [mindspore/train/serialization.py:195] The type of model.layers.4.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:13:55.155.855 [mindspore/train/serialization.py:195] The type of model.layers.5.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:13:55.159.706 [mindspore/train/serialization.py:195] The type of model.layers.5.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:14:02.251.450 [mindspore/train/serialization.py:195] The type of model.layers.6.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:14:02.255.283 [mindspore/train/serialization.py:195] The type of model.layers.6.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:14:09.896.908 [mindspore/train/serialization.py:195] The type of model.layers.7.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:14:09.901.282 [mindspore/train/serialization.py:195] The type of model.layers.7.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:14:17.429.7 [mindspore/train/serialization.py:195] The type of model.layers.8.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:14:17.830.1 [mindspore/train/serialization.py:195] The type of model.layers.8.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:14:24.251.675 [mindspore/train/serialization.py:195] The type of model.layers.9.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:14:24.255.555 [mindspore/train/serialization.py:195] The type of model.layers.9.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:14:31.407.612 [mindspore/train/serialization.py:195] The type of model.layers.10.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:14:31.411.402 [mindspore/train/serialization.py:195] The type of model.layers.10.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:14:38.492.408 [mindspore/train/serialization.py:195] The type of model.layers.11.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:14:38.496.421 [mindspore/train/serialization.py:195] The type of model.layers.11.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:14:45.943.539 [mindspore/train/serialization.py:195] The type of model.layers.12.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:14:45.947.451 [mindspore/train/serialization.py:195] The type of model.layers.12.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:14:53.911.235 [mindspore/train/serialization.py:195] The type of model.layers.13.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:14:53.915.185 [mindspore/train/serialization.py:195] The type of model.layers.13.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:15:01.830.713 [mindspore/train/serialization.py:195] The type of model.layers.14.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:15:01.834.567 [mindspore/train/serialization.py:195] The type of model.layers.14.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:15:10.407.26 [mindspore/train/serialization.py:195] The type of model.layers.15.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:15:10.447.56 [mindspore/train/serialization.py:195] The type of model.layers.15.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:15:18.804.80 [mindspore/train/serialization.py:195] The type of model.layers.16.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:15:18.843.32 [mindspore/train/serialization.py:195] The type of model.layers.16.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:15:26.121.756 [mindspore/train/serialization.py:195] The type of model.layers.17.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:15:26.125.733 [mindspore/train/serialization.py:195] The type of model.layers.17.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:15:34.792.07 [mindspore/train/serialization.py:195] The type of model.layers.18.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:15:34.832.52 [mindspore/train/serialization.py:195] The type of model.layers.18.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:15:41.987.426 [mindspore/train/serialization.py:195] The type of model.layers.19.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:15:41.991.341 [mindspore/train/serialization.py:195] The type of model.layers.19.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:15:49.891.979 [mindspore/train/serialization.py:195] The type of model.layers.20.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:15:49.895.913 [mindspore/train/serialization.py:195] The type of model.layers.20.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:15:57.791.806 [mindspore/train/serialization.py:195] The type of model.layers.21.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:15:57.795.784 [mindspore/train/serialization.py:195] The type of model.layers.21.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:16:05.887.589 [mindspore/train/serialization.py:195] The type of model.layers.22.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:16:05.891.502 [mindspore/train/serialization.py:195] The type of model.layers.22.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:16:13.877.448 [mindspore/train/serialization.py:195] The type of model.layers.23.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:16:13.881.314 [mindspore/train/serialization.py:195] The type of model.layers.23.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:16:21.815.363 [mindspore/train/serialization.py:195] The type of model.layers.24.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:16:21.819.398 [mindspore/train/serialization.py:195] The type of model.layers.24.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:16:29.907.343 [mindspore/train/serialization.py:195] The type of model.layers.25.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:16:29.911.277 [mindspore/train/serialization.py:195] The type of model.layers.25.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:16:37.888.801 [mindspore/train/serialization.py:195] The type of model.layers.26.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:16:37.892.665 [mindspore/train/serialization.py:195] The type of model.layers.26.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:16:46.371.6 [mindspore/train/serialization.py:195] The type of model.layers.27.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:16:46.780.7 [mindspore/train/serialization.py:195] The type of model.layers.27.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:16:54.151.572 [mindspore/train/serialization.py:195] The type of model.layers.28.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:16:54.155.439 [mindspore/train/serialization.py:195] The type of model.layers.28.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:17:02.731.247 [mindspore/train/serialization.py:195] The type of model.layers.29.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:17:02.737.146 [mindspore/train/serialization.py:195] The type of model.layers.29.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:17:10.894.722 [mindspore/train/serialization.py:195] The type of model.layers.30.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:17:10.898.655 [mindspore/train/serialization.py:195] The type of model.layers.30.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:17:19.173.44 [mindspore/train/serialization.py:195] The type of model.layers.31.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:17:19.214.55 [mindspore/train/serialization.py:195] The type of model.layers.31.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:17:27.226.06 [mindspore/train/serialization.py:195] The type of model.norm_out.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:17:46.685.179 [mindspore/train/serialization.py:1456] For 'load_param_into_net', 128 parameters in the 'net' are not loaded, because they are not in the 'parameter_dict', please check whether the network structure is consistent when training and loading checkpoint. 
+[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:17:46.685.673 [mindspore/train/serialization.py:1460] ['model.layers.0.attention.wq.mindpet_delta_lora_a', 'model.layers.0.attention.wq.mindpet_delta_lora_b', 'model.layers.0.attention.wv.mindpet_delta_lora_a', 'model.layers.0.attention.wv.mindpet_delta_lora_b', 'model.layers.1.attention.wq.mindpet_delta_lora_a', 'model.layers.1.attention.wq.mindpet_delta_lora_b', 'model.layers.1.attention.wv.mindpet_delta_lora_a', 'model.layers.1.attention.wv.mindpet_delta_lora_b', 'model.layers.2.attention.wq.mindpet_delta_lora_a', 'model.layers.2.attention.wq.mindpet_delta_lora_b', 'model.layers.2.attention.wv.mindpet_delta_lora_a', 'model.layers.2.attention.wv.mindpet_delta_lora_b', 'model.layers.3.attention.wq.mindpet_delta_lora_a', 'model.layers.3.attention.wq.mindpet_delta_lora_b', 'model.layers.3.attention.wv.mindpet_delta_lora_a', 'model.layers.3.attention.wv.mindpet_delta_lora_b', 'model.layers.4.attention.wq.mindpet_delta_lora_a', 'model.layers.4.attention.wq.mindpet_delta_lora_b', 'model.layers.4.attention.wv.mindpet_delta_lora_a', 'model.layers.4.attention.wv.mindpet_delta_lora_b', 'model.layers.5.attention.wq.mindpet_delta_lora_a', 'model.layers.5.attention.wq.mindpet_delta_lora_b', 'model.layers.5.attention.wv.mindpet_delta_lora_a', 'model.layers.5.attention.wv.mindpet_delta_lora_b', 'model.layers.6.attention.wq.mindpet_delta_lora_a', 'model.layers.6.attention.wq.mindpet_delta_lora_b', 'model.layers.6.attention.wv.mindpet_delta_lora_a', 'model.layers.6.attention.wv.mindpet_delta_lora_b', 'model.layers.7.attention.wq.mindpet_delta_lora_a', 'model.layers.7.attention.wq.mindpet_delta_lora_b', 'model.layers.7.attention.wv.mindpet_delta_lora_a', 'model.layers.7.attention.wv.mindpet_delta_lora_b', 'model.layers.8.attention.wq.mindpet_delta_lora_a', 'model.layers.8.attention.wq.mindpet_delta_lora_b', 'model.layers.8.attention.wv.mindpet_delta_lora_a', 'model.layers.8.attention.wv.mindpet_delta_lora_b', 
'model.layers.9.attention.wq.mindpet_delta_lora_a', 'model.layers.9.attention.wq.mindpet_delta_lora_b', 'model.layers.9.attention.wv.mindpet_delta_lora_a', 'model.layers.9.attention.wv.mindpet_delta_lora_b', 'model.layers.10.attention.wq.mindpet_delta_lora_a', 'model.layers.10.attention.wq.mindpet_delta_lora_b', 'model.layers.10.attention.wv.mindpet_delta_lora_a', 'model.layers.10.attention.wv.mindpet_delta_lora_b', 'model.layers.11.attention.wq.mindpet_delta_lora_a', 'model.layers.11.attention.wq.mindpet_delta_lora_b', 'model.layers.11.attention.wv.mindpet_delta_lora_a', 'model.layers.11.attention.wv.mindpet_delta_lora_b', 'model.layers.12.attention.wq.mindpet_delta_lora_a', 'model.layers.12.attention.wq.mindpet_delta_lora_b', 'model.layers.12.attention.wv.mindpet_delta_lora_a', 'model.layers.12.attention.wv.mindpet_delta_lora_b', 'model.layers.13.attention.wq.mindpet_delta_lora_a', 'model.layers.13.attention.wq.mindpet_delta_lora_b', 'model.layers.13.attention.wv.mindpet_delta_lora_a', 'model.layers.13.attention.wv.mindpet_delta_lora_b', 'model.layers.14.attention.wq.mindpet_delta_lora_a', 'model.layers.14.attention.wq.mindpet_delta_lora_b', 'model.layers.14.attention.wv.mindpet_delta_lora_a', 'model.layers.14.attention.wv.mindpet_delta_lora_b', 'model.layers.15.attention.wq.mindpet_delta_lora_a', 'model.layers.15.attention.wq.mindpet_delta_lora_b', 'model.layers.15.attention.wv.mindpet_delta_lora_a', 'model.layers.15.attention.wv.mindpet_delta_lora_b', 'model.layers.16.attention.wq.mindpet_delta_lora_a', 'model.layers.16.attention.wq.mindpet_delta_lora_b', 'model.layers.16.attention.wv.mindpet_delta_lora_a', 'model.layers.16.attention.wv.mindpet_delta_lora_b', 'model.layers.17.attention.wq.mindpet_delta_lora_a', 'model.layers.17.attention.wq.mindpet_delta_lora_b', 'model.layers.17.attention.wv.mindpet_delta_lora_a', 'model.layers.17.attention.wv.mindpet_delta_lora_b', 'model.layers.18.attention.wq.mindpet_delta_lora_a', 
'model.layers.18.attention.wq.mindpet_delta_lora_b', 'model.layers.18.attention.wv.mindpet_delta_lora_a', 'model.layers.18.attention.wv.mindpet_delta_lora_b', 'model.layers.19.attention.wq.mindpet_delta_lora_a', 'model.layers.19.attention.wq.mindpet_delta_lora_b', 'model.layers.19.attention.wv.mindpet_delta_lora_a', 'model.layers.19.attention.wv.mindpet_delta_lora_b', 'model.layers.20.attention.wq.mindpet_delta_lora_a', 'model.layers.20.attention.wq.mindpet_delta_lora_b', 'model.layers.20.attention.wv.mindpet_delta_lora_a', 'model.layers.20.attention.wv.mindpet_delta_lora_b', 'model.layers.21.attention.wq.mindpet_delta_lora_a', 'model.layers.21.attention.wq.mindpet_delta_lora_b', 'model.layers.21.attention.wv.mindpet_delta_lora_a', 'model.layers.21.attention.wv.mindpet_delta_lora_b', 'model.layers.22.attention.wq.mindpet_delta_lora_a', 'model.layers.22.attention.wq.mindpet_delta_lora_b', 'model.layers.22.attention.wv.mindpet_delta_lora_a', 'model.layers.22.attention.wv.mindpet_delta_lora_b', 'model.layers.23.attention.wq.mindpet_delta_lora_a', 'model.layers.23.attention.wq.mindpet_delta_lora_b', 'model.layers.23.attention.wv.mindpet_delta_lora_a', 'model.layers.23.attention.wv.mindpet_delta_lora_b', 'model.layers.24.attention.wq.mindpet_delta_lora_a', 'model.layers.24.attention.wq.mindpet_delta_lora_b', 'model.layers.24.attention.wv.mindpet_delta_lora_a', 'model.layers.24.attention.wv.mindpet_delta_lora_b', 'model.layers.25.attention.wq.mindpet_delta_lora_a', 'model.layers.25.attention.wq.mindpet_delta_lora_b', 'model.layers.25.attention.wv.mindpet_delta_lora_a', 'model.layers.25.attention.wv.mindpet_delta_lora_b', 'model.layers.26.attention.wq.mindpet_delta_lora_a', 'model.layers.26.attention.wq.mindpet_delta_lora_b', 'model.layers.26.attention.wv.mindpet_delta_lora_a', 'model.layers.26.attention.wv.mindpet_delta_lora_b', 'model.layers.27.attention.wq.mindpet_delta_lora_a', 'model.layers.27.attention.wq.mindpet_delta_lora_b', 
'model.layers.27.attention.wv.mindpet_delta_lora_a', 'model.layers.27.attention.wv.mindpet_delta_lora_b', 'model.layers.28.attention.wq.mindpet_delta_lora_a', 'model.layers.28.attention.wq.mindpet_delta_lora_b', 'model.layers.28.attention.wv.mindpet_delta_lora_a', 'model.layers.28.attention.wv.mindpet_delta_lora_b', 'model.layers.29.attention.wq.mindpet_delta_lora_a', 'model.layers.29.attention.wq.mindpet_delta_lora_b', 'model.layers.29.attention.wv.mindpet_delta_lora_a', 'model.layers.29.attention.wv.mindpet_delta_lora_b', 'model.layers.30.attention.wq.mindpet_delta_lora_a', 'model.layers.30.attention.wq.mindpet_delta_lora_b', 'model.layers.30.attention.wv.mindpet_delta_lora_a', 'model.layers.30.attention.wv.mindpet_delta_lora_b', 'model.layers.31.attention.wq.mindpet_delta_lora_a', 'model.layers.31.attention.wq.mindpet_delta_lora_b', 'model.layers.31.attention.wv.mindpet_delta_lora_a', 'model.layers.31.attention.wv.mindpet_delta_lora_b'] are not loaded. +2024-07-25 18:17:46,686 - mindformers[mindformers/trainer/utils.py:767] - INFO - Network parameters are not loaded: (['model.layers.0.attention.wq.mindpet_delta_lora_a', 'model.layers.0.attention.wq.mindpet_delta_lora_b', 'model.layers.0.attention.wv.mindpet_delta_lora_a', 'model.layers.0.attention.wv.mindpet_delta_lora_b', 'model.layers.1.attention.wq.mindpet_delta_lora_a', 'model.layers.1.attention.wq.mindpet_delta_lora_b', 'model.layers.1.attention.wv.mindpet_delta_lora_a', 'model.layers.1.attention.wv.mindpet_delta_lora_b', 'model.layers.2.attention.wq.mindpet_delta_lora_a', 'model.layers.2.attention.wq.mindpet_delta_lora_b', 'model.layers.2.attention.wv.mindpet_delta_lora_a', 'model.layers.2.attention.wv.mindpet_delta_lora_b', 'model.layers.3.attention.wq.mindpet_delta_lora_a', 'model.layers.3.attention.wq.mindpet_delta_lora_b', 'model.layers.3.attention.wv.mindpet_delta_lora_a', 'model.layers.3.attention.wv.mindpet_delta_lora_b', 'model.layers.4.attention.wq.mindpet_delta_lora_a', 
'model.layers.4.attention.wq.mindpet_delta_lora_b', 'model.layers.4.attention.wv.mindpet_delta_lora_a', 'model.layers.4.attention.wv.mindpet_delta_lora_b', 'model.layers.5.attention.wq.mindpet_delta_lora_a', 'model.layers.5.attention.wq.mindpet_delta_lora_b', 'model.layers.5.attention.wv.mindpet_delta_lora_a', 'model.layers.5.attention.wv.mindpet_delta_lora_b', 'model.layers.6.attention.wq.mindpet_delta_lora_a', 'model.layers.6.attention.wq.mindpet_delta_lora_b', 'model.layers.6.attention.wv.mindpet_delta_lora_a', 'model.layers.6.attention.wv.mindpet_delta_lora_b', 'model.layers.7.attention.wq.mindpet_delta_lora_a', 'model.layers.7.attention.wq.mindpet_delta_lora_b', 'model.layers.7.attention.wv.mindpet_delta_lora_a', 'model.layers.7.attention.wv.mindpet_delta_lora_b', 'model.layers.8.attention.wq.mindpet_delta_lora_a', 'model.layers.8.attention.wq.mindpet_delta_lora_b', 'model.layers.8.attention.wv.mindpet_delta_lora_a', 'model.layers.8.attention.wv.mindpet_delta_lora_b', 'model.layers.9.attention.wq.mindpet_delta_lora_a', 'model.layers.9.attention.wq.mindpet_delta_lora_b', 'model.layers.9.attention.wv.mindpet_delta_lora_a', 'model.layers.9.attention.wv.mindpet_delta_lora_b', 'model.layers.10.attention.wq.mindpet_delta_lora_a', 'model.layers.10.attention.wq.mindpet_delta_lora_b', 'model.layers.10.attention.wv.mindpet_delta_lora_a', 'model.layers.10.attention.wv.mindpet_delta_lora_b', 'model.layers.11.attention.wq.mindpet_delta_lora_a', 'model.layers.11.attention.wq.mindpet_delta_lora_b', 'model.layers.11.attention.wv.mindpet_delta_lora_a', 'model.layers.11.attention.wv.mindpet_delta_lora_b', 'model.layers.12.attention.wq.mindpet_delta_lora_a', 'model.layers.12.attention.wq.mindpet_delta_lora_b', 'model.layers.12.attention.wv.mindpet_delta_lora_a', 'model.layers.12.attention.wv.mindpet_delta_lora_b', 'model.layers.13.attention.wq.mindpet_delta_lora_a', 'model.layers.13.attention.wq.mindpet_delta_lora_b', 'model.layers.13.attention.wv.mindpet_delta_lora_a', 
'model.layers.13.attention.wv.mindpet_delta_lora_b', 'model.layers.14.attention.wq.mindpet_delta_lora_a', 'model.layers.14.attention.wq.mindpet_delta_lora_b', 'model.layers.14.attention.wv.mindpet_delta_lora_a', 'model.layers.14.attention.wv.mindpet_delta_lora_b', 'model.layers.15.attention.wq.mindpet_delta_lora_a', 'model.layers.15.attention.wq.mindpet_delta_lora_b', 'model.layers.15.attention.wv.mindpet_delta_lora_a', 'model.layers.15.attention.wv.mindpet_delta_lora_b', 'model.layers.16.attention.wq.mindpet_delta_lora_a', 'model.layers.16.attention.wq.mindpet_delta_lora_b', 'model.layers.16.attention.wv.mindpet_delta_lora_a', 'model.layers.16.attention.wv.mindpet_delta_lora_b', 'model.layers.17.attention.wq.mindpet_delta_lora_a', 'model.layers.17.attention.wq.mindpet_delta_lora_b', 'model.layers.17.attention.wv.mindpet_delta_lora_a', 'model.layers.17.attention.wv.mindpet_delta_lora_b', 'model.layers.18.attention.wq.mindpet_delta_lora_a', 'model.layers.18.attention.wq.mindpet_delta_lora_b', 'model.layers.18.attention.wv.mindpet_delta_lora_a', 'model.layers.18.attention.wv.mindpet_delta_lora_b', 'model.layers.19.attention.wq.mindpet_delta_lora_a', 'model.layers.19.attention.wq.mindpet_delta_lora_b', 'model.layers.19.attention.wv.mindpet_delta_lora_a', 'model.layers.19.attention.wv.mindpet_delta_lora_b', 'model.layers.20.attention.wq.mindpet_delta_lora_a', 'model.layers.20.attention.wq.mindpet_delta_lora_b', 'model.layers.20.attention.wv.mindpet_delta_lora_a', 'model.layers.20.attention.wv.mindpet_delta_lora_b', 'model.layers.21.attention.wq.mindpet_delta_lora_a', 'model.layers.21.attention.wq.mindpet_delta_lora_b', 'model.layers.21.attention.wv.mindpet_delta_lora_a', 'model.layers.21.attention.wv.mindpet_delta_lora_b', 'model.layers.22.attention.wq.mindpet_delta_lora_a', 'model.layers.22.attention.wq.mindpet_delta_lora_b', 'model.layers.22.attention.wv.mindpet_delta_lora_a', 'model.layers.22.attention.wv.mindpet_delta_lora_b', 
'model.layers.23.attention.wq.mindpet_delta_lora_a', 'model.layers.23.attention.wq.mindpet_delta_lora_b', 'model.layers.23.attention.wv.mindpet_delta_lora_a', 'model.layers.23.attention.wv.mindpet_delta_lora_b', 'model.layers.24.attention.wq.mindpet_delta_lora_a', 'model.layers.24.attention.wq.mindpet_delta_lora_b', 'model.layers.24.attention.wv.mindpet_delta_lora_a', 'model.layers.24.attention.wv.mindpet_delta_lora_b', 'model.layers.25.attention.wq.mindpet_delta_lora_a', 'model.layers.25.attention.wq.mindpet_delta_lora_b', 'model.layers.25.attention.wv.mindpet_delta_lora_a', 'model.layers.25.attention.wv.mindpet_delta_lora_b', 'model.layers.26.attention.wq.mindpet_delta_lora_a', 'model.layers.26.attention.wq.mindpet_delta_lora_b', 'model.layers.26.attention.wv.mindpet_delta_lora_a', 'model.layers.26.attention.wv.mindpet_delta_lora_b', 'model.layers.27.attention.wq.mindpet_delta_lora_a', 'model.layers.27.attention.wq.mindpet_delta_lora_b', 'model.layers.27.attention.wv.mindpet_delta_lora_a', 'model.layers.27.attention.wv.mindpet_delta_lora_b', 'model.layers.28.attention.wq.mindpet_delta_lora_a', 'model.layers.28.attention.wq.mindpet_delta_lora_b', 'model.layers.28.attention.wv.mindpet_delta_lora_a', 'model.layers.28.attention.wv.mindpet_delta_lora_b', 'model.layers.29.attention.wq.mindpet_delta_lora_a', 'model.layers.29.attention.wq.mindpet_delta_lora_b', 'model.layers.29.attention.wv.mindpet_delta_lora_a', 'model.layers.29.attention.wv.mindpet_delta_lora_b', 'model.layers.30.attention.wq.mindpet_delta_lora_a', 'model.layers.30.attention.wq.mindpet_delta_lora_b', 'model.layers.30.attention.wv.mindpet_delta_lora_a', 'model.layers.30.attention.wv.mindpet_delta_lora_b', 'model.layers.31.attention.wq.mindpet_delta_lora_a', 'model.layers.31.attention.wq.mindpet_delta_lora_b', 'model.layers.31.attention.wv.mindpet_delta_lora_a', 'model.layers.31.attention.wv.mindpet_delta_lora_b'], []) +2024-07-25 18:17:46,687 - mindformers[mindformers/trainer/base_trainer.py:770] - INFO 
- .........Starting Training Model.......... +{'auto_trans_ckpt': False, + 'auto_tune': False, + 'autotune_per_step': 10, + 'callbacks': [OrderedDict([('type', 'MFLossMonitor')]), + OrderedDict([('type', 'CheckpointMointor'), + ('prefix', 'llama3_8b'), + ('save_checkpoint_steps', 1400), + ('integrated_save', False), + ('async_save', False)]), + OrderedDict([('type', 'ObsMonitor')])], + 'context': {'device_target': 'Ascend', + 'enable_graph_kernel': False, + 'graph_kernel_flags': '--disable_expand_ops=Softmax,Dropout ' + '--enable_parallel_fusion=true ' + '--reduce_fuse_depth=8 ' + '--enable_auto_tensor_inplace=true', + 'max_call_depth': 10000, + 'runtime_num_threads': 1, + 'save_graphs': False, + 'save_graphs_path': './graph'}, + 'data_size': 1625, + 'device_num': 4, + 'do_eval': False, + 'eval_callbacks': [OrderedDict([('type', 'ObsMonitor')])], + 'eval_dataset': {'auto_tune': False, + 'autotune_per_step': 10, + 'batch_size': 32, + 'data_loader': {'dataset_dir': '', + 'shuffle': False, + 'type': 'MindDataset'}, + 'do_eval': True, + 'drop_remainder': False, + 'filepath_prefix': './autotune', + 'input_columns': ['input_ids'], + 'num_parallel_workers': 8, + 'numa_enable': False, + 'output_columns': ['input_ids'], + 'prefetch_size': 1, + 'profile': False, + 'python_multiprocessing': False, + 'repeat': 1, + 'seed': 0}, + 'eval_dataset_task': {'dataset_config': {'auto_tune': False, + 'autotune_per_step': 10, + 'batch_size': 32, + 'data_loader': {'dataset_dir': '', + 'shuffle': False, + 'type': 'MindDataset'}, + 'do_eval': True, + 'drop_remainder': False, + 'filepath_prefix': './autotune', + 'input_columns': ['input_ids'], + 'num_parallel_workers': 8, + 'numa_enable': False, + 'output_columns': ['input_ids'], + 'prefetch_size': 1, + 'profile': False, + 'python_multiprocessing': False, + 'repeat': 1, + 'seed': 0}, + 'type': 'CausalLanguageModelDataset'}, + 'filepath_prefix': './autotune', + 'init_start_profile': False, + 'layer_decay': 0.65, + 'layer_scale': False, + 
'load_checkpoint': '/home/ma-user/work/llama3-8B.ckpt', + 'local_rank': 0, + 'lr_scale_factor': 256, + 'lr_schedule': {'learning_rate': 3e-05, + 'lr_end': 1e-06, + 'total_steps': 16250, + 'type': 'CosineWithWarmUpLR', + 'warmup_steps': 1625}, + 'metric': [{'type': 'PerplexityMetric'}], + 'micro_batch_interleave_num': 1, + 'model': {'arch': {'type': 'LlamaForCausalLM'}, + 'model_config': {'batch_size': 1, + 'bos_token_id': 128000, + 'checkpoint_name_or_path': None, + 'compute_dtype': 'bfloat16', + 'do_sample': False, + 'eos_token_id': 128001, + 'extend_method': 'None', + 'fine_grain_interleave': 1, + 'hidden_size': 4096, + 'ignore_token_id': -100, + 'intermediate_size': 14336, + 'layernorm_compute_type': 'float32', + 'max_decode_length': 512, + 'n_kv_heads': 8, + 'num_heads': 32, + 'num_layers': 32, + 'offset': 0, + 'pad_token_id': 128002, + 'param_init_type': 'bfloat16', + 'pet_config': {'lora_alpha': 16, + 'lora_dropout': 0.05, + 'lora_rank': 8, + 'target_modules': '.*wq|.*wv'}, + 'repetition_penalty': 1, + 'rms_norm_eps': 1e-05, + 'rotary_dtype': 'float32', + 'scaling_factor': 1.0, + 'seq_length': 256, + 'softmax_compute_type': 'float32', + 'theta': 500000, + 'top_k': 3, + 'top_p': 1, + 'type': 'LlamaConfig', + 'use_flash_attention': True, + 'use_past': False, + 'vocab_size': 128256}}, + 'moe_config': , + 'only_save_strategy': False, + 'optimizer': {'beta1': 0.9, + 'beta2': 0.95, + 'eps': 1e-08, + 'type': 'FP32StateAdamWeightDecay'}, + 'output_dir': './output', + 'parallel': {'device_num': 4, + 'enable_alltoall': False, + 'enable_parallel_optimizer': True, + 'full_batch': True, + 'gradients_mean': False, + 'parallel_mode': 'semi_auto_parallel', + 'parallel_optimizer_config': {'gradient_accumulation_shard': False, + 'parallel_optimizer_threshold': 64}, + 'search_mode': 'sharding_propagation', + 'strategy_ckpt_config': {'only_trainable_params': False, + 'save_file': './ckpt_strategy.ckpt'}, + 'strategy_ckpt_save_file': 
'./output/strategy/ckpt_strategy_rank_0.ckpt'}, + 'parallel_config': , + 'profile': False, + 'profile_communication': False, + 'profile_memory': True, + 'profile_start_step': 4, + 'profile_stop_step': 8, + 'rank_id': 0, + 'recompute_config': , + 'remote_save_url': '', + 'resume_training': False, + 'run_mode': 'finetune', + 'runner_config': {'batch_size': 32, + 'epochs': 8125, + 'gradient_accumulation_steps': 1, + 'initial_epoch': 0, + 'initial_step': 0, + 'origin_epochs': 10, + 'sink_mode': True, + 'sink_size': 2}, + 'runner_wrapper': {'scale_sense': 1.0, + 'type': 'MFTrainOneStepCell', + 'use_clip_grad': True}, + 'seed': 0, + 'src_strategy_path_or_dir': '', + 'train_dataset': {'auto_tune': False, + 'autotune_per_step': 10, + 'batch_size': 32, + 'data_loader': {'dataset_dir': '/home/ma-user/work/train-fastchat256.mindrecord', + 'shuffle': True, + 'type': 'MindDataset'}, + 'do_eval': False, + 'drop_remainder': True, + 'filepath_prefix': './autotune', + 'input_columns': ['input_ids', 'labels'], + 'num_parallel_workers': 8, + 'numa_enable': False, + 'output_columns': ['input_ids', 'labels'], + 'prefetch_size': 1, + 'profile': False, + 'python_multiprocessing': False, + 'repeat': 1, + 'seed': 0}, + 'train_dataset_task': {'dataset_config': {'auto_tune': False, + 'autotune_per_step': 10, + 'batch_size': 32, + 'data_loader': {'dataset_dir': '/home/ma-user/work/train-fastchat256.mindrecord', + 'shuffle': True, + 'type': 'MindDataset'}, + 'do_eval': False, + 'drop_remainder': True, + 'filepath_prefix': './autotune', + 'input_columns': ['input_ids', + 'labels'], + 'num_parallel_workers': 8, + 'numa_enable': False, + 'output_columns': ['input_ids', + 'labels'], + 'prefetch_size': 1, + 'profile': False, + 'python_multiprocessing': False, + 'repeat': 1, + 'seed': 0}, + 'type': 'CausalLanguageModelDataset'}, + 'trainer': {'model_name': 'llama3_8b', + 'type': 'CausalLanguageModelingTrainer'}, + 'use_parallel': True} +2024-07-25 18:17:46,693 - 
mindformers[mindformers/trainer/base_trainer.py:773] - INFO - .........Model Compiling, Please Wait a Moment........... +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:17:46.694.223 [mindspore/train/model.py:1120] For MFLossMonitor callback, {'epoch_end', 'epoch_begin', 'step_end', 'step_begin'} methods may not be supported in later version, Use methods prefixed with 'on_train' or 'on_eval' instead when using customized callbacks. +[WARNING] ME(62173:281473455816720,MainProcess):2024-07-25-18:17:46.694.356 [mindspore/train/model.py:1120] For Local2ObsMonitor callback, {'epoch_end', 'step_end'} methods may not be supported in later version, Use methods prefixed with 'on_train' or 'on_eval' instead when using customized callbacks. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.781.629 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/31-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.782.603 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/30-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.783.450 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/29-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.784.236 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/28-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.785.085 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/27-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.785.910 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/26-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.786.678 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/25-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.787.474 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/24-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.788.243 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/23-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.788.973 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/22-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.789.769 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/21-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.790.510 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/20-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.791.218 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/19-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.791.981 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/18-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.792.749 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/17-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.793.543 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/16-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.794.332 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/15-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.795.150 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/14-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.795.999 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/13-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.796.792 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/12-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.797.709 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/11-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.798.499 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/10-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.799.309 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/9-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.800.083 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/8-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.800.815 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/7-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.801.600 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/6-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.802.400 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/5-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.803.189 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/4-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.804.014 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/3-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.804.855 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/2-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.805.700 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/1-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.806.591 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/0-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.807.202 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/0-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.808.113 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/1-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.809.033 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/2-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.810.053 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/3-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.811.451 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/4-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.813.326 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/5-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.815.795 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/6-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.818.614 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/7-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.822.519 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/8-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.823.986 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/9-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.824.912 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/10-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.825.826 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/11-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.826.669 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/12-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.827.528 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/13-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.828.281 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/14-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.829.073 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/15-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.829.890 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/16-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.830.690 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/17-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.831.504 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/18-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.832.254 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/19-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.833.034 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/20-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.833.812 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/21-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.834.621 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/22-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.835.475 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/23-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.836.328 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/24-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.837.283 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/25-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.838.274 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/26-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.839.282 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/27-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.840.231 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/28-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.841.259 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/29-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.842.164 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/30-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:18.843.142 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/31-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62173,ffffa5590010,python):2024-07-25-18:18:21.436.387 [mindspore/ccsrc/frontend/parallel/graph_util/graph_utils.cc:68] GetTensorRedistributionFromCNode] Default/network-MFTrainOneStepCell/clip_grad_norm-ClipGradNorm/Sqrt-op0 has no OperatorInfo. 
+- \ | / 2024-07-25 18:28:34,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 2/ 1625], loss: 1.518, per_step_time: 323225ms, lr: 1.8461538e-08, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:34,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 0.02475 samples/s/p 60 days, 18:49:35 } +2024-07-25 18:28:38,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 4/ 1625], loss: 1.444, per_step_time: 1583ms, lr: 5.538461e-08, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:38,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 5.05236 samples/s/p 7:08:44 } +2024-07-25 18:28:41,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 6/ 1625], loss: 1.332, per_step_time: 1472ms, lr: 9.230769e-08, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:41,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 5.43121 samples/s/p 6:38:46 } +2024-07-25 18:28:44,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 8/ 1625], loss: 1.351, per_step_time: 1479ms, lr: 1.2923077e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:44,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 5.40661 samples/s/p 6:40:32 } +2024-07-25 18:28:47,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 10/ 1625], loss: 1.390, per_step_time: 1469ms, lr: 1.6615384e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:47,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.44349 samples/s/p 6:37:47 } +2024-07-25 18:28:50,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 12/ 1625], loss: 1.383, per_step_time: 1472ms, lr: 2.0307691e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 
18:28:50,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43407 samples/s/p 6:38:25 } +2024-07-25 18:28:52,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 14/ 1625], loss: 1.447, per_step_time: 1471ms, lr: 2.4e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:52,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43848 samples/s/p 6:38:03 } +2024-07-25 18:28:55,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 16/ 1625], loss: 1.293, per_step_time: 1473ms, lr: 2.7692306e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:55,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43088 samples/s/p 6:38:33 } +2024-07-25 18:28:58,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 18/ 1625], loss: 1.406, per_step_time: 1474ms, lr: 3.1384613e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:58,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.42696 samples/s/p 6:38:47 } +2024-07-25 18:29:01,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 20/ 1625], loss: 1.348, per_step_time: 1472ms, lr: 3.5076923e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:01,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43363 samples/s/p 6:38:15 } +2024-07-25 18:29:04,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 22/ 1625], loss: 1.420, per_step_time: 1474ms, lr: 3.876923e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:04,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.42672 samples/s/p 6:38:43 } +2024-07-25 18:29:07,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 24/ 1625], loss: 
1.562, per_step_time: 1471ms, lr: 4.2461537e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:07,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43734 samples/s/p 6:37:53 } +2024-07-25 18:29:10,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 26/ 1625], loss: 1.360, per_step_time: 1471ms, lr: 4.6153846e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:10,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43704 samples/s/p 6:37:51 } +2024-07-25 18:29:13,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 28/ 1625], loss: 1.523, per_step_time: 1471ms, lr: 4.9846153e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:13,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43672 samples/s/p 6:37:50 } +2024-07-25 18:29:16,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 30/ 1625], loss: 1.471, per_step_time: 1473ms, lr: 5.3538463e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:16,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.42859 samples/s/p 6:38:23 } +2024-07-25 18:29:19,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 32/ 1625], loss: 1.504, per_step_time: 1471ms, lr: 5.7230767e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:19,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43640 samples/s/p 6:37:45 } +2024-07-25 18:29:22,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 34/ 1625], loss: 1.483, per_step_time: 1472ms, lr: 6.092307e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:22,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43407 samples/s/p 6:37:53 } +2024-07-25 18:29:25,452 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 36/ 1625], loss: 1.478, per_step_time: 1471ms, lr: 6.461538e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:25,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43732 samples/s/p 6:37:35 } +2024-07-25 18:29:28,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 38/ 1625], loss: 1.330, per_step_time: 1474ms, lr: 6.8307685e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:28,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.42612 samples/s/p 6:38:22 } +2024-07-25 18:29:31,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 40/ 1625], loss: 1.169, per_step_time: 1474ms, lr: 7.2e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:31,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.42698 samples/s/p 6:38:15 } +2024-07-25 18:29:34,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 42/ 1625], loss: 1.627, per_step_time: 1473ms, lr: 7.5692304e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:34,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.43107 samples/s/p 6:37:54 } +2024-07-25 18:29:37,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 44/ 1625], loss: 1.519, per_step_time: 1471ms, lr: 7.9384614e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:37,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.43744 samples/s/p 6:37:23 } +2024-07-25 18:29:40,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 46/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 8.307692e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:40,221 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.43129 samples/s/p 6:37:47 } +2024-07-25 18:29:43,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 48/ 1625], loss: 1.576, per_step_time: 1471ms, lr: 8.676922e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:43,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.43509 samples/s/p 6:37:27 } +2024-07-25 18:29:46,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 50/ 1625], loss: 1.361, per_step_time: 1473ms, lr: 9.046154e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:46,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.42753 samples/s/p 6:37:58 } +2024-07-25 18:29:49,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 52/ 1625], loss: 1.520, per_step_time: 1472ms, lr: 9.4153836e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:49,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.43214 samples/s/p 6:37:35 } +2024-07-25 18:29:52,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 54/ 1625], loss: 1.476, per_step_time: 1473ms, lr: 9.784615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:52,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.43077 samples/s/p 6:37:38 } +2024-07-25 18:29:54,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 56/ 1625], loss: 1.118, per_step_time: 1473ms, lr: 1.0153847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:54,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.42968 samples/s/p 6:37:39 } +2024-07-25 18:29:57,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 58/ 1625], loss: 1.420, 
per_step_time: 1473ms, lr: 1.0523077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:57,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.42795 samples/s/p 6:37:44 } +2024-07-25 18:30:00,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 60/ 1625], loss: 1.523, per_step_time: 1473ms, lr: 1.0892308e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:00,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.42775 samples/s/p 6:37:42 } +2024-07-25 18:30:03,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 62/ 1625], loss: 1.416, per_step_time: 1473ms, lr: 1.1261538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:03,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43049 samples/s/p 6:37:27 } +2024-07-25 18:30:06,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 64/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 1.1630768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:06,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43170 samples/s/p 6:37:19 } +2024-07-25 18:30:09,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 66/ 1625], loss: 1.349, per_step_time: 1472ms, lr: 1.1999999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:09,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43290 samples/s/p 6:37:11 } +2024-07-25 18:30:12,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 68/ 1625], loss: 1.436, per_step_time: 1471ms, lr: 1.236923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:12,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43663 samples/s/p 6:36:51 } +2024-07-25 18:30:15,654 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 70/ 1625], loss: 1.423, per_step_time: 1471ms, lr: 1.2738461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:15,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43803 samples/s/p 6:36:42 } +2024-07-25 18:30:18,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 72/ 1625], loss: 1.402, per_step_time: 1471ms, lr: 1.3107691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:18,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43541 samples/s/p 6:36:51 } +2024-07-25 18:30:21,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 74/ 1625], loss: 1.433, per_step_time: 1474ms, lr: 1.3476922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:21,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.42407 samples/s/p 6:37:38 } +2024-07-25 18:30:24,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 76/ 1625], loss: 1.482, per_step_time: 1472ms, lr: 1.3846154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:24,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.43182 samples/s/p 6:37:01 } +2024-07-25 18:30:27,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 78/ 1625], loss: 1.335, per_step_time: 1473ms, lr: 1.4215384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:27,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.42810 samples/s/p 6:37:14 } +2024-07-25 18:30:30,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 80/ 1625], loss: 1.323, per_step_time: 1473ms, lr: 1.4584615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:30,424 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.43008 samples/s/p 6:37:02 } +2024-07-25 18:30:33,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 82/ 1625], loss: 1.471, per_step_time: 1474ms, lr: 1.4953846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:33,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.42406 samples/s/p 6:37:26 } +2024-07-25 18:30:36,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 84/ 1625], loss: 1.493, per_step_time: 1471ms, lr: 1.5323077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:36,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.43525 samples/s/p 6:36:34 } +2024-07-25 18:30:39,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 86/ 1625], loss: 1.431, per_step_time: 1473ms, lr: 1.5692307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:39,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.42754 samples/s/p 6:37:05 } +2024-07-25 18:30:42,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 88/ 1625], loss: 1.613, per_step_time: 1471ms, lr: 1.6061538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:42,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.43720 samples/s/p 6:36:19 } +2024-07-25 18:30:45,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 90/ 1625], loss: 1.673, per_step_time: 1483ms, lr: 1.6430769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:45,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.39324 samples/s/p 6:39:30 } +2024-07-25 18:30:48,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 92/ 1625], loss: 1.348, 
per_step_time: 1471ms, lr: 1.6799999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:48,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43734 samples/s/p 6:36:13 } +2024-07-25 18:30:51,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 94/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 1.716923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:51,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43618 samples/s/p 6:36:15 } +2024-07-25 18:30:54,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 96/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 1.753846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:54,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43662 samples/s/p 6:36:10 } +2024-07-25 18:30:57,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 98/ 1625], loss: 1.372, per_step_time: 1470ms, lr: 1.7907691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:57,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43998 samples/s/p 6:35:53 } +2024-07-25 18:30:59,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 100/ 1625], loss: 1.329, per_step_time: 1471ms, lr: 1.8276922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:59,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43845 samples/s/p 6:35:56 } +2024-07-25 18:31:02,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 102/ 1625], loss: 1.413, per_step_time: 1472ms, lr: 1.8646153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:02,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43307 samples/s/p 6:36:17 } +2024-07-25 18:31:05,862 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 104/ 1625], loss: 1.332, per_step_time: 1472ms, lr: 1.9015384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:05,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43227 samples/s/p 6:36:17 } +2024-07-25 18:31:08,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 106/ 1625], loss: 1.178, per_step_time: 1474ms, lr: 1.9384615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:08,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.42694 samples/s/p 6:36:38 } +2024-07-25 18:31:11,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 108/ 1625], loss: 1.504, per_step_time: 1471ms, lr: 1.9753845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:11,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43516 samples/s/p 6:35:59 } +2024-07-25 18:31:14,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 110/ 1625], loss: 1.302, per_step_time: 1471ms, lr: 2.0123075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:14,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43716 samples/s/p 6:35:47 } +2024-07-25 18:31:17,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 112/ 1625], loss: 1.379, per_step_time: 1471ms, lr: 2.0492307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:17,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43744 samples/s/p 6:35:43 } +2024-07-25 18:31:20,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 114/ 1625], loss: 1.391, per_step_time: 1470ms, lr: 2.0861537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:20,616 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43890 samples/s/p 6:35:34 } +2024-07-25 18:31:23,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 116/ 1625], loss: 1.443, per_step_time: 1471ms, lr: 2.1230767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:23,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43653 samples/s/p 6:35:41 } +2024-07-25 18:31:26,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 118/ 1625], loss: 1.047, per_step_time: 1471ms, lr: 2.16e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:26,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43610 samples/s/p 6:35:40 } +2024-07-25 18:31:29,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 120/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.1969229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:29,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43159 samples/s/p 6:35:57 } +2024-07-25 18:31:32,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 122/ 1625], loss: 1.398, per_step_time: 1472ms, lr: 2.233846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:32,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43221 samples/s/p 6:35:51 } +2024-07-25 18:31:35,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 124/ 1625], loss: 1.370, per_step_time: 1472ms, lr: 2.270769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:35,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43413 samples/s/p 6:35:40 } +2024-07-25 18:31:38,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 126/ 1625], loss: 1.199, 
per_step_time: 1471ms, lr: 2.307692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:38,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43742 samples/s/p 6:35:23 } +2024-07-25 18:31:41,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 128/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.3446153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:41,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43553 samples/s/p 6:35:28 } +2024-07-25 18:31:44,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 130/ 1625], loss: 1.262, per_step_time: 1474ms, lr: 2.3815385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:44,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.42519 samples/s/p 6:36:10 } +2024-07-25 18:31:47,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 132/ 1625], loss: 1.332, per_step_time: 1472ms, lr: 2.4184615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:47,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43423 samples/s/p 6:35:28 } +2024-07-25 18:31:50,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 134/ 1625], loss: 1.484, per_step_time: 1472ms, lr: 2.4553847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:50,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43413 samples/s/p 6:35:25 } +2024-07-25 18:31:53,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 136/ 1625], loss: 1.322, per_step_time: 1473ms, lr: 2.4923077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:53,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.42840 samples/s/p 6:35:47 } +2024-07-25 18:31:56,044 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 138/ 1625], loss: 1.332, per_step_time: 1471ms, lr: 2.5292306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:56,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43678 samples/s/p 6:35:08 } +2024-07-25 18:31:58,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 140/ 1625], loss: 1.388, per_step_time: 1472ms, lr: 2.5661539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:58,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43379 samples/s/p 6:35:18 } +2024-07-25 18:32:01,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 142/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 2.6030768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:01,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43218 samples/s/p 6:35:22 } +2024-07-25 18:32:04,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 144/ 1625], loss: 1.342, per_step_time: 1472ms, lr: 2.6399998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:04,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43313 samples/s/p 6:35:15 } +2024-07-25 18:32:07,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 146/ 1625], loss: 1.334, per_step_time: 1472ms, lr: 2.676923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:07,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43427 samples/s/p 6:35:07 } +2024-07-25 18:32:10,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 148/ 1625], loss: 1.377, per_step_time: 1472ms, lr: 2.713846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:10,805 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43257 samples/s/p 6:35:11 } +2024-07-25 18:32:13,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 150/ 1625], loss: 1.384, per_step_time: 1470ms, lr: 2.7507692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:13,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43961 samples/s/p 6:34:38 } +2024-07-25 18:32:16,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 152/ 1625], loss: 1.442, per_step_time: 1471ms, lr: 2.7876922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:16,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43654 samples/s/p 6:34:48 } +2024-07-25 18:32:19,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 154/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 2.8246152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:19,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43401 samples/s/p 6:34:56 } +2024-07-25 18:32:22,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 156/ 1625], loss: 1.473, per_step_time: 1471ms, lr: 2.8615384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:22,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43812 samples/s/p 6:34:35 } +2024-07-25 18:32:25,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 158/ 1625], loss: 1.352, per_step_time: 1471ms, lr: 2.8984614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:25,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43579 samples/s/p 6:34:43 } +2024-07-25 18:32:28,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 160/ 1625], loss: 1.335, 
per_step_time: 1473ms, lr: 2.9353844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:28,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.42742 samples/s/p 6:35:16 } +2024-07-25 18:32:31,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 162/ 1625], loss: 1.487, per_step_time: 1472ms, lr: 2.9723076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:31,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43320 samples/s/p 6:34:48 } +2024-07-25 18:32:34,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 164/ 1625], loss: 1.285, per_step_time: 1470ms, lr: 3.0092306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:34,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43972 samples/s/p 6:34:17 } +2024-07-25 18:32:37,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 166/ 1625], loss: 1.387, per_step_time: 1472ms, lr: 3.0461536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:37,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43250 samples/s/p 6:34:45 } +2024-07-25 18:32:40,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 168/ 1625], loss: 1.343, per_step_time: 1471ms, lr: 3.0830768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:40,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43704 samples/s/p 6:34:22 } +2024-07-25 18:32:43,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 170/ 1625], loss: 1.357, per_step_time: 1473ms, lr: 3.1199997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:43,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43090 samples/s/p 6:34:46 } +2024-07-25 18:32:46,217 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 172/ 1625], loss: 1.297, per_step_time: 1472ms, lr: 3.156923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:46,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43334 samples/s/p 6:34:33 } +2024-07-25 18:32:49,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 174/ 1625], loss: 1.353, per_step_time: 1472ms, lr: 3.1938462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:49,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43181 samples/s/p 6:34:36 } +2024-07-25 18:32:52,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 176/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 3.2307692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:52,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43326 samples/s/p 6:34:27 } +2024-07-25 18:32:55,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 178/ 1625], loss: 1.353, per_step_time: 1472ms, lr: 3.2676921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:55,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43439 samples/s/p 6:34:19 } +2024-07-25 18:32:58,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 180/ 1625], loss: 1.463, per_step_time: 1471ms, lr: 3.3046153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:58,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43548 samples/s/p 6:34:12 } +2024-07-25 18:33:00,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 182/ 1625], loss: 1.410, per_step_time: 1473ms, lr: 3.3415383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:00,979 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.42925 samples/s/p 6:34:36 } +2024-07-25 18:33:03,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 184/ 1625], loss: 1.516, per_step_time: 1470ms, lr: 3.3784615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:03,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43926 samples/s/p 6:33:49 } +2024-07-25 18:33:06,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 186/ 1625], loss: 1.353, per_step_time: 1473ms, lr: 3.4153845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:06,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.42931 samples/s/p 6:34:30 } +2024-07-25 18:33:09,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 188/ 1625], loss: 1.366, per_step_time: 1472ms, lr: 3.4523075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:09,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43459 samples/s/p 6:34:04 } +2024-07-25 18:33:12,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 190/ 1625], loss: 1.327, per_step_time: 1472ms, lr: 3.4892307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:12,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43215 samples/s/p 6:34:11 } +2024-07-25 18:33:15,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 192/ 1625], loss: 1.355, per_step_time: 1473ms, lr: 3.5261537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:15,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.42777 samples/s/p 6:34:27 } +2024-07-25 18:33:18,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 194/ 1625], loss: 1.304, 
per_step_time: 1472ms, lr: 3.5630767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:18,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43231 samples/s/p 6:34:05 } +2024-07-25 18:33:21,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 196/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 3.6e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:21,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43582 samples/s/p 6:33:46 } +2024-07-25 18:33:24,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 198/ 1625], loss: 1.411, per_step_time: 1473ms, lr: 3.6369229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:24,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43056 samples/s/p 6:34:06 } +2024-07-25 18:33:27,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 200/ 1625], loss: 1.502, per_step_time: 1472ms, lr: 3.6738459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:27,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43428 samples/s/p 6:33:47 } +2024-07-25 18:33:30,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 202/ 1625], loss: 1.411, per_step_time: 1471ms, lr: 3.710769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:30,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43606 samples/s/p 6:33:37 } +2024-07-25 18:33:33,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 204/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 3.747692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:33,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.43344 samples/s/p 6:33:45 } +2024-07-25 18:33:36,403 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 206/ 1625], loss: 1.352, per_step_time: 1473ms, lr: 3.784615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:36,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.42824 samples/s/p 6:34:05 } +2024-07-25 18:33:39,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 208/ 1625], loss: 1.262, per_step_time: 1472ms, lr: 3.8215385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:39,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.43371 samples/s/p 6:33:38 } +2024-07-25 18:33:42,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 210/ 1625], loss: 1.391, per_step_time: 1473ms, lr: 3.8584612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:42,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.42982 samples/s/p 6:33:52 } +2024-07-25 18:33:45,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 212/ 1625], loss: 1.315, per_step_time: 1470ms, lr: 3.8953845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:45,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.43857 samples/s/p 6:33:11 } +2024-07-25 18:33:48,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 214/ 1625], loss: 1.257, per_step_time: 1474ms, lr: 3.932307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:48,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.42636 samples/s/p 6:34:01 } +2024-07-25 18:33:51,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 216/ 1625], loss: 1.471, per_step_time: 1470ms, lr: 3.969231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:51,161 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.44089 samples/s/p 6:32:55 } +2024-07-25 18:33:54,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 218/ 1625], loss: 1.347, per_step_time: 1473ms, lr: 4.0061536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:54,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.42792 samples/s/p 6:33:48 } +2024-07-25 18:33:57,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 220/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 4.043077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:57,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43741 samples/s/p 6:33:04 } +2024-07-25 18:34:00,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 222/ 1625], loss: 1.240, per_step_time: 1474ms, lr: 4.0799996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:00,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.42601 samples/s/p 6:33:51 } +2024-07-25 18:34:02,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 224/ 1625], loss: 1.427, per_step_time: 1471ms, lr: 4.116923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:02,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43699 samples/s/p 6:33:00 } +2024-07-25 18:34:05,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 226/ 1625], loss: 1.358, per_step_time: 1471ms, lr: 4.153846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:05,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43694 samples/s/p 6:32:57 } +2024-07-25 18:34:08,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 228/ 1625], loss: 1.477, 
per_step_time: 1471ms, lr: 4.1907692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:08,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43624 samples/s/p 6:32:58 } +2024-07-25 18:34:11,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 230/ 1625], loss: 1.229, per_step_time: 1474ms, lr: 4.227692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:11,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.42593 samples/s/p 6:33:39 } +2024-07-25 18:34:14,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 232/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 4.264615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:14,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43282 samples/s/p 6:33:07 } +2024-07-25 18:34:17,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 234/ 1625], loss: 1.391, per_step_time: 1472ms, lr: 4.301538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:17,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43216 samples/s/p 6:33:06 } +2024-07-25 18:34:20,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 236/ 1625], loss: 1.328, per_step_time: 1475ms, lr: 4.338461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:20,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.42331 samples/s/p 6:33:42 } +2024-07-25 18:34:23,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 238/ 1625], loss: 1.468, per_step_time: 1472ms, lr: 4.375385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:23,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43424 samples/s/p 6:32:52 } +2024-07-25 18:34:26,592 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 240/ 1625], loss: 1.321, per_step_time: 1472ms, lr: 4.4123076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:26,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43441 samples/s/p 6:32:48 } +2024-07-25 18:34:29,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 242/ 1625], loss: 1.520, per_step_time: 1475ms, lr: 4.449231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:29,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.42277 samples/s/p 6:33:35 } +2024-07-25 18:34:32,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 244/ 1625], loss: 1.365, per_step_time: 1473ms, lr: 4.4861536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:32,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.42931 samples/s/p 6:33:04 } +2024-07-25 18:34:35,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 246/ 1625], loss: 1.449, per_step_time: 1473ms, lr: 4.5230768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:35,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43066 samples/s/p 6:32:55 } +2024-07-25 18:34:38,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 248/ 1625], loss: 1.269, per_step_time: 1471ms, lr: 4.5599995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:38,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43821 samples/s/p 6:32:20 } +2024-07-25 18:34:41,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 250/ 1625], loss: 1.362, per_step_time: 1473ms, lr: 4.596923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:41,361 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43019 samples/s/p 6:32:51 } +2024-07-25 18:34:44,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 252/ 1625], loss: 1.268, per_step_time: 1471ms, lr: 4.633846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:44,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43541 samples/s/p 6:32:26 } +2024-07-25 18:34:47,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 254/ 1625], loss: 1.380, per_step_time: 1472ms, lr: 4.670769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:47,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43181 samples/s/p 6:32:39 } +2024-07-25 18:34:50,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 256/ 1625], loss: 1.206, per_step_time: 1469ms, lr: 4.707692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:50,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.44299 samples/s/p 6:31:47 } +2024-07-25 18:34:53,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 258/ 1625], loss: 1.435, per_step_time: 1472ms, lr: 4.744615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:53,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43464 samples/s/p 6:32:20 } +2024-07-25 18:34:56,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 260/ 1625], loss: 1.525, per_step_time: 1471ms, lr: 4.7815383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:56,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43777 samples/s/p 6:32:04 } +2024-07-25 18:34:59,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 262/ 1625], loss: 1.477, 
per_step_time: 1472ms, lr: 4.8184615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:59,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43164 samples/s/p 6:32:27 } +2024-07-25 18:35:02,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 264/ 1625], loss: 1.081, per_step_time: 1473ms, lr: 4.8553843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:02,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43106 samples/s/p 6:32:27 } +2024-07-25 18:35:04,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 266/ 1625], loss: 1.357, per_step_time: 1472ms, lr: 4.8923075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:04,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43312 samples/s/p 6:32:15 } +2024-07-25 18:35:07,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 268/ 1625], loss: 1.425, per_step_time: 1472ms, lr: 4.9292303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:07,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43144 samples/s/p 6:32:19 } +2024-07-25 18:35:10,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 270/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 4.9661535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:10,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43540 samples/s/p 6:31:59 } +2024-07-25 18:35:13,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 272/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 5.0030767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:13,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43467 samples/s/p 6:32:00 } +2024-07-25 18:35:16,776 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 274/ 1625], loss: 1.197, per_step_time: 1473ms, lr: 5.04e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:16,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.42989 samples/s/p 6:32:17 } +2024-07-25 18:35:19,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 276/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 5.0769227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:19,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43627 samples/s/p 6:31:47 } +2024-07-25 18:35:22,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 278/ 1625], loss: 1.270, per_step_time: 1475ms, lr: 5.113846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:22,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.42365 samples/s/p 6:32:39 } +2024-07-25 18:35:25,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 280/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 5.150769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:25,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43536 samples/s/p 6:31:45 } +2024-07-25 18:35:28,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 282/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 5.187692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:28,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43581 samples/s/p 6:31:40 } +2024-07-25 18:35:31,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 284/ 1625], loss: 1.393, per_step_time: 1471ms, lr: 5.2246155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:31,538 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43487 samples/s/p 6:31:41 } +2024-07-25 18:35:34,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 286/ 1625], loss: 1.344, per_step_time: 1471ms, lr: 5.2615383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:34,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43676 samples/s/p 6:31:30 } +2024-07-25 18:35:37,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 288/ 1625], loss: 1.358, per_step_time: 1471ms, lr: 5.2984615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:37,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43708 samples/s/p 6:31:26 } +2024-07-25 18:35:40,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 290/ 1625], loss: 1.326, per_step_time: 1471ms, lr: 5.3353842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:40,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43573 samples/s/p 6:31:29 } +2024-07-25 18:35:43,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 292/ 1625], loss: 1.333, per_step_time: 1473ms, lr: 5.3723074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:43,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.42760 samples/s/p 6:32:01 } +2024-07-25 18:35:46,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 294/ 1625], loss: 1.196, per_step_time: 1474ms, lr: 5.4092307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:46,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.42675 samples/s/p 6:32:02 } +2024-07-25 18:35:49,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 296/ 1625], loss: 1.371, 
per_step_time: 1472ms, lr: 5.446154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:49,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43360 samples/s/p 6:31:29 } +2024-07-25 18:35:52,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 298/ 1625], loss: 1.318, per_step_time: 1472ms, lr: 5.4830766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:52,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43320 samples/s/p 6:31:28 } +2024-07-25 18:35:55,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 300/ 1625], loss: 1.461, per_step_time: 1473ms, lr: 5.52e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:55,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.42934 samples/s/p 6:31:41 } +2024-07-25 18:35:58,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 302/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 5.5569226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:58,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43818 samples/s/p 6:31:00 } +2024-07-25 18:36:01,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 304/ 1625], loss: 1.507, per_step_time: 1472ms, lr: 5.593846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:01,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43369 samples/s/p 6:31:17 } +2024-07-25 18:36:04,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 306/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 5.630769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:04,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43702 samples/s/p 6:30:59 } +2024-07-25 18:36:06,956 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 308/ 1625], loss: 1.269, per_step_time: 1471ms, lr: 5.667692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:06,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43778 samples/s/p 6:30:53 } +2024-07-25 18:36:09,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 310/ 1625], loss: 1.369, per_step_time: 1471ms, lr: 5.704615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:09,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43607 samples/s/p 6:30:58 } +2024-07-25 18:36:12,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 312/ 1625], loss: 1.359, per_step_time: 1473ms, lr: 5.741538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:12,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43106 samples/s/p 6:31:16 } +2024-07-25 18:36:15,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 314/ 1625], loss: 1.310, per_step_time: 1471ms, lr: 5.778461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:15,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43747 samples/s/p 6:30:46 } +2024-07-25 18:36:18,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 316/ 1625], loss: 1.264, per_step_time: 1471ms, lr: 5.8153846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:18,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43829 samples/s/p 6:30:39 } +2024-07-25 18:36:21,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 318/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 5.8523074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:21,709 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.43653 samples/s/p 6:30:44 } +2024-07-25 18:36:24,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 320/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 5.8892306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:24,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.43415 samples/s/p 6:30:51 } +2024-07-25 18:36:27,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 322/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 5.926154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:27,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.43175 samples/s/p 6:30:59 } +2024-07-25 18:36:30,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 324/ 1625], loss: 1.425, per_step_time: 1470ms, lr: 5.9630765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:30,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.43973 samples/s/p 6:30:21 } +2024-07-25 18:36:33,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 326/ 1625], loss: 1.305, per_step_time: 1470ms, lr: 5.9999998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:33,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.43950 samples/s/p 6:30:19 } +2024-07-25 18:36:36,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 328/ 1625], loss: 1.466, per_step_time: 1472ms, lr: 6.036923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:36,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.43332 samples/s/p 6:30:43 } +2024-07-25 18:36:39,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 330/ 1625], loss: 1.211, 
per_step_time: 1471ms, lr: 6.073846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:39,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.43665 samples/s/p 6:30:26 } +2024-07-25 18:36:42,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 332/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 6.110769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:42,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.43201 samples/s/p 6:30:43 } +2024-07-25 18:36:45,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 334/ 1625], loss: 1.356, per_step_time: 1472ms, lr: 6.147692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:45,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43274 samples/s/p 6:30:37 } +2024-07-25 18:36:48,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 336/ 1625], loss: 1.280, per_step_time: 1472ms, lr: 6.184615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:48,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43111 samples/s/p 6:30:41 } +2024-07-25 18:36:51,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 338/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 6.221538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:51,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43757 samples/s/p 6:30:10 } +2024-07-25 18:36:54,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 340/ 1625], loss: 1.328, per_step_time: 1473ms, lr: 6.2584613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:54,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.42807 samples/s/p 6:30:48 } +2024-07-25 18:36:57,123 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 342/ 1625], loss: 1.366, per_step_time: 1470ms, lr: 6.2953845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:57,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43893 samples/s/p 6:29:58 } +2024-07-25 18:37:00,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 344/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 6.3323073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:00,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43189 samples/s/p 6:30:26 } +2024-07-25 18:37:03,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 346/ 1625], loss: 1.202, per_step_time: 1473ms, lr: 6.3692305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:03,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43032 samples/s/p 6:30:29 } +2024-07-25 18:37:05,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 348/ 1625], loss: 1.302, per_step_time: 1472ms, lr: 6.4061533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:05,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43244 samples/s/p 6:30:17 } +2024-07-25 18:37:08,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 350/ 1625], loss: 1.340, per_step_time: 1471ms, lr: 6.443077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:08,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43701 samples/s/p 6:29:55 } +2024-07-25 18:37:11,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 352/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 6.4799997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:11,884 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43354 samples/s/p 6:30:07 } +2024-07-25 18:37:14,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 354/ 1625], loss: 1.081, per_step_time: 1474ms, lr: 6.516923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:14,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.42734 samples/s/p 6:30:31 } +2024-07-25 18:37:17,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 356/ 1625], loss: 1.244, per_step_time: 1470ms, lr: 6.5538457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:17,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43907 samples/s/p 6:29:37 } +2024-07-25 18:37:20,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 358/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 6.590769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:20,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43374 samples/s/p 6:29:57 } +2024-07-25 18:37:23,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 360/ 1625], loss: 1.308, per_step_time: 1474ms, lr: 6.6276916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:23,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.42590 samples/s/p 6:30:28 } +2024-07-25 18:37:26,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 362/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 6.6646153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:26,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43672 samples/s/p 6:29:38 } +2024-07-25 18:37:29,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 364/ 1625], loss: 
1.370, per_step_time: 1474ms, lr: 6.7015385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:29,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.42632 samples/s/p 6:30:20 } +2024-07-25 18:37:32,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 366/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 6.7384613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:32,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43926 samples/s/p 6:29:22 } +2024-07-25 18:37:35,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 368/ 1625], loss: 1.162, per_step_time: 1473ms, lr: 6.7753845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:35,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.42757 samples/s/p 6:30:09 } +2024-07-25 18:37:38,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 370/ 1625], loss: 1.162, per_step_time: 1470ms, lr: 6.812307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:38,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43952 samples/s/p 6:29:15 } +2024-07-25 18:37:41,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 372/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 6.8492304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:41,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43683 samples/s/p 6:29:23 } +2024-07-25 18:37:44,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 374/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 6.8861536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:44,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43601 samples/s/p 6:29:24 } +2024-07-25 
18:37:47,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 376/ 1625], loss: 1.060, per_step_time: 1471ms, lr: 6.923077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:47,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43777 samples/s/p 6:29:13 } +2024-07-25 18:37:50,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 378/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 6.9599996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:50,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43602 samples/s/p 6:29:18 } +2024-07-25 18:37:53,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 380/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 6.996923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:53,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43704 samples/s/p 6:29:10 } +2024-07-25 18:37:56,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 382/ 1625], loss: 1.285, per_step_time: 1473ms, lr: 7.0338456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:56,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.42981 samples/s/p 6:29:39 } +2024-07-25 18:37:59,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 384/ 1625], loss: 1.384, per_step_time: 1473ms, lr: 7.0707692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:59,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.42880 samples/s/p 6:29:40 } +2024-07-25 18:38:02,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 386/ 1625], loss: 1.272, per_step_time: 1474ms, lr: 7.107692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:02,069 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.42413 samples/s/p 6:29:57 } +2024-07-25 18:38:05,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 388/ 1625], loss: 1.170, per_step_time: 1483ms, lr: 7.144615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:05,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.39142 samples/s/p 6:32:16 } +2024-07-25 18:38:07,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 390/ 1625], loss: 1.440, per_step_time: 1471ms, lr: 7.181538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:07,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.43687 samples/s/p 6:28:56 } +2024-07-25 18:38:10,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 392/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 7.218461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:10,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.43733 samples/s/p 6:28:52 } +2024-07-25 18:38:13,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 394/ 1625], loss: 1.288, per_step_time: 1473ms, lr: 7.255384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:13,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.42974 samples/s/p 6:29:21 } +2024-07-25 18:38:16,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 396/ 1625], loss: 1.116, per_step_time: 1473ms, lr: 7.2923076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:16,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.42894 samples/s/p 6:29:22 } +2024-07-25 18:38:19,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 398/ 1625], loss: 
1.331, per_step_time: 1470ms, lr: 7.3292304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:19,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.44045 samples/s/p 6:28:29 } +2024-07-25 18:38:22,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 400/ 1625], loss: 1.191, per_step_time: 1473ms, lr: 7.3661536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:22,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43016 samples/s/p 6:29:11 } +2024-07-25 18:38:25,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 402/ 1625], loss: 1.334, per_step_time: 1474ms, lr: 7.4030763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:25,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.42438 samples/s/p 6:29:32 } +2024-07-25 18:38:28,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 404/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 7.4399995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:28,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43541 samples/s/p 6:28:42 } +2024-07-25 18:38:31,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 406/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 7.4769227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:31,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43995 samples/s/p 6:28:20 } +2024-07-25 18:38:34,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 408/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 7.5138464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:34,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43341 samples/s/p 6:28:45 } +2024-07-25 
18:38:37,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 410/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 7.5507687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:37,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43353 samples/s/p 6:28:41 } +2024-07-25 18:38:40,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 412/ 1625], loss: 1.337, per_step_time: 1471ms, lr: 7.587692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:40,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43650 samples/s/p 6:28:26 } +2024-07-25 18:38:43,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 414/ 1625], loss: 1.223, per_step_time: 1470ms, lr: 7.624615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:43,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43906 samples/s/p 6:28:12 } +2024-07-25 18:38:46,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 416/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 7.661539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:46,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.43966 samples/s/p 6:28:06 } +2024-07-25 18:38:49,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 418/ 1625], loss: 1.314, per_step_time: 1470ms, lr: 7.698461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:49,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.44130 samples/s/p 6:27:56 } +2024-07-25 18:38:52,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 420/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 7.735384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:52,256 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.43634 samples/s/p 6:28:15 } +2024-07-25 18:38:55,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 422/ 1625], loss: 1.208, per_step_time: 1470ms, lr: 7.772307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:55,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.44133 samples/s/p 6:27:50 } +2024-07-25 18:38:58,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 424/ 1625], loss: 1.187, per_step_time: 1474ms, lr: 7.809231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:58,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.42428 samples/s/p 6:29:00 } +2024-07-25 18:39:01,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 426/ 1625], loss: 1.136, per_step_time: 1476ms, lr: 7.8461535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:01,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.41663 samples/s/p 6:29:30 } +2024-07-25 18:39:04,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 428/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 7.883076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:04,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.43210 samples/s/p 6:28:21 } +2024-07-25 18:39:07,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 430/ 1625], loss: 1.191, per_step_time: 1469ms, lr: 7.92e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:07,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.44227 samples/s/p 6:27:35 } +2024-07-25 18:39:09,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 432/ 1625], loss: 1.374, 
per_step_time: 1472ms, lr: 7.956923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:09,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43153 samples/s/p 6:28:18 } +2024-07-25 18:39:12,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 434/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 7.993845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:12,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43846 samples/s/p 6:27:45 } +2024-07-25 18:39:15,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 436/ 1625], loss: 1.290, per_step_time: 1469ms, lr: 8.030769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:15,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.44241 samples/s/p 6:27:25 } +2024-07-25 18:39:18,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 438/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 8.067692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:18,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43296 samples/s/p 6:28:03 } +2024-07-25 18:39:21,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 440/ 1625], loss: 1.366, per_step_time: 1471ms, lr: 8.1046155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:21,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43595 samples/s/p 6:27:47 } +2024-07-25 18:39:24,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 442/ 1625], loss: 1.638, per_step_time: 1472ms, lr: 8.141537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:24,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43475 samples/s/p 6:27:49 } +2024-07-25 18:39:27,675 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 444/ 1625], loss: 1.360, per_step_time: 1471ms, lr: 8.178461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:27,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43797 samples/s/p 6:27:32 } +2024-07-25 18:39:30,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 446/ 1625], loss: 1.360, per_step_time: 1471ms, lr: 8.215385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:30,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43737 samples/s/p 6:27:32 } +2024-07-25 18:39:33,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 448/ 1625], loss: 1.467, per_step_time: 1472ms, lr: 8.252307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:33,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.43167 samples/s/p 6:27:53 } +2024-07-25 18:39:36,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 450/ 1625], loss: 1.318, per_step_time: 1473ms, lr: 8.289231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:36,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.42891 samples/s/p 6:28:02 } +2024-07-25 18:39:39,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 452/ 1625], loss: 1.272, per_step_time: 1470ms, lr: 8.326153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:39,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.44116 samples/s/p 6:27:07 } +2024-07-25 18:39:42,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 454/ 1625], loss: 1.189, per_step_time: 1470ms, lr: 8.363077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:42,451 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.43988 samples/s/p 6:27:09 } +2024-07-25 18:39:45,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 456/ 1625], loss: 1.150, per_step_time: 1472ms, lr: 8.399999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:45,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.43335 samples/s/p 6:27:34 } +2024-07-25 18:39:48,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 458/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 8.436923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:48,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.42871 samples/s/p 6:27:51 } +2024-07-25 18:39:51,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 460/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 8.473846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:51,310 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.43456 samples/s/p 6:27:23 } +2024-07-25 18:39:54,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 462/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 8.510769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:54,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.43172 samples/s/p 6:27:33 } +2024-07-25 18:39:57,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 464/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 8.547692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:57,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43803 samples/s/p 6:27:03 } +2024-07-25 18:40:00,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 466/ 1625], loss: 1.266, 
per_step_time: 1471ms, lr: 8.584615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:00,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43724 samples/s/p 6:27:03 } +2024-07-25 18:40:03,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 468/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 8.621538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:03,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43678 samples/s/p 6:27:02 } +2024-07-25 18:40:06,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 470/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 8.658461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:06,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43662 samples/s/p 6:27:00 } +2024-07-25 18:40:09,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 472/ 1625], loss: 1.276, per_step_time: 1472ms, lr: 8.695384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:09,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43444 samples/s/p 6:27:06 } +2024-07-25 18:40:11,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 474/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 8.732308e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:11,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43540 samples/s/p 6:26:59 } +2024-07-25 18:40:14,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 476/ 1625], loss: 1.107, per_step_time: 1475ms, lr: 8.76923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:14,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.42091 samples/s/p 6:27:58 } +2024-07-25 18:40:17,877 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 478/ 1625], loss: 1.351, per_step_time: 1473ms, lr: 8.806153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:17,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.42958 samples/s/p 6:27:18 } +2024-07-25 18:40:20,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 480/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 8.843077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:20,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.44059 samples/s/p 6:26:28 } +2024-07-25 18:40:23,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 482/ 1625], loss: 1.300, per_step_time: 1472ms, lr: 8.88e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:23,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43180 samples/s/p 6:27:03 } +2024-07-25 18:40:26,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 484/ 1625], loss: 1.342, per_step_time: 1476ms, lr: 8.9169225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:26,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.41673 samples/s/p 6:28:04 } +2024-07-25 18:40:29,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 486/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 8.953845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:29,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43753 samples/s/p 6:26:32 } +2024-07-25 18:40:32,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 488/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 8.990769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:32,641 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43172 samples/s/p 6:26:54 } +2024-07-25 18:40:35,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 490/ 1625], loss: 1.332, per_step_time: 1471ms, lr: 9.027692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:35,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43801 samples/s/p 6:26:24 } +2024-07-25 18:40:38,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 492/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 9.064615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:38,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43273 samples/s/p 6:26:44 } +2024-07-25 18:40:41,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 494/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 9.101538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:41,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43494 samples/s/p 6:26:32 } +2024-07-25 18:40:44,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 496/ 1625], loss: 1.359, per_step_time: 1471ms, lr: 9.138461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:44,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43791 samples/s/p 6:26:16 } +2024-07-25 18:40:47,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 498/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 9.175385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:47,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43222 samples/s/p 6:26:37 } +2024-07-25 18:40:50,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 500/ 1625], loss: 1.235, 
per_step_time: 1471ms, lr: 9.212307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:50,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43505 samples/s/p 6:26:22 } +2024-07-25 18:40:53,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 502/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 9.24923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:53,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43286 samples/s/p 6:26:29 } +2024-07-25 18:40:56,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 504/ 1625], loss: 1.320, per_step_time: 1472ms, lr: 9.286154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:56,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43169 samples/s/p 6:26:31 } +2024-07-25 18:40:59,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 506/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 9.3230765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:59,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43296 samples/s/p 6:26:22 } +2024-07-25 18:41:02,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 508/ 1625], loss: 1.198, per_step_time: 1470ms, lr: 9.36e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:02,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43947 samples/s/p 6:25:52 } +2024-07-25 18:41:05,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 510/ 1625], loss: 1.300, per_step_time: 1471ms, lr: 9.396922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:05,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43729 samples/s/p 6:25:58 } +2024-07-25 18:41:08,048 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 512/ 1625], loss: 1.089, per_step_time: 1469ms, lr: 9.433846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:08,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.44268 samples/s/p 6:25:32 } +2024-07-25 18:41:11,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 514/ 1625], loss: 1.214, per_step_time: 1474ms, lr: 9.470769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:11,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.42559 samples/s/p 6:26:42 } +2024-07-25 18:41:13,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 516/ 1625], loss: 1.314, per_step_time: 1480ms, lr: 9.507692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:13,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.40333 samples/s/p 6:28:15 } +2024-07-25 18:41:16,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 518/ 1625], loss: 1.171, per_step_time: 1470ms, lr: 9.544615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:16,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.43989 samples/s/p 6:25:35 } +2024-07-25 18:41:19,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 520/ 1625], loss: 1.191, per_step_time: 1475ms, lr: 9.581538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:19,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.42074 samples/s/p 6:26:54 } +2024-07-25 18:41:22,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 522/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 9.618461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:22,832 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.43376 samples/s/p 6:25:55 } +2024-07-25 18:41:25,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 524/ 1625], loss: 0.990, per_step_time: 1471ms, lr: 9.655385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:25,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.43589 samples/s/p 6:25:43 } +2024-07-25 18:41:28,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 526/ 1625], loss: 1.433, per_step_time: 1471ms, lr: 9.692307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:28,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.43531 samples/s/p 6:25:43 } +2024-07-25 18:41:31,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 528/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 9.72923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:31,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.43949 samples/s/p 6:25:22 } +2024-07-25 18:41:34,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 530/ 1625], loss: 1.409, per_step_time: 1470ms, lr: 9.766153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:34,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43860 samples/s/p 6:25:23 } +2024-07-25 18:41:37,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 532/ 1625], loss: 1.187, per_step_time: 1470ms, lr: 9.803077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:37,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43964 samples/s/p 6:25:16 } +2024-07-25 18:41:40,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 534/ 1625], loss: 1.323, 
per_step_time: 1470ms, lr: 9.839999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:40,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.44173 samples/s/p 6:25:04 } +2024-07-25 18:41:43,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 536/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 9.876922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:43,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43580 samples/s/p 6:25:26 } +2024-07-25 18:41:46,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 538/ 1625], loss: 1.332, per_step_time: 1472ms, lr: 9.913846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:46,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43341 samples/s/p 6:25:33 } +2024-07-25 18:41:49,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 540/ 1625], loss: 1.340, per_step_time: 1471ms, lr: 9.950769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:49,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43770 samples/s/p 6:25:12 } +2024-07-25 18:41:52,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 542/ 1625], loss: 1.315, per_step_time: 1475ms, lr: 9.9876925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:52,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.42356 samples/s/p 6:26:10 } +2024-07-25 18:41:55,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 544/ 1625], loss: 1.386, per_step_time: 1472ms, lr: 1.0024614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:55,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43287 samples/s/p 6:25:27 } +2024-07-25 18:41:58,242 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 546/ 1625], loss: 1.357, per_step_time: 1472ms, lr: 1.0061538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:58,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43150 samples/s/p 6:25:30 } +2024-07-25 18:42:01,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 548/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 1.0098462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:01,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43299 samples/s/p 6:25:20 } +2024-07-25 18:42:04,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 550/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 1.0135384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:04,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43381 samples/s/p 6:25:14 } +2024-07-25 18:42:07,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 552/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 1.0172307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:07,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43618 samples/s/p 6:25:01 } +2024-07-25 18:42:10,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 554/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 1.020923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:10,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43521 samples/s/p 6:25:02 } +2024-07-25 18:42:13,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 556/ 1625], loss: 1.024, per_step_time: 1473ms, lr: 1.0246154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:13,000 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.42973 samples/s/p 6:25:23 } +2024-07-25 18:42:15,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 558/ 1625], loss: 1.404, per_step_time: 1472ms, lr: 1.0283077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:15,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43340 samples/s/p 6:25:04 } +2024-07-25 18:42:18,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 560/ 1625], loss: 1.367, per_step_time: 1472ms, lr: 1.0319999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:18,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43203 samples/s/p 6:25:07 } +2024-07-25 18:42:21,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 562/ 1625], loss: 1.342, per_step_time: 1472ms, lr: 1.0356923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:21,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43394 samples/s/p 6:24:56 } +2024-07-25 18:42:24,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 564/ 1625], loss: 1.162, per_step_time: 1470ms, lr: 1.03938455e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:24,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.44036 samples/s/p 6:24:26 } +2024-07-25 18:42:27,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 566/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 1.0430769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:27,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43920 samples/s/p 6:24:28 } +2024-07-25 18:42:30,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 568/ 1625], loss: 
1.177, per_step_time: 1471ms, lr: 1.0467691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:30,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43694 samples/s/p 6:24:34 } +2024-07-25 18:42:33,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 570/ 1625], loss: 1.408, per_step_time: 1472ms, lr: 1.0504615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:33,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43230 samples/s/p 6:24:51 } +2024-07-25 18:42:36,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 572/ 1625], loss: 1.139, per_step_time: 1473ms, lr: 1.0541538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:36,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.42795 samples/s/p 6:25:07 } +2024-07-25 18:42:39,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 574/ 1625], loss: 1.327, per_step_time: 1472ms, lr: 1.0578461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:39,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43320 samples/s/p 6:24:41 } +2024-07-25 18:42:42,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 576/ 1625], loss: 1.260, per_step_time: 1474ms, lr: 1.0615384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:42,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.42614 samples/s/p 6:25:08 } +2024-07-25 18:42:45,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 578/ 1625], loss: 1.248, per_step_time: 1475ms, lr: 1.0652307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:45,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.42332 samples/s/p 6:25:17 } +2024-07-25 
18:42:48,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 580/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.068923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:48,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43430 samples/s/p 6:24:28 } +2024-07-25 18:42:51,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 582/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 1.0726154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:51,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43430 samples/s/p 6:24:25 } +2024-07-25 18:42:54,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 584/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 1.0763077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:54,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43428 samples/s/p 6:24:22 } +2024-07-25 18:42:57,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 586/ 1625], loss: 1.369, per_step_time: 1471ms, lr: 1.07999995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:57,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43806 samples/s/p 6:24:03 } +2024-07-25 18:43:00,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 588/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.0836922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:00,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43680 samples/s/p 6:24:05 } +2024-07-25 18:43:03,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 590/ 1625], loss: 1.279, per_step_time: 1473ms, lr: 1.0873846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:03,184 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.42952 samples/s/p 6:24:33 } +2024-07-25 18:43:06,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 592/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 1.091077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:06,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43578 samples/s/p 6:24:04 } +2024-07-25 18:43:09,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 594/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 1.0947691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:09,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43265 samples/s/p 6:24:14 } +2024-07-25 18:43:12,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 596/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 1.0984615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:12,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.42906 samples/s/p 6:24:26 } +2024-07-25 18:43:14,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 598/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 1.1021538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:14,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43453 samples/s/p 6:24:00 } +2024-07-25 18:43:17,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 600/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 1.10584615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:17,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.42932 samples/s/p 6:24:19 } +2024-07-25 18:43:20,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 602/ 1625], loss: 
1.235, per_step_time: 1471ms, lr: 1.1095383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:20,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43681 samples/s/p 6:23:45 } +2024-07-25 18:43:23,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 604/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 1.1132307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:23,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43826 samples/s/p 6:23:36 } +2024-07-25 18:43:26,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 606/ 1625], loss: 1.288, per_step_time: 1471ms, lr: 1.1169231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:26,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43759 samples/s/p 6:23:36 } +2024-07-25 18:43:29,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 608/ 1625], loss: 1.268, per_step_time: 1472ms, lr: 1.1206153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:29,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43441 samples/s/p 6:23:46 } +2024-07-25 18:43:32,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 610/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 1.1243076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:32,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43705 samples/s/p 6:23:32 } +2024-07-25 18:43:35,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 612/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.1279999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:35,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43634 samples/s/p 6:23:32 } +2024-07-25 
18:43:38,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 614/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 1.1316923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:38,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43229 samples/s/p 6:23:46 } +2024-07-25 18:43:41,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 616/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.1353846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:41,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43738 samples/s/p 6:23:22 } +2024-07-25 18:43:44,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 618/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 1.1390768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:44,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43826 samples/s/p 6:23:15 } +2024-07-25 18:43:47,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 620/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 1.1427692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:47,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43289 samples/s/p 6:23:35 } +2024-07-25 18:43:50,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 622/ 1625], loss: 1.363, per_step_time: 1472ms, lr: 1.14646145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:50,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43372 samples/s/p 6:23:28 } +2024-07-25 18:43:53,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 624/ 1625], loss: 1.160, per_step_time: 1474ms, lr: 1.1501538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:53,361 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.42405 samples/s/p 6:24:06 } +2024-07-25 18:43:56,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 626/ 1625], loss: 1.219, per_step_time: 1470ms, lr: 1.1538462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:56,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43995 samples/s/p 6:22:56 } +2024-07-25 18:43:59,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 628/ 1625], loss: 1.308, per_step_time: 1472ms, lr: 1.1575384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:59,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43432 samples/s/p 6:23:17 } +2024-07-25 18:44:02,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 630/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 1.1612307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:02,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43214 samples/s/p 6:23:23 } +2024-07-25 18:44:05,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 632/ 1625], loss: 1.094, per_step_time: 1476ms, lr: 1.164923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:05,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.41973 samples/s/p 6:24:13 } +2024-07-25 18:44:08,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 634/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 1.1686154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:08,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43518 samples/s/p 6:23:05 } +2024-07-25 18:44:11,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 636/ 1625], loss: 
1.196, per_step_time: 1472ms, lr: 1.1723076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:11,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43254 samples/s/p 6:23:13 } +2024-07-25 18:44:14,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 638/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 1.1759999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:14,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43487 samples/s/p 6:23:00 } +2024-07-25 18:44:16,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 640/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 1.1796923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:16,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.44130 samples/s/p 6:22:30 } +2024-07-25 18:44:19,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 642/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 1.1833846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:19,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.43501 samples/s/p 6:22:54 } +2024-07-25 18:44:22,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 644/ 1625], loss: 1.335, per_step_time: 1472ms, lr: 1.18707685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:22,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.43199 samples/s/p 6:23:03 } +2024-07-25 18:44:25,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 646/ 1625], loss: 1.225, per_step_time: 1470ms, lr: 1.1907691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:25,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.44004 samples/s/p 6:22:26 } +2024-07-25 
18:44:28,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 648/ 1625], loss: 1.067, per_step_time: 1470ms, lr: 1.1944615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:28,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.43868 samples/s/p 6:22:29 } +2024-07-25 18:44:31,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 650/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 1.1981539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:31,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43619 samples/s/p 6:22:37 } +2024-07-25 18:44:34,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 652/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 1.201846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:34,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43105 samples/s/p 6:22:56 } +2024-07-25 18:44:37,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 654/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 1.2055384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:37,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43343 samples/s/p 6:22:43 } +2024-07-25 18:44:40,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 656/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 1.2092307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:40,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43563 samples/s/p 6:22:30 } +2024-07-25 18:44:43,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 658/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 1.21292305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:43,533 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43380 samples/s/p 6:22:35 } +2024-07-25 18:44:46,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 660/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 1.2166153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:46,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43915 samples/s/p 6:22:10 } +2024-07-25 18:44:49,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 662/ 1625], loss: 1.351, per_step_time: 1473ms, lr: 1.2203076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:49,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.42998 samples/s/p 6:22:45 } +2024-07-25 18:44:52,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 664/ 1625], loss: 1.231, per_step_time: 1470ms, lr: 1.224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:52,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43977 samples/s/p 6:22:01 } +2024-07-25 18:44:55,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 666/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 1.22769225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:55,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.42980 samples/s/p 6:22:40 } +2024-07-25 18:44:58,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 668/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 1.2313846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:58,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43425 samples/s/p 6:22:18 } +2024-07-25 18:45:01,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 670/ 1625], 
loss: 1.173, per_step_time: 1472ms, lr: 1.2350769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:01,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43320 samples/s/p 6:22:20 } +2024-07-25 18:45:04,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 672/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 1.2387692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:04,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43179 samples/s/p 6:22:23 } +2024-07-25 18:45:07,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 674/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 1.2424615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:07,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43568 samples/s/p 6:22:04 } +2024-07-25 18:45:10,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 676/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 1.2461538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:10,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43174 samples/s/p 6:22:17 } +2024-07-25 18:45:13,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 678/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.2498461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:13,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43243 samples/s/p 6:22:11 } +2024-07-25 18:45:16,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 680/ 1625], loss: 1.174, per_step_time: 1481ms, lr: 1.2535384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:16,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.40113 samples/s/p 6:24:21 } 
+2024-07-25 18:45:18,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 682/ 1625], loss: 1.045, per_step_time: 1471ms, lr: 1.2572307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:18,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43808 samples/s/p 6:21:42 } +2024-07-25 18:45:21,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 684/ 1625], loss: 1.305, per_step_time: 1470ms, lr: 1.2609231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:21,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43943 samples/s/p 6:21:33 } +2024-07-25 18:45:24,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 686/ 1625], loss: 1.252, per_step_time: 1470ms, lr: 1.2646153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:24,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43878 samples/s/p 6:21:33 } +2024-07-25 18:45:27,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 688/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 1.2683076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:27,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43486 samples/s/p 6:21:46 } +2024-07-25 18:45:30,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 690/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.2719999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:30,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43592 samples/s/p 6:21:39 } +2024-07-25 18:45:33,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 692/ 1625], loss: 1.014, per_step_time: 1470ms, lr: 1.2756923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
18:45:33,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43851 samples/s/p 6:21:25 } +2024-07-25 18:45:36,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 694/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 1.2793846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:36,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.42939 samples/s/p 6:22:01 } +2024-07-25 18:45:39,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 696/ 1625], loss: 1.387, per_step_time: 1471ms, lr: 1.2830768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:39,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43637 samples/s/p 6:21:28 } +2024-07-25 18:45:42,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 698/ 1625], loss: 1.554, per_step_time: 1473ms, lr: 1.2867692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:42,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.42996 samples/s/p 6:21:52 } +2024-07-25 18:45:45,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 700/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 1.2904615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:45,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43766 samples/s/p 6:21:17 } +2024-07-25 18:45:48,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 702/ 1625], loss: 1.271, per_step_time: 1470ms, lr: 1.29415375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:48,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.44144 samples/s/p 6:20:58 } +2024-07-25 18:45:51,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 704/ 1625], loss: 1.303, per_step_time: 1472ms, lr: 1.2978461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:51,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43311 samples/s/p 6:21:30 } +2024-07-25 18:45:54,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 706/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 1.3015384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:54,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43558 samples/s/p 6:21:17 } +2024-07-25 18:45:57,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 708/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 1.3052308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:57,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43001 samples/s/p 6:21:37 } +2024-07-25 18:46:00,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 710/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 1.308923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:00,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43319 samples/s/p 6:21:21 } +2024-07-25 18:46:03,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 712/ 1625], loss: 1.294, per_step_time: 1472ms, lr: 1.3126153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:03,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43239 samples/s/p 6:21:22 } +2024-07-25 18:46:06,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 714/ 1625], loss: 1.334, per_step_time: 1472ms, lr: 1.3163076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:06,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43120 samples/s/p 
6:21:24 } +2024-07-25 18:46:09,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 716/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.32e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:09,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43757 samples/s/p 6:20:54 } +2024-07-25 18:46:12,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 718/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.3236923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:12,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43656 samples/s/p 6:20:55 } +2024-07-25 18:46:15,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 720/ 1625], loss: 1.106, per_step_time: 1474ms, lr: 1.3273845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:15,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.42678 samples/s/p 6:21:33 } +2024-07-25 18:46:17,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 722/ 1625], loss: 1.184, per_step_time: 1473ms, lr: 1.3310769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:17,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.42885 samples/s/p 6:21:22 } +2024-07-25 18:46:20,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 724/ 1625], loss: 1.268, per_step_time: 1474ms, lr: 1.33476915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:20,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.42730 samples/s/p 6:21:25 } +2024-07-25 18:46:23,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 726/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 1.3384615e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 18:46:23,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43674 samples/s/p 6:20:43 } +2024-07-25 18:46:26,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 728/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 1.3421538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:26,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43884 samples/s/p 6:20:31 } +2024-07-25 18:46:29,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 730/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 1.3458461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:29,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43840 samples/s/p 6:20:30 } +2024-07-25 18:46:32,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 732/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 1.3495384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:32,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.42918 samples/s/p 6:21:06 } +2024-07-25 18:46:35,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 734/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.3532307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:35,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43534 samples/s/p 6:20:37 } +2024-07-25 18:46:38,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 736/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 1.356923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:38,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43742 samples/s/p 6:20:25 } +2024-07-25 18:46:41,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 
10], step:[ 738/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 1.36061535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:41,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43257 samples/s/p 6:20:42 } +2024-07-25 18:46:44,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 740/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 1.3643076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:44,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.42940 samples/s/p 6:20:53 } +2024-07-25 18:46:47,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 742/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 1.368e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:47,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43867 samples/s/p 6:20:11 } +2024-07-25 18:46:50,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 744/ 1625], loss: 1.380, per_step_time: 1472ms, lr: 1.3716922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:50,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43340 samples/s/p 6:20:30 } +2024-07-25 18:46:53,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 746/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 1.3753845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:53,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.44194 samples/s/p 6:19:51 } +2024-07-25 18:46:56,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 748/ 1625], loss: 1.283, per_step_time: 1472ms, lr: 1.3790768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:56,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43309 
samples/s/p 6:20:26 } +2024-07-25 18:46:59,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 750/ 1625], loss: 1.363, per_step_time: 1471ms, lr: 1.3827692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:59,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43505 samples/s/p 6:20:14 } +2024-07-25 18:47:02,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 752/ 1625], loss: 0.935, per_step_time: 1470ms, lr: 1.38646155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:02,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43910 samples/s/p 6:19:54 } +2024-07-25 18:47:05,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 754/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 1.3901537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:05,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43795 samples/s/p 6:19:56 } +2024-07-25 18:47:08,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 756/ 1625], loss: 1.103, per_step_time: 1471ms, lr: 1.3938461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:08,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43757 samples/s/p 6:19:55 } +2024-07-25 18:47:11,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 758/ 1625], loss: 1.241, per_step_time: 1480ms, lr: 1.3975384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:11,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.40426 samples/s/p 6:22:13 } +2024-07-25 18:47:14,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 760/ 1625], loss: 1.270, per_step_time: 1470ms, lr: 1.40123075e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 18:47:14,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.44061 samples/s/p 6:19:36 } +2024-07-25 18:47:17,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 762/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 1.404923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:17,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43263 samples/s/p 6:20:07 } +2024-07-25 18:47:19,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 764/ 1625], loss: 1.331, per_step_time: 1471ms, lr: 1.4086153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:19,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43587 samples/s/p 6:19:50 } +2024-07-25 18:47:22,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 766/ 1625], loss: 1.412, per_step_time: 1472ms, lr: 1.4123077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:22,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43340 samples/s/p 6:19:58 } +2024-07-25 18:47:25,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 768/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.4159999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:25,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43235 samples/s/p 6:19:59 } +2024-07-25 18:47:28,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 770/ 1625], loss: 1.398, per_step_time: 1474ms, lr: 1.4196922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:28,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.42685 samples/s/p 6:20:19 } +2024-07-25 18:47:31,790 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 1/ 10], step:[ 772/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.4233846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:31,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43377 samples/s/p 6:19:47 } +2024-07-25 18:47:34,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 774/ 1625], loss: 1.239, per_step_time: 1472ms, lr: 1.4270769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:34,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43367 samples/s/p 6:19:45 } +2024-07-25 18:47:37,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 776/ 1625], loss: 1.196, per_step_time: 1474ms, lr: 1.4307692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:37,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.42446 samples/s/p 6:20:21 } +2024-07-25 18:47:40,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 778/ 1625], loss: 1.310, per_step_time: 1472ms, lr: 1.4344614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:40,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43345 samples/s/p 6:19:40 } +2024-07-25 18:47:43,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 780/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 1.4381538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:43,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43843 samples/s/p 6:19:16 } +2024-07-25 18:47:46,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 782/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 1.44184605e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:46,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% 
|██ | 5.43383 samples/s/p 6:19:32 } +2024-07-25 18:47:49,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 784/ 1625], loss: 1.322, per_step_time: 1471ms, lr: 1.4455384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:49,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43568 samples/s/p 6:19:22 } +2024-07-25 18:47:52,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 786/ 1625], loss: 1.141, per_step_time: 1477ms, lr: 1.4492307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:52,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.41613 samples/s/p 6:20:41 } +2024-07-25 18:47:55,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 788/ 1625], loss: 1.232, per_step_time: 1474ms, lr: 1.452923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:55,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.42709 samples/s/p 6:19:52 } +2024-07-25 18:47:58,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 790/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 1.4566153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:58,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43538 samples/s/p 6:19:14 } +2024-07-25 18:48:01,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 792/ 1625], loss: 1.109, per_step_time: 1471ms, lr: 1.4603076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:01,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43526 samples/s/p 6:19:12 } +2024-07-25 18:48:04,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 794/ 1625], loss: 1.168, per_step_time: 1469ms, lr: 1.464e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:48:04,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.44249 samples/s/p 6:18:39 } +2024-07-25 18:48:07,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 796/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 1.4676923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:07,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43259 samples/s/p 6:19:17 } +2024-07-25 18:48:10,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 798/ 1625], loss: 1.349, per_step_time: 1473ms, lr: 1.4713845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:10,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43006 samples/s/p 6:19:25 } +2024-07-25 18:48:13,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 800/ 1625], loss: 1.090, per_step_time: 1470ms, lr: 1.4750769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:13,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.44216 samples/s/p 6:18:31 } +2024-07-25 18:48:16,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 802/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 1.4787692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:16,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43182 samples/s/p 6:19:11 } +2024-07-25 18:48:19,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 804/ 1625], loss: 1.271, per_step_time: 1473ms, lr: 1.48246145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:19,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.42783 samples/s/p 6:19:25 } +2024-07-25 18:48:21,977 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 806/ 1625], loss: 1.011, per_step_time: 1470ms, lr: 1.4861538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:21,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43862 samples/s/p 6:18:37 } +2024-07-25 18:48:24,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 808/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.4898461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:24,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43396 samples/s/p 6:18:54 } +2024-07-25 18:48:27,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 810/ 1625], loss: 1.356, per_step_time: 1472ms, lr: 1.4935385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:27,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43309 samples/s/p 6:18:54 } +2024-07-25 18:48:30,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 812/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.4972306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:30,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43597 samples/s/p 6:18:39 } +2024-07-25 18:48:33,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 814/ 1625], loss: 1.210, per_step_time: 1471ms, lr: 1.500923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:33,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43697 samples/s/p 6:18:32 } +2024-07-25 18:48:36,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 816/ 1625], loss: 1.139, per_step_time: 1470ms, lr: 1.5046153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:36,730 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.44077 samples/s/p 6:18:13 } +2024-07-25 18:48:39,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 818/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 1.50830765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:39,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.42854 samples/s/p 6:19:02 } +2024-07-25 18:48:42,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 820/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 1.512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:42,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.42826 samples/s/p 6:19:00 } +2024-07-25 18:48:45,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 822/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.5156923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:45,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43524 samples/s/p 6:18:28 } +2024-07-25 18:48:48,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 824/ 1625], loss: 1.263, per_step_time: 1473ms, lr: 1.5193845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:48,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.42941 samples/s/p 6:18:49 } +2024-07-25 18:48:51,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 826/ 1625], loss: 1.060, per_step_time: 1470ms, lr: 1.52307675e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:51,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43962 samples/s/p 6:18:03 } +2024-07-25 18:48:54,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 828/ 1625], 
loss: 1.136, per_step_time: 1473ms, lr: 1.5267691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:54,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43103 samples/s/p 6:18:36 } +2024-07-25 18:48:57,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 830/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.5304615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:57,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43461 samples/s/p 6:18:18 } +2024-07-25 18:49:00,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 832/ 1625], loss: 1.263, per_step_time: 1473ms, lr: 1.5341539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:00,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43073 samples/s/p 6:18:32 } +2024-07-25 18:49:03,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 834/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 1.537846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:03,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43786 samples/s/p 6:17:59 } +2024-07-25 18:49:06,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 836/ 1625], loss: 1.266, per_step_time: 1473ms, lr: 1.5415384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:06,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.42964 samples/s/p 6:18:30 } +2024-07-25 18:49:09,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 838/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 1.5452308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:09,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43639 samples/s/p 6:17:59 } 
+2024-07-25 18:49:12,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 840/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 1.5489231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:12,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43292 samples/s/p 6:18:11 } +2024-07-25 18:49:15,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 842/ 1625], loss: 1.164, per_step_time: 1470ms, lr: 1.5526153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:15,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43861 samples/s/p 6:17:44 } +2024-07-25 18:49:18,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 844/ 1625], loss: 1.305, per_step_time: 1471ms, lr: 1.5563075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:18,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43597 samples/s/p 6:17:52 } +2024-07-25 18:49:21,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 846/ 1625], loss: 1.285, per_step_time: 1471ms, lr: 1.5599999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:21,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43831 samples/s/p 6:17:39 } +2024-07-25 18:49:23,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 848/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 1.5636922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:23,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43670 samples/s/p 6:17:43 } +2024-07-25 18:49:26,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 850/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 1.5673846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
18:49:26,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43403 samples/s/p 6:17:51 } +2024-07-25 18:49:29,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 852/ 1625], loss: 1.398, per_step_time: 1470ms, lr: 1.571077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:29,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.44015 samples/s/p 6:17:23 } +2024-07-25 18:49:32,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 854/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 1.5747692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:32,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.43209 samples/s/p 6:17:54 } +2024-07-25 18:49:35,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 856/ 1625], loss: 1.182, per_step_time: 1474ms, lr: 1.5784615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:35,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.42562 samples/s/p 6:18:18 } +2024-07-25 18:49:38,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 858/ 1625], loss: 1.099, per_step_time: 1470ms, lr: 1.5821537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:38,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.44191 samples/s/p 6:17:07 } +2024-07-25 18:49:41,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 860/ 1625], loss: 1.126, per_step_time: 1469ms, lr: 1.585846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:41,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.44505 samples/s/p 6:16:51 } +2024-07-25 18:49:44,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
862/ 1625], loss: 1.296, per_step_time: 1479ms, lr: 1.5895384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:44,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.40580 samples/s/p 6:19:32 } +2024-07-25 18:49:47,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 864/ 1625], loss: 1.288, per_step_time: 1473ms, lr: 1.5932306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:47,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.42807 samples/s/p 6:17:56 } +2024-07-25 18:49:50,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 866/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 1.596923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:50,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.43468 samples/s/p 6:17:25 } +2024-07-25 18:49:53,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 868/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.6006154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:53,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.43613 samples/s/p 6:17:16 } +2024-07-25 18:49:56,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 870/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 1.6043077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:56,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43843 samples/s/p 6:17:04 } +2024-07-25 18:49:59,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 872/ 1625], loss: 1.030, per_step_time: 1472ms, lr: 1.608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:59,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43420 samples/s/p 6:17:18 } 
+2024-07-25 18:50:02,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 874/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.6116921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:02,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43519 samples/s/p 6:17:11 } +2024-07-25 18:50:05,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 876/ 1625], loss: 1.141, per_step_time: 1470ms, lr: 1.6153845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:05,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.44124 samples/s/p 6:16:43 } +2024-07-25 18:50:08,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 878/ 1625], loss: 1.306, per_step_time: 1473ms, lr: 1.6190768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:08,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.42746 samples/s/p 6:17:38 } +2024-07-25 18:50:11,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 880/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 1.6227692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:11,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43092 samples/s/p 6:17:20 } +2024-07-25 18:50:14,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 882/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 1.6264614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:14,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.44049 samples/s/p 6:16:37 } +2024-07-25 18:50:17,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 884/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 1.6301537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
18:50:17,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43250 samples/s/p 6:17:08 } +2024-07-25 18:50:20,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 886/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 1.6338461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:20,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.44161 samples/s/p 6:16:27 } +2024-07-25 18:50:22,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 888/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 1.6375385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:22,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.42926 samples/s/p 6:17:15 } +2024-07-25 18:50:25,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 890/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 1.6412308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:25,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43568 samples/s/p 6:16:46 } +2024-07-25 18:50:28,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 892/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 1.6449228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:28,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43814 samples/s/p 6:16:33 } +2024-07-25 18:50:31,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 894/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 1.6486152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:31,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43208 samples/s/p 6:16:55 } +2024-07-25 18:50:34,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 896/ 1625], loss: 1.447, per_step_time: 1474ms, lr: 1.6523076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:34,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.42482 samples/s/p 6:17:22 } +2024-07-25 18:50:37,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 898/ 1625], loss: 1.452, per_step_time: 1472ms, lr: 1.656e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:37,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43478 samples/s/p 6:16:38 } +2024-07-25 18:50:40,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 900/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 1.6596923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:40,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43535 samples/s/p 6:16:32 } +2024-07-25 18:50:43,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 902/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 1.6633845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:43,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43415 samples/s/p 6:16:34 } +2024-07-25 18:50:46,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 904/ 1625], loss: 1.327, per_step_time: 1470ms, lr: 1.6670769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:46,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43993 samples/s/p 6:16:07 } +2024-07-25 18:50:49,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 906/ 1625], loss: 1.376, per_step_time: 1470ms, lr: 1.6707692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:49,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43928 samples/s/p 
6:16:07 } +2024-07-25 18:50:52,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 908/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.6744614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:52,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43844 samples/s/p 6:16:08 } +2024-07-25 18:50:55,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 910/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.6781538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:55,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43431 samples/s/p 6:16:22 } +2024-07-25 18:50:58,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 912/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 1.681846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:58,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43499 samples/s/p 6:16:16 } +2024-07-25 18:51:01,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 914/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 1.6855383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:01,347 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.44041 samples/s/p 6:15:51 } +2024-07-25 18:51:04,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 916/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 1.6892307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:04,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43217 samples/s/p 6:16:22 } +2024-07-25 18:51:07,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 918/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 1.692923e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 18:51:07,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43622 samples/s/p 6:16:02 } +2024-07-25 18:51:10,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 920/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 1.6966154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:10,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43153 samples/s/p 6:16:19 } +2024-07-25 18:51:13,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 922/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 1.7003076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:13,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43508 samples/s/p 6:16:01 } +2024-07-25 18:51:16,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 924/ 1625], loss: 1.219, per_step_time: 1473ms, lr: 1.704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:16,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43069 samples/s/p 6:16:16 } +2024-07-25 18:51:19,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 926/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 1.7076922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:19,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43762 samples/s/p 6:15:45 } +2024-07-25 18:51:22,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 928/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 1.7113845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:22,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43590 samples/s/p 6:15:49 } +2024-07-25 18:51:24,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 
10], step:[ 930/ 1625], loss: 1.207, per_step_time: 1470ms, lr: 1.7150769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:24,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43989 samples/s/p 6:15:29 } +2024-07-25 18:51:27,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 932/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 1.718769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:27,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43919 samples/s/p 6:15:29 } +2024-07-25 18:51:30,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 934/ 1625], loss: 1.250, per_step_time: 1471ms, lr: 1.7224615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:30,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43665 samples/s/p 6:15:37 } +2024-07-25 18:51:33,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 936/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 1.7261538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:33,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43370 samples/s/p 6:15:46 } +2024-07-25 18:51:36,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 938/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.7298462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:36,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43199 samples/s/p 6:15:50 } +2024-07-25 18:51:39,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 940/ 1625], loss: 1.385, per_step_time: 1471ms, lr: 1.7335384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:39,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43585 
samples/s/p 6:15:31 } +2024-07-25 18:51:42,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 942/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.7372306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:42,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43765 samples/s/p 6:15:21 } +2024-07-25 18:51:45,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 944/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 1.740923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:45,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43569 samples/s/p 6:15:26 } +2024-07-25 18:51:48,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 946/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.7446153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:48,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43503 samples/s/p 6:15:26 } +2024-07-25 18:51:51,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 948/ 1625], loss: 1.122, per_step_time: 1473ms, lr: 1.7483077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:51,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.42849 samples/s/p 6:15:50 } +2024-07-25 18:51:54,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 950/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 1.7519998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:54,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.42790 samples/s/p 6:15:50 } +2024-07-25 18:51:57,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 952/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 1.7556922e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 18:51:57,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.44098 samples/s/p 6:14:52 } +2024-07-25 18:52:00,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 954/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.7593846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:00,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43330 samples/s/p 6:15:21 } +2024-07-25 18:52:03,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 956/ 1625], loss: 1.166, per_step_time: 1470ms, lr: 1.763077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:03,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43924 samples/s/p 6:14:54 } +2024-07-25 18:52:06,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 958/ 1625], loss: 1.321, per_step_time: 1472ms, lr: 1.7667691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:06,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43449 samples/s/p 6:15:11 } +2024-07-25 18:52:09,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 960/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 1.7704613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:09,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43246 samples/s/p 6:15:16 } +2024-07-25 18:52:12,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 962/ 1625], loss: 0.985, per_step_time: 1471ms, lr: 1.7741537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:12,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43757 samples/s/p 6:14:52 } +2024-07-25 18:52:15,123 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 1/ 10], step:[ 964/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 1.777846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:15,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43341 samples/s/p 6:15:06 } +2024-07-25 18:52:18,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 966/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.7815384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:18,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43463 samples/s/p 6:14:58 } +2024-07-25 18:52:21,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 968/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 1.7852308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:21,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.43647 samples/s/p 6:14:48 } +2024-07-25 18:52:23,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 970/ 1625], loss: 1.283, per_step_time: 1472ms, lr: 1.788923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:23,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.43231 samples/s/p 6:15:02 } +2024-07-25 18:52:26,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 972/ 1625], loss: 1.208, per_step_time: 1473ms, lr: 1.7926153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:26,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.43025 samples/s/p 6:15:08 } +2024-07-25 18:52:29,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 974/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 1.7963077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:29,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ 
| 5.43065 samples/s/p 6:15:03 } +2024-07-25 18:52:32,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 976/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 1.7999999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:32,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.43128 samples/s/p 6:14:57 } +2024-07-25 18:52:35,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 978/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 1.8036922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:35,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.44187 samples/s/p 6:14:11 } +2024-07-25 18:52:38,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 980/ 1625], loss: 1.142, per_step_time: 1482ms, lr: 1.8073844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:38,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.39637 samples/s/p 6:17:17 } +2024-07-25 18:52:41,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 982/ 1625], loss: 1.345, per_step_time: 1473ms, lr: 1.8110768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:41,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.42897 samples/s/p 6:14:58 } +2024-07-25 18:52:44,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 984/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.8147692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:44,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43459 samples/s/p 6:14:32 } +2024-07-25 18:52:47,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 986/ 1625], loss: 1.310, per_step_time: 1470ms, lr: 1.8184615e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:52:47,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43991 samples/s/p 6:14:07 } +2024-07-25 18:52:50,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 988/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 1.8221539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:50,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43568 samples/s/p 6:14:21 } +2024-07-25 18:52:53,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 990/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 1.825846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:53,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43271 samples/s/p 6:14:31 } +2024-07-25 18:52:56,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 992/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 1.8295383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:56,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43286 samples/s/p 6:14:27 } +2024-07-25 18:52:59,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 994/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.8332306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:59,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43729 samples/s/p 6:14:06 } +2024-07-25 18:53:02,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 996/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 1.836923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:02,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43072 samples/s/p 6:14:30 } +2024-07-25 18:53:05,317 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 998/ 1625], loss: 1.314, per_step_time: 1471ms, lr: 1.8406154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:05,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43544 samples/s/p 6:14:08 } +2024-07-25 18:53:08,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1000/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 1.8443076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:08,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43862 samples/s/p 6:13:52 } +2024-07-25 18:53:11,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1002/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 1.848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:11,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43323 samples/s/p 6:14:11 } +2024-07-25 18:53:14,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1004/ 1625], loss: 1.311, per_step_time: 1474ms, lr: 1.8516923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:14,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.42685 samples/s/p 6:14:34 } +2024-07-25 18:53:17,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1006/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 1.8553847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:17,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43171 samples/s/p 6:14:11 } +2024-07-25 18:53:20,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1008/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 1.859077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:20,077 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43528 samples/s/p 6:13:54 } +2024-07-25 18:53:23,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1010/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 1.862769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:23,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43558 samples/s/p 6:13:50 } +2024-07-25 18:53:25,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1012/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 1.8664614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:25,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43970 samples/s/p 6:13:30 } +2024-07-25 18:53:28,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1014/ 1625], loss: 1.070, per_step_time: 1469ms, lr: 1.8701538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:28,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.44284 samples/s/p 6:13:14 } +2024-07-25 18:53:31,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1016/ 1625], loss: 1.289, per_step_time: 1470ms, lr: 1.8738461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:31,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43895 samples/s/p 6:13:27 } +2024-07-25 18:53:34,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1018/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 1.8775383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:34,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43044 samples/s/p 6:13:59 } +2024-07-25 18:53:37,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1020/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 1.8812307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:37,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43737 samples/s/p 6:13:27 } +2024-07-25 18:53:40,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1022/ 1625], loss: 1.230, per_step_time: 1473ms, lr: 1.884923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:40,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.42949 samples/s/p 6:13:57 } +2024-07-25 18:53:43,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1024/ 1625], loss: 1.329, per_step_time: 1472ms, lr: 1.8886154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:43,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43188 samples/s/p 6:13:44 } +2024-07-25 18:53:46,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1026/ 1625], loss: 1.394, per_step_time: 1470ms, lr: 1.8923076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:46,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.44076 samples/s/p 6:13:05 } +2024-07-25 18:53:49,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1028/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.8959998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:49,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43795 samples/s/p 6:13:13 } +2024-07-25 18:53:52,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1030/ 1625], loss: 1.047, per_step_time: 1471ms, lr: 1.8996921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:52,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43564 
samples/s/p 6:13:20 } +2024-07-25 18:53:55,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1032/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.9033845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:55,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.43489 samples/s/p 6:13:20 } +2024-07-25 18:53:58,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1034/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 1.9070769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:58,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.43622 samples/s/p 6:13:12 } +2024-07-25 18:54:01,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1036/ 1625], loss: 1.235, per_step_time: 1476ms, lr: 1.9107692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:01,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.41907 samples/s/p 6:14:19 } +2024-07-25 18:54:04,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1038/ 1625], loss: 1.303, per_step_time: 1475ms, lr: 1.9144614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:04,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.42362 samples/s/p 6:13:58 } +2024-07-25 18:54:07,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1040/ 1625], loss: 1.367, per_step_time: 1473ms, lr: 1.9181538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:07,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.43024 samples/s/p 6:13:27 } +2024-07-25 18:54:10,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1042/ 1625], loss: 1.212, per_step_time: 1473ms, lr: 1.921846e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:54:10,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.43082 samples/s/p 6:13:22 } +2024-07-25 18:54:13,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1044/ 1625], loss: 1.122, per_step_time: 1473ms, lr: 1.9255383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:13,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.42763 samples/s/p 6:13:32 } +2024-07-25 18:54:16,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1046/ 1625], loss: 1.060, per_step_time: 1473ms, lr: 1.9292307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:16,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.42889 samples/s/p 6:13:24 } +2024-07-25 18:54:19,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1048/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.9329229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:19,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.43642 samples/s/p 6:12:50 } +2024-07-25 18:54:22,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1050/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 1.9366153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:22,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.43608 samples/s/p 6:12:49 } +2024-07-25 18:54:25,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1052/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.9403076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:25,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.43519 samples/s/p 6:12:49 } +2024-07-25 18:54:27,969 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1054/ 1625], loss: 1.456, per_step_time: 1473ms, lr: 1.944e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:27,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.43101 samples/s/p 6:13:04 } +2024-07-25 18:54:30,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1056/ 1625], loss: 0.973, per_step_time: 1474ms, lr: 1.9476924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:30,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.42691 samples/s/p 6:13:18 } +2024-07-25 18:54:33,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1058/ 1625], loss: 1.146, per_step_time: 1470ms, lr: 1.9513845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:33,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.44136 samples/s/p 6:12:15 } +2024-07-25 18:54:36,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1060/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 1.9550767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.44109 samples/s/p 6:12:13 } +2024-07-25 18:54:39,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1062/ 1625], loss: 1.185, per_step_time: 1474ms, lr: 1.9587691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:39,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.42482 samples/s/p 6:13:17 } +2024-07-25 18:54:42,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1064/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 1.9624615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:42,726 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.43554 samples/s/p 6:12:30 } +2024-07-25 18:54:45,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1066/ 1625], loss: 1.312, per_step_time: 1470ms, lr: 1.9661538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:45,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43924 samples/s/p 6:12:12 } +2024-07-25 18:54:48,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1068/ 1625], loss: 1.103, per_step_time: 1473ms, lr: 1.969846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:48,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43074 samples/s/p 6:12:44 } +2024-07-25 18:54:51,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1070/ 1625], loss: 1.237, per_step_time: 1470ms, lr: 1.9735384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:51,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.44018 samples/s/p 6:12:02 } +2024-07-25 18:54:54,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1072/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 1.9772307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:54,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43518 samples/s/p 6:12:20 } +2024-07-25 18:54:57,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1074/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.9809231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:57,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43628 samples/s/p 6:12:12 } +2024-07-25 18:55:00,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1076/ 1625], loss: 1.013, per_step_time: 1471ms, lr: 1.9846153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:00,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43676 samples/s/p 6:12:08 } +2024-07-25 18:55:03,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1078/ 1625], loss: 1.176, per_step_time: 1472ms, lr: 1.9883075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:03,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43231 samples/s/p 6:12:23 } +2024-07-25 18:55:06,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1080/ 1625], loss: 1.101, per_step_time: 1472ms, lr: 1.9919999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:06,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43400 samples/s/p 6:12:13 } +2024-07-25 18:55:09,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1082/ 1625], loss: 1.403, per_step_time: 1472ms, lr: 1.9956922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:09,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43217 samples/s/p 6:12:18 } +2024-07-25 18:55:12,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1084/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 1.9993846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:12,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43363 samples/s/p 6:12:09 } +2024-07-25 18:55:15,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1086/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 2.0030768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:15,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.42898 
samples/s/p 6:12:25 } +2024-07-25 18:55:18,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1088/ 1625], loss: 1.225, per_step_time: 1474ms, lr: 2.0067691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:18,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.42573 samples/s/p 6:12:35 } +2024-07-25 18:55:21,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1090/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.0104615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:21,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43178 samples/s/p 6:12:07 } +2024-07-25 18:55:24,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1092/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 2.0141539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:24,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43825 samples/s/p 6:11:38 } +2024-07-25 18:55:27,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1094/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 2.017846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:27,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43013 samples/s/p 6:12:08 } +2024-07-25 18:55:29,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1096/ 1625], loss: 1.179, per_step_time: 1474ms, lr: 2.0215382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:29,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.42672 samples/s/p 6:12:19 } +2024-07-25 18:55:32,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1098/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.0252306e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:55:32,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43518 samples/s/p 6:11:42 } +2024-07-25 18:55:35,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1100/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 2.028923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:35,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43301 samples/s/p 6:11:48 } +2024-07-25 18:55:38,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1102/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.0326153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:38,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43398 samples/s/p 6:11:41 } +2024-07-25 18:55:41,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1104/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 2.0363077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:41,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.44081 samples/s/p 6:11:10 } +2024-07-25 18:55:44,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1106/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 2.0399999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:44,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43315 samples/s/p 6:11:38 } +2024-07-25 18:55:47,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1108/ 1625], loss: 1.259, per_step_time: 1476ms, lr: 2.0436923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:47,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.41663 samples/s/p 6:12:43 } +2024-07-25 18:55:50,626 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1110/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 2.0473844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:50,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43260 samples/s/p 6:11:35 } +2024-07-25 18:55:53,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1112/ 1625], loss: 1.234, per_step_time: 1473ms, lr: 2.0510768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:53,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.42988 samples/s/p 6:11:43 } +2024-07-25 18:55:56,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1114/ 1625], loss: 1.048, per_step_time: 1474ms, lr: 2.0547692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:56,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.42739 samples/s/p 6:11:50 } +2024-07-25 18:55:59,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1116/ 1625], loss: 1.025, per_step_time: 1472ms, lr: 2.0584614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:59,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.43370 samples/s/p 6:11:21 } +2024-07-25 18:56:02,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1118/ 1625], loss: 1.069, per_step_time: 1476ms, lr: 2.0621537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:02,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.41801 samples/s/p 6:12:23 } +2024-07-25 18:56:05,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1120/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.0658461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:05,401 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.43189 samples/s/p 6:11:23 } +2024-07-25 18:56:08,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1122/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 2.0695385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:08,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.43358 samples/s/p 6:11:13 } +2024-07-25 18:56:11,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1124/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.0732308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:11,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.43718 samples/s/p 6:10:55 } +2024-07-25 18:56:14,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1126/ 1625], loss: 1.313, per_step_time: 1471ms, lr: 2.0769228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:14,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.43641 samples/s/p 6:10:55 } +2024-07-25 18:56:17,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1128/ 1625], loss: 1.227, per_step_time: 1473ms, lr: 2.0806152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:17,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.42985 samples/s/p 6:11:19 } +2024-07-25 18:56:20,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1130/ 1625], loss: 1.084, per_step_time: 1470ms, lr: 2.0843076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:20,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43994 samples/s/p 6:10:35 } +2024-07-25 18:56:23,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1132/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 2.088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:23,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43606 samples/s/p 6:10:48 } +2024-07-25 18:56:26,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1134/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.0916923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:26,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43511 samples/s/p 6:10:49 } +2024-07-25 18:56:29,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1136/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 2.0953845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:29,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43238 samples/s/p 6:10:57 } +2024-07-25 18:56:31,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1138/ 1625], loss: 1.278, per_step_time: 1473ms, lr: 2.0990768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:31,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43108 samples/s/p 6:11:00 } +2024-07-25 18:56:34,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1140/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 2.1027692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:34,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43547 samples/s/p 6:10:39 } +2024-07-25 18:56:37,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1142/ 1625], loss: 1.185, per_step_time: 1473ms, lr: 2.1064616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:37,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.42746 samples/s/p 
6:11:08 } +2024-07-25 18:56:40,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1144/ 1625], loss: 1.341, per_step_time: 1474ms, lr: 2.1101538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:40,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.42634 samples/s/p 6:11:10 } +2024-07-25 18:56:43,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1146/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 2.113846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:43,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43441 samples/s/p 6:10:34 } +2024-07-25 18:56:46,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1148/ 1625], loss: 1.299, per_step_time: 1473ms, lr: 2.1175383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:46,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.42857 samples/s/p 6:10:55 } +2024-07-25 18:56:49,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1150/ 1625], loss: 1.231, per_step_time: 1473ms, lr: 2.1212307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:49,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.42798 samples/s/p 6:10:55 } +2024-07-25 18:56:52,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1152/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.124923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:52,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43274 samples/s/p 6:10:32 } +2024-07-25 18:56:55,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1154/ 1625], loss: 0.892, per_step_time: 1471ms, lr: 2.1286154e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 18:56:55,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43779 samples/s/p 6:10:09 } +2024-07-25 18:56:58,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1156/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 2.1323076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:58,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43349 samples/s/p 6:10:23 } +2024-07-25 18:57:01,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1158/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:01,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43146 samples/s/p 6:10:29 } +2024-07-25 18:57:04,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1160/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 2.1396922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:04,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43332 samples/s/p 6:10:18 } +2024-07-25 18:57:07,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1162/ 1625], loss: 1.084, per_step_time: 1469ms, lr: 2.1433845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:07,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.44408 samples/s/p 6:09:31 } +2024-07-25 18:57:10,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1164/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 2.1470767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:10,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43704 samples/s/p 6:09:57 } +2024-07-25 18:57:13,287 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1166/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.150769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:13,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43267 samples/s/p 6:10:12 } +2024-07-25 18:57:16,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1168/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 2.1544614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:16,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43520 samples/s/p 6:09:59 } +2024-07-25 18:57:19,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1170/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.1581538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:19,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43542 samples/s/p 6:09:55 } +2024-07-25 18:57:22,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1172/ 1625], loss: 1.240, per_step_time: 1476ms, lr: 2.1618462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:22,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.41792 samples/s/p 6:11:03 } +2024-07-25 18:57:25,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1174/ 1625], loss: 1.450, per_step_time: 1471ms, lr: 2.1655384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:25,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43839 samples/s/p 6:09:37 } +2024-07-25 18:57:28,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1176/ 1625], loss: 1.208, per_step_time: 1473ms, lr: 2.1692307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:28,052 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43100 samples/s/p 6:10:04 } +2024-07-25 18:57:31,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1178/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 2.1729229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:31,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43672 samples/s/p 6:09:38 } +2024-07-25 18:57:33,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1180/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 2.1766153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:33,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.43231 samples/s/p 6:09:53 } +2024-07-25 18:57:36,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1182/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.1803076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:36,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.43712 samples/s/p 6:09:30 } +2024-07-25 18:57:39,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1184/ 1625], loss: 1.212, per_step_time: 1473ms, lr: 2.1839998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:39,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.42955 samples/s/p 6:09:58 } +2024-07-25 18:57:42,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1186/ 1625], loss: 1.256, per_step_time: 1473ms, lr: 2.1876922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:42,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.43059 samples/s/p 6:09:51 } +2024-07-25 18:57:45,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1188/ 1625], loss: 1.028, per_step_time: 1475ms, lr: 2.1913846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:45,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.42250 samples/s/p 6:10:21 } +2024-07-25 18:57:48,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1190/ 1625], loss: 1.326, per_step_time: 1470ms, lr: 2.195077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:48,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.44091 samples/s/p 6:09:03 } +2024-07-25 18:57:51,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1192/ 1625], loss: 1.019, per_step_time: 1474ms, lr: 2.1987693e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:51,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.42530 samples/s/p 6:10:04 } +2024-07-25 18:57:54,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1194/ 1625], loss: 1.316, per_step_time: 1471ms, lr: 2.2024613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:54,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.43514 samples/s/p 6:09:20 } +2024-07-25 18:57:57,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1196/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 2.2061537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:57,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43749 samples/s/p 6:09:08 } +2024-07-25 18:58:00,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1198/ 1625], loss: 0.908, per_step_time: 1471ms, lr: 2.209846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:00,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43784 
samples/s/p 6:09:04 } +2024-07-25 18:58:03,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1200/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 2.2135384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:03,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43635 samples/s/p 6:09:07 } +2024-07-25 18:58:06,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1202/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 2.2172308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:06,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43176 samples/s/p 6:09:22 } +2024-07-25 18:58:09,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1204/ 1625], loss: 0.968, per_step_time: 1473ms, lr: 2.220923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:09,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43001 samples/s/p 6:09:27 } +2024-07-25 18:58:12,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1206/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 2.2246153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:12,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43503 samples/s/p 6:09:03 } +2024-07-25 18:58:15,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1208/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.2283077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:15,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43282 samples/s/p 6:09:09 } +2024-07-25 18:58:18,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1210/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 2.2319999e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:58:18,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43304 samples/s/p 6:09:05 } +2024-07-25 18:58:21,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1212/ 1625], loss: 1.206, per_step_time: 1470ms, lr: 2.2356922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:21,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.44214 samples/s/p 6:08:26 } +2024-07-25 18:58:24,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1214/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 2.2393844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:24,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43337 samples/s/p 6:08:58 } +2024-07-25 18:58:27,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1216/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 2.2430768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:27,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43862 samples/s/p 6:08:34 } +2024-07-25 18:58:30,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1218/ 1625], loss: 1.323, per_step_time: 1472ms, lr: 2.2467691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:30,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43400 samples/s/p 6:08:50 } +2024-07-25 18:58:32,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1220/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 2.2504615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:32,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43835 samples/s/p 6:08:29 } +2024-07-25 18:58:35,935 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1222/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 2.2541539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:35,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43392 samples/s/p 6:08:44 } +2024-07-25 18:58:38,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1224/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 2.257846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:38,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.42973 samples/s/p 6:08:58 } +2024-07-25 18:58:41,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1226/ 1625], loss: 1.000, per_step_time: 1471ms, lr: 2.2615384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:41,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43584 samples/s/p 6:08:31 } +2024-07-25 18:58:44,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1228/ 1625], loss: 0.934, per_step_time: 1471ms, lr: 2.2652306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:44,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43545 samples/s/p 6:08:29 } +2024-07-25 18:58:47,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1230/ 1625], loss: 1.198, per_step_time: 1474ms, lr: 2.268923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:47,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.42549 samples/s/p 6:09:07 } +2024-07-25 18:58:50,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1232/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 2.2726152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:50,698 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43335 samples/s/p 6:08:32 } +2024-07-25 18:58:53,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1234/ 1625], loss: 1.409, per_step_time: 1471ms, lr: 2.2763075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:53,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43663 samples/s/p 6:08:16 } +2024-07-25 18:58:56,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1236/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.2799999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:56,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43785 samples/s/p 6:08:08 } +2024-07-25 18:58:59,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1238/ 1625], loss: 1.015, per_step_time: 1471ms, lr: 2.2836923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:59,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43590 samples/s/p 6:08:13 } +2024-07-25 18:59:02,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1240/ 1625], loss: 1.335, per_step_time: 1471ms, lr: 2.2873846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:02,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43814 samples/s/p 6:08:01 } +2024-07-25 18:59:05,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1242/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.2910768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:05,448 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43631 samples/s/p 6:08:05 } +2024-07-25 18:59:08,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1244/ 1625], loss: 1.240, per_step_time: 1470ms, lr: 2.294769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:08,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.44042 samples/s/p 6:07:45 } +2024-07-25 18:59:11,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1246/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.2984614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:11,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.42947 samples/s/p 6:08:27 } +2024-07-25 18:59:14,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1248/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 2.3021537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:14,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43507 samples/s/p 6:08:01 } +2024-07-25 18:59:17,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1250/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.3058461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:17,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43520 samples/s/p 6:07:58 } +2024-07-25 18:59:20,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1252/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.3095383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:20,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43342 samples/s/p 6:08:02 } +2024-07-25 18:59:23,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1254/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 2.3132307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:23,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43760 
samples/s/p 6:07:42 } +2024-07-25 18:59:26,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1256/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 2.316923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:26,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43188 samples/s/p 6:08:02 } +2024-07-25 18:59:29,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1258/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.3206154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:29,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43545 samples/s/p 6:07:45 } +2024-07-25 18:59:32,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1260/ 1625], loss: 1.298, per_step_time: 1474ms, lr: 2.3243078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:32,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.42525 samples/s/p 6:08:24 } +2024-07-25 18:59:34,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1262/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.3279998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:34,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.42921 samples/s/p 6:08:04 } +2024-07-25 18:59:37,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1264/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.3316921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:37,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43614 samples/s/p 6:07:33 } +2024-07-25 18:59:40,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1266/ 1625], loss: 1.196, per_step_time: 1470ms, lr: 2.3353845e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:59:40,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43972 samples/s/p 6:07:16 } +2024-07-25 18:59:43,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1268/ 1625], loss: 1.083, per_step_time: 1470ms, lr: 2.3390769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:43,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43932 samples/s/p 6:07:15 } +2024-07-25 18:59:46,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1270/ 1625], loss: 1.068, per_step_time: 1472ms, lr: 2.3427692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:46,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43411 samples/s/p 6:07:33 } +2024-07-25 18:59:49,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1272/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.3464614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:49,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43556 samples/s/p 6:07:24 } +2024-07-25 18:59:52,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1274/ 1625], loss: 1.147, per_step_time: 1473ms, lr: 2.3501538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:52,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43046 samples/s/p 6:07:42 } +2024-07-25 18:59:55,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1276/ 1625], loss: 1.259, per_step_time: 1475ms, lr: 2.3538461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:55,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.42205 samples/s/p 6:08:13 } +2024-07-25 18:59:58,576 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1278/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 2.3575383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:58,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.44076 samples/s/p 6:06:54 } +2024-07-25 19:00:01,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1280/ 1625], loss: 1.207, per_step_time: 1470ms, lr: 2.3612307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:01,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.44101 samples/s/p 6:06:50 } +2024-07-25 19:00:04,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1282/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 2.3649229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:04,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.43207 samples/s/p 6:07:23 } +2024-07-25 19:00:07,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1284/ 1625], loss: 0.973, per_step_time: 1471ms, lr: 2.3686152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:07,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.43842 samples/s/p 6:06:55 } +2024-07-25 19:00:10,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1286/ 1625], loss: 0.877, per_step_time: 1471ms, lr: 2.3723076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:10,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.43580 samples/s/p 6:07:02 } +2024-07-25 19:00:13,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1288/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 2.376e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:13,327 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.43569 samples/s/p 6:07:00 } +2024-07-25 19:00:16,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1290/ 1625], loss: 1.248, per_step_time: 1473ms, lr: 2.3796923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:16,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.42953 samples/s/p 6:07:22 } +2024-07-25 19:00:19,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1292/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.3833845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:19,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.43111 samples/s/p 6:07:13 } +2024-07-25 19:00:22,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1294/ 1625], loss: 1.207, per_step_time: 1473ms, lr: 2.3870767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:22,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.42968 samples/s/p 6:07:15 } +2024-07-25 19:00:25,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1296/ 1625], loss: 1.267, per_step_time: 1470ms, lr: 2.390769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:25,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.44011 samples/s/p 6:06:30 } +2024-07-25 19:00:28,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1298/ 1625], loss: 1.293, per_step_time: 1471ms, lr: 2.3944614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:28,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.43689 samples/s/p 6:06:40 } +2024-07-25 19:00:31,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1300/ 1625], loss: 1.028, per_step_time: 1469ms, lr: 2.3981538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:31,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.44495 samples/s/p 6:06:05 } +2024-07-25 19:00:33,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1302/ 1625], loss: 1.347, per_step_time: 1473ms, lr: 2.401846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:33,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.43101 samples/s/p 6:06:58 } +2024-07-25 19:00:36,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1304/ 1625], loss: 1.201, per_step_time: 1474ms, lr: 2.4055384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:36,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.42410 samples/s/p 6:07:23 } +2024-07-25 19:00:39,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1306/ 1625], loss: 1.377, per_step_time: 1472ms, lr: 2.4092307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:39,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.43214 samples/s/p 6:06:48 } +2024-07-25 19:00:42,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1308/ 1625], loss: 0.997, per_step_time: 1471ms, lr: 2.4129231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:42,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.43689 samples/s/p 6:06:26 } +2024-07-25 19:00:45,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1310/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 2.4166153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:45,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.42985 
samples/s/p 6:06:51 } +2024-07-25 19:00:48,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1312/ 1625], loss: 1.032, per_step_time: 1470ms, lr: 2.4203075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:48,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.44162 samples/s/p 6:06:01 } +2024-07-25 19:00:51,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1314/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 2.4239998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:51,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.44215 samples/s/p 6:05:56 } +2024-07-25 19:00:54,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1316/ 1625], loss: 1.249, per_step_time: 1471ms, lr: 2.4276922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:54,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.43525 samples/s/p 6:06:20 } +2024-07-25 19:00:57,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1318/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 2.4313846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:57,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.43333 samples/s/p 6:06:25 } +2024-07-25 19:01:00,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1320/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 2.4350767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:00,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.43522 samples/s/p 6:06:15 } +2024-07-25 19:01:03,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1322/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 2.4387691e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 19:01:03,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.43406 samples/s/p 6:06:16 } +2024-07-25 19:01:06,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1324/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 2.4424615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:06,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.43012 samples/s/p 6:06:29 } +2024-07-25 19:01:09,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1326/ 1625], loss: 1.435, per_step_time: 1472ms, lr: 2.4461538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:09,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43210 samples/s/p 6:06:18 } +2024-07-25 19:01:12,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1328/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 2.449846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:12,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43517 samples/s/p 6:06:03 } +2024-07-25 19:01:15,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1330/ 1625], loss: 1.146, per_step_time: 1470ms, lr: 2.4535382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:15,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.44184 samples/s/p 6:05:33 } +2024-07-25 19:01:18,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1332/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.4572306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:18,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43760 samples/s/p 6:05:47 } +2024-07-25 19:01:21,204 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1334/ 1625], loss: 1.334, per_step_time: 1472ms, lr: 2.460923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:21,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43236 samples/s/p 6:06:06 } +2024-07-25 19:01:24,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1336/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.4646153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:24,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43692 samples/s/p 6:05:44 } +2024-07-25 19:01:27,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1338/ 1625], loss: 1.316, per_step_time: 1470ms, lr: 2.4683077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:27,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.44047 samples/s/p 6:05:27 } +2024-07-25 19:01:30,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1340/ 1625], loss: 1.336, per_step_time: 1472ms, lr: 2.4719999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:30,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43465 samples/s/p 6:05:48 } +2024-07-25 19:01:33,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1342/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 2.4756922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:33,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43344 samples/s/p 6:05:49 } +2024-07-25 19:01:35,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1344/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 2.4793844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:35,957 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43305 samples/s/p 6:05:48 } +2024-07-25 19:01:38,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1346/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.4830768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:38,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43489 samples/s/p 6:05:38 } +2024-07-25 19:01:41,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1348/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 2.4867692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:41,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43419 samples/s/p 6:05:38 } +2024-07-25 19:01:44,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1350/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 2.4904613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:44,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43531 samples/s/p 6:05:30 } +2024-07-25 19:01:47,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1352/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 2.4941537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:47,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43578 samples/s/p 6:05:25 } +2024-07-25 19:01:50,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1354/ 1625], loss: 1.318, per_step_time: 1471ms, lr: 2.497846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:50,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43721 samples/s/p 6:05:17 } +2024-07-25 19:01:53,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 1356/ 1625], loss: 1.040, per_step_time: 1471ms, lr: 2.5015384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:53,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43544 samples/s/p 6:05:21 } +2024-07-25 19:01:56,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1358/ 1625], loss: 1.326, per_step_time: 1472ms, lr: 2.5052308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:56,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43404 samples/s/p 6:05:24 } +2024-07-25 19:01:59,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1360/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 2.508923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:59,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43413 samples/s/p 6:05:20 } +2024-07-25 19:02:02,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1362/ 1625], loss: 1.286, per_step_time: 1473ms, lr: 2.5126152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:02,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43099 samples/s/p 6:05:30 } +2024-07-25 19:02:05,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1364/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.5163075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:05,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43752 samples/s/p 6:05:01 } +2024-07-25 19:02:08,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1366/ 1625], loss: 1.220, per_step_time: 1474ms, lr: 2.5199999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:08,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 
5.42699 samples/s/p 6:05:40 } +2024-07-25 19:02:11,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1368/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.5236923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:11,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43522 samples/s/p 6:05:04 } +2024-07-25 19:02:14,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1370/ 1625], loss: 1.032, per_step_time: 1471ms, lr: 2.5273845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:14,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43728 samples/s/p 6:04:53 } +2024-07-25 19:02:17,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1372/ 1625], loss: 1.337, per_step_time: 1471ms, lr: 2.5310768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:17,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43825 samples/s/p 6:04:46 } +2024-07-25 19:02:20,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1374/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 2.5347692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:20,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.43323 samples/s/p 6:05:03 } +2024-07-25 19:02:23,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1376/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.5384616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:23,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.43800 samples/s/p 6:04:41 } +2024-07-25 19:02:26,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1378/ 1625], loss: 1.107, per_step_time: 1473ms, lr: 2.5421536e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:26,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.42846 samples/s/p 6:05:17 } +2024-07-25 19:02:29,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1380/ 1625], loss: 1.206, per_step_time: 1472ms, lr: 2.545846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:29,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.43462 samples/s/p 6:04:49 } +2024-07-25 19:02:32,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1382/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 2.5495383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:32,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.43559 samples/s/p 6:04:42 } +2024-07-25 19:02:34,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1384/ 1625], loss: 1.138, per_step_time: 1473ms, lr: 2.5532307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:34,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.42797 samples/s/p 6:05:10 } +2024-07-25 19:02:37,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1386/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 2.556923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:37,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.42929 samples/s/p 6:05:01 } +2024-07-25 19:02:40,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1388/ 1625], loss: 1.102, per_step_time: 1474ms, lr: 2.5606152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:40,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.42632 samples/s/p 6:05:10 } +2024-07-25 19:02:43,844 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1390/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 2.5643076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:43,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43729 samples/s/p 6:04:23 } +2024-07-25 19:02:46,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1392/ 1625], loss: 1.372, per_step_time: 1471ms, lr: 2.568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:46,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43543 samples/s/p 6:04:28 } +2024-07-25 19:02:49,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1394/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 2.5716923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:49,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43687 samples/s/p 6:04:19 } +2024-07-25 19:02:52,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1396/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 2.5753845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:52,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43768 samples/s/p 6:04:13 } +2024-07-25 19:02:55,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1398/ 1625], loss: 1.091, per_step_time: 1470ms, lr: 2.5790767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:55,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.44122 samples/s/p 6:03:56 } +2024-07-25 19:02:58,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1400/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.582769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:58,592 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43611 samples/s/p 6:04:13 } +2024-07-25 19:02:58,592 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-25 19:03:35,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1402/ 1625], loss: 1.293, per_step_time: 1477ms, lr: 2.5864614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:35,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.41551 samples/s/p 6:05:34 } +2024-07-25 19:03:38,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1404/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.5901538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:38,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43224 samples/s/p 6:04:23 } +2024-07-25 19:03:41,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1406/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 2.5938461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:41,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43592 samples/s/p 6:04:05 } +2024-07-25 19:03:44,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1408/ 1625], loss: 1.193, per_step_time: 1470ms, lr: 2.5975383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:44,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43879 samples/s/p 6:03:51 } +2024-07-25 19:03:47,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1410/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 2.6012307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:47,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43690 samples/s/p 6:03:55 
} +2024-07-25 19:03:50,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1412/ 1625], loss: 1.320, per_step_time: 1471ms, lr: 2.6049229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:50,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43532 samples/s/p 6:03:59 } +2024-07-25 19:03:53,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1414/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 2.6086153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:53,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43152 samples/s/p 6:04:11 } +2024-07-25 19:03:56,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1416/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 2.6123076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:56,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43834 samples/s/p 6:03:41 } +2024-07-25 19:03:59,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1418/ 1625], loss: 1.287, per_step_time: 1473ms, lr: 2.6159998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:59,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43032 samples/s/p 6:04:10 } +2024-07-25 19:04:01,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1420/ 1625], loss: 1.193, per_step_time: 1473ms, lr: 2.6196922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:01,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.42963 samples/s/p 6:04:10 } +2024-07-25 19:04:04,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1422/ 1625], loss: 1.294, per_step_time: 1471ms, lr: 2.6233845e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:04:04,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.43543 samples/s/p 6:03:44 } +2024-07-25 19:04:07,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1424/ 1625], loss: 1.296, per_step_time: 1472ms, lr: 2.6270769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:07,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.43193 samples/s/p 6:03:55 } +2024-07-25 19:04:10,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1426/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 2.6307693e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:10,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.42905 samples/s/p 6:04:03 } +2024-07-25 19:04:13,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1428/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 2.6344613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:13,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.43955 samples/s/p 6:03:18 } +2024-07-25 19:04:16,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1430/ 1625], loss: 1.287, per_step_time: 1469ms, lr: 2.6381536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:16,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.44380 samples/s/p 6:02:58 } +2024-07-25 19:04:19,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1432/ 1625], loss: 1.201, per_step_time: 1470ms, lr: 2.641846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:19,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.44089 samples/s/p 6:03:07 } +2024-07-25 19:04:22,639 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 1/ 10], step:[ 1434/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.6455384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:22,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.43212 samples/s/p 6:03:39 } +2024-07-25 19:04:25,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1436/ 1625], loss: 1.027, per_step_time: 1470ms, lr: 2.6492307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:25,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.43909 samples/s/p 6:03:08 } +2024-07-25 19:04:28,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1438/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 2.652923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:28,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.44030 samples/s/p 6:03:01 } +2024-07-25 19:04:31,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1440/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 2.6566153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:31,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43503 samples/s/p 6:03:19 } +2024-07-25 19:04:34,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1442/ 1625], loss: 1.485, per_step_time: 1471ms, lr: 2.6603077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:34,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43614 samples/s/p 6:03:11 } +2024-07-25 19:04:37,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1444/ 1625], loss: 1.317, per_step_time: 1472ms, lr: 2.664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:37,390 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 8.9% |████ | 5.43182 samples/s/p 6:03:26 } +2024-07-25 19:04:40,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1446/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 2.6676922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:40,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43241 samples/s/p 6:03:20 } +2024-07-25 19:04:43,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1448/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.6713844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:43,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43190 samples/s/p 6:03:20 } +2024-07-25 19:04:46,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1450/ 1625], loss: 1.250, per_step_time: 1471ms, lr: 2.6750768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:46,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43833 samples/s/p 6:02:51 } +2024-07-25 19:04:49,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1452/ 1625], loss: 1.091, per_step_time: 1473ms, lr: 2.6787691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:49,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.42995 samples/s/p 6:03:22 } +2024-07-25 19:04:52,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1454/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 2.6824615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:52,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43360 samples/s/p 6:03:04 } +2024-07-25 19:04:55,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1456/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 
2.6861537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:55,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43203 samples/s/p 6:03:07 } +2024-07-25 19:04:58,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1458/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 2.689846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:58,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43064 samples/s/p 6:03:10 } +2024-07-25 19:05:01,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1460/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.6935384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:01,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43781 samples/s/p 6:02:38 } +2024-07-25 19:05:03,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1462/ 1625], loss: 1.251, per_step_time: 1470ms, lr: 2.6972306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:03,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.44139 samples/s/p 6:02:21 } +2024-07-25 19:05:06,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1464/ 1625], loss: 1.139, per_step_time: 1470ms, lr: 2.700923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:06,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.44123 samples/s/p 6:02:19 } +2024-07-25 19:05:09,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1466/ 1625], loss: 1.238, per_step_time: 1470ms, lr: 2.7046151e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:09,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43932 samples/s/p 6:02:23 } +2024-07-25 19:05:12,800 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1468/ 1625], loss: 1.059, per_step_time: 1472ms, lr: 2.7083075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:12,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43150 samples/s/p 6:02:52 } +2024-07-25 19:05:15,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1470/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 2.7119999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:15,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43582 samples/s/p 6:02:32 } +2024-07-25 19:05:18,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1472/ 1625], loss: 1.116, per_step_time: 1473ms, lr: 2.7156922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:18,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.43034 samples/s/p 6:02:50 } +2024-07-25 19:05:21,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1474/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 2.7193846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:21,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.44175 samples/s/p 6:02:02 } +2024-07-25 19:05:24,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1476/ 1625], loss: 1.106, per_step_time: 1474ms, lr: 2.7230768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:24,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.42702 samples/s/p 6:02:58 } +2024-07-25 19:05:27,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1478/ 1625], loss: 1.244, per_step_time: 1471ms, lr: 2.7267692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:27,564 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.43481 samples/s/p 6:02:24 } +2024-07-25 19:05:30,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1480/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 2.7304613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:30,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.43437 samples/s/p 6:02:23 } +2024-07-25 19:05:33,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1482/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 2.7341537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:33,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.43417 samples/s/p 6:02:20 } +2024-07-25 19:05:36,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1484/ 1625], loss: 1.093, per_step_time: 1473ms, lr: 2.737846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:36,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.42773 samples/s/p 6:02:43 } +2024-07-25 19:05:39,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1486/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 2.7415383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:39,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.42898 samples/s/p 6:02:35 } +2024-07-25 19:05:42,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1488/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 2.7452306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:42,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43296 samples/s/p 6:02:16 } +2024-07-25 19:05:45,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 1490/ 1625], loss: 1.343, per_step_time: 1471ms, lr: 2.748923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:45,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43571 samples/s/p 6:02:03 } +2024-07-25 19:05:48,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1492/ 1625], loss: 1.239, per_step_time: 1472ms, lr: 2.7526154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:48,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43424 samples/s/p 6:02:05 } +2024-07-25 19:05:51,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1494/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.7563077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:51,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43408 samples/s/p 6:02:03 } +2024-07-25 19:05:54,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1496/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 2.7599997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:54,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43542 samples/s/p 6:01:55 } +2024-07-25 19:05:57,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1498/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.7636921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:57,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43218 samples/s/p 6:02:05 } +2024-07-25 19:06:00,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1500/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 2.7673845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:00,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 
5.43479 samples/s/p 6:01:51 } +2024-07-25 19:06:02,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1502/ 1625], loss: 1.313, per_step_time: 1472ms, lr: 2.7710768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:02,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43265 samples/s/p 6:01:57 } +2024-07-25 19:06:05,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1504/ 1625], loss: 1.168, per_step_time: 1473ms, lr: 2.7747692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:05,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.42755 samples/s/p 6:02:15 } +2024-07-25 19:06:08,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1506/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 2.7784614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:08,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43709 samples/s/p 6:01:33 } +2024-07-25 19:06:11,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1508/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 2.7821538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:11,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43471 samples/s/p 6:01:40 } +2024-07-25 19:06:14,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1510/ 1625], loss: 1.420, per_step_time: 1473ms, lr: 2.7858461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:14,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43078 samples/s/p 6:01:53 } +2024-07-25 19:06:17,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1512/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.7895383e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:17,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43418 samples/s/p 6:01:36 } +2024-07-25 19:06:20,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1514/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.7932307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:20,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43249 samples/s/p 6:01:40 } +2024-07-25 19:06:23,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1516/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 2.7969229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:23,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.42825 samples/s/p 6:01:54 } +2024-07-25 19:06:26,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1518/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.8006152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:26,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43985 samples/s/p 6:01:05 } +2024-07-25 19:06:29,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1520/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.8043076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:29,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43373 samples/s/p 6:01:26 } +2024-07-25 19:06:32,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1522/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 2.808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:32,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43288 samples/s/p 6:01:27 } +2024-07-25 19:06:35,459 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1524/ 1625], loss: 1.341, per_step_time: 1472ms, lr: 2.8116921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:35,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43251 samples/s/p 6:01:25 } +2024-07-25 19:06:38,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1526/ 1625], loss: 1.165, per_step_time: 1474ms, lr: 2.8153845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:38,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.42684 samples/s/p 6:01:45 } +2024-07-25 19:06:41,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1528/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 2.8190769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:41,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43421 samples/s/p 6:01:13 } +2024-07-25 19:06:44,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1530/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.822769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:44,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43805 samples/s/p 6:00:54 } +2024-07-25 19:06:47,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1532/ 1625], loss: 1.023, per_step_time: 1473ms, lr: 2.8264614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:47,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.42941 samples/s/p 6:01:26 } +2024-07-25 19:06:50,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1534/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.8301536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:50,220 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43726 samples/s/p 6:00:52 } +2024-07-25 19:06:53,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1536/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 2.833846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:53,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43953 samples/s/p 6:00:40 } +2024-07-25 19:06:56,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1538/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 2.8375383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:56,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43839 samples/s/p 6:00:41 } +2024-07-25 19:06:59,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1540/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 2.8412307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:59,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43609 samples/s/p 6:00:47 } +2024-07-25 19:07:02,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1542/ 1625], loss: 1.238, per_step_time: 1473ms, lr: 2.844923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:02,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43105 samples/s/p 6:01:05 } +2024-07-25 19:07:04,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1544/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.8486153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:04,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43209 samples/s/p 6:00:57 } +2024-07-25 19:07:07,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 1546/ 1625], loss: 0.967, per_step_time: 1475ms, lr: 2.8523074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:07,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.42354 samples/s/p 6:01:29 } +2024-07-25 19:07:10,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1548/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 2.8559998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:10,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43201 samples/s/p 6:00:52 } +2024-07-25 19:07:13,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1550/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.8596922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:13,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43214 samples/s/p 6:00:48 } +2024-07-25 19:07:16,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1552/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 2.8633845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:16,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43709 samples/s/p 6:00:26 } +2024-07-25 19:07:19,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1554/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 2.8670767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:19,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43199 samples/s/p 6:00:43 } +2024-07-25 19:07:22,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1556/ 1625], loss: 1.209, per_step_time: 1473ms, lr: 2.8707691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:22,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 
5.42801 samples/s/p 6:00:56 } +2024-07-25 19:07:25,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1558/ 1625], loss: 1.307, per_step_time: 1472ms, lr: 2.8744615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:25,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43406 samples/s/p 6:00:29 } +2024-07-25 19:07:28,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1560/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.8781538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:28,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43581 samples/s/p 6:00:19 } +2024-07-25 19:07:31,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1562/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.8818462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:31,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43157 samples/s/p 6:00:33 } +2024-07-25 19:07:34,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1564/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 2.8855382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:34,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43588 samples/s/p 6:00:13 } +2024-07-25 19:07:37,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1566/ 1625], loss: 1.233, per_step_time: 1474ms, lr: 2.8892306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:37,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.42613 samples/s/p 6:00:49 } +2024-07-25 19:07:40,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1568/ 1625], loss: 1.261, per_step_time: 1473ms, lr: 2.892923e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:40,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.42939 samples/s/p 6:00:33 } +2024-07-25 19:07:43,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1570/ 1625], loss: 1.160, per_step_time: 1473ms, lr: 2.8966153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:43,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.42867 samples/s/p 6:00:33 } +2024-07-25 19:07:46,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1572/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 2.9003077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:46,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43082 samples/s/p 6:00:21 } +2024-07-25 19:07:49,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1574/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 2.9039998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:49,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43724 samples/s/p 5:59:53 } +2024-07-25 19:07:52,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1576/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.9076922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:52,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43336 samples/s/p 6:00:05 } +2024-07-25 19:07:55,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1578/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 2.9113846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:55,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43326 samples/s/p 6:00:03 } +2024-07-25 19:07:58,118 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1580/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 2.9150768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:58,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.44027 samples/s/p 5:59:32 } +2024-07-25 19:08:01,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1582/ 1625], loss: 1.286, per_step_time: 1471ms, lr: 2.9187691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:01,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43750 samples/s/p 5:59:40 } +2024-07-25 19:08:04,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1584/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.9224613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:04,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43557 samples/s/p 5:59:45 } +2024-07-25 19:08:06,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1586/ 1625], loss: 1.325, per_step_time: 1471ms, lr: 2.9261537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:06,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43829 samples/s/p 5:59:31 } +2024-07-25 19:08:09,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1588/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 2.929846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:09,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43596 samples/s/p 5:59:37 } +2024-07-25 19:08:12,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1590/ 1625], loss: 1.431, per_step_time: 1471ms, lr: 2.9335384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:12,869 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43636 samples/s/p 5:59:33 } +2024-07-25 19:08:15,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1592/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 2.9372306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:15,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43266 samples/s/p 5:59:44 } +2024-07-25 19:08:18,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1594/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.940923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:18,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43484 samples/s/p 5:59:33 } +2024-07-25 19:08:21,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1596/ 1625], loss: 1.151, per_step_time: 1475ms, lr: 2.9446152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:21,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.42204 samples/s/p 6:00:21 } +2024-07-25 19:08:24,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1598/ 1625], loss: 1.191, per_step_time: 1470ms, lr: 2.9483075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:24,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.44106 samples/s/p 5:59:02 } +2024-07-25 19:08:27,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1600/ 1625], loss: 1.003, per_step_time: 1471ms, lr: 2.9519999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:27,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43702 samples/s/p 5:59:15 } +2024-07-25 19:08:30,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 1602/ 1625], loss: 1.086, per_step_time: 1473ms, lr: 2.955692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:30,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43099 samples/s/p 5:59:36 } +2024-07-25 19:08:33,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1604/ 1625], loss: 1.128, per_step_time: 1474ms, lr: 2.9593844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:33,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.42525 samples/s/p 5:59:56 } +2024-07-25 19:08:36,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1606/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 2.9630768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:36,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43482 samples/s/p 5:59:15 } +2024-07-25 19:08:39,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1608/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 2.9667692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:39,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43137 samples/s/p 5:59:26 } +2024-07-25 19:08:42,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1610/ 1625], loss: 1.243, per_step_time: 1474ms, lr: 2.9704615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:42,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.42381 samples/s/p 5:59:53 } +2024-07-25 19:08:45,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1612/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.9741537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:45,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 
5.43765 samples/s/p 5:58:55 } +2024-07-25 19:08:48,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1614/ 1625], loss: 1.043, per_step_time: 1472ms, lr: 2.9778459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:48,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43421 samples/s/p 5:59:06 } +2024-07-25 19:08:51,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1616/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 2.9815383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:51,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43138 samples/s/p 5:59:14 } +2024-07-25 19:08:54,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1618/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 2.9852306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:54,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.44138 samples/s/p 5:58:32 } +2024-07-25 19:08:57,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1620/ 1625], loss: 1.004, per_step_time: 1472ms, lr: 2.988923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:57,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.43342 samples/s/p 5:59:00 } +2024-07-25 19:09:00,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1622/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 2.9926152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:00,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.43674 samples/s/p 5:58:44 } +2024-07-25 19:09:03,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1624/ 1625], loss: 1.311, per_step_time: 1472ms, lr: 2.9963076e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:03,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.43249 samples/s/p 5:58:58 } +2024-07-25 19:09:06,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1/ 1625], loss: 1.243, per_step_time: 1478ms, lr: 3e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:06,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.41143 samples/s/p 6:00:19 } +2024-07-25 19:09:08,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 3/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 2.9999997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:08,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.43844 samples/s/p 5:58:29 } +2024-07-25 19:09:11,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 5/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 2.9999994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:11,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.43446 samples/s/p 5:58:41 } +2024-07-25 19:09:14,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 7/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.9999987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:14,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.43366 samples/s/p 5:58:42 } +2024-07-25 19:09:17,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 9/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 2.999998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:17,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43563 samples/s/p 5:58:31 } +2024-07-25 19:09:20,777 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 11/ 1625], loss: 1.291, per_step_time: 1473ms, lr: 2.9999967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:20,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43039 samples/s/p 5:58:49 } +2024-07-25 19:09:23,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 13/ 1625], loss: 1.141, per_step_time: 1474ms, lr: 2.9999952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:23,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.42537 samples/s/p 5:59:06 } +2024-07-25 19:09:26,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 15/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.9999934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:26,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43549 samples/s/p 5:58:23 } +2024-07-25 19:09:29,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 17/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.9999912e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:29,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43446 samples/s/p 5:58:24 } +2024-07-25 19:09:32,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 19/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 2.999989e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:32,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43536 samples/s/p 5:58:17 } +2024-07-25 19:09:35,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 21/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 2.9999865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:35,537 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43436 samples/s/p 5:58:18 } +2024-07-25 19:09:38,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 23/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 2.9999837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:38,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43949 samples/s/p 5:57:55 } +2024-07-25 19:09:41,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 25/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.9999806e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:41,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43792 samples/s/p 5:57:58 } +2024-07-25 19:09:44,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 27/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.9999774e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:44,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43712 samples/s/p 5:57:59 } +2024-07-25 19:09:47,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 29/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 2.9999737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:47,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43752 samples/s/p 5:57:54 } +2024-07-25 19:09:50,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 31/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 2.99997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:50,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43759 samples/s/p 5:57:51 } +2024-07-25 19:09:53,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], 
step:[ 33/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 2.9999657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:53,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43467 samples/s/p 5:57:59 } +2024-07-25 19:09:56,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 35/ 1625], loss: 1.368, per_step_time: 1470ms, lr: 2.9999612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:56,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43852 samples/s/p 5:57:41 } +2024-07-25 19:09:59,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 37/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.9999566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:59,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43824 samples/s/p 5:57:39 } +2024-07-25 19:10:02,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 39/ 1625], loss: 1.130, per_step_time: 1470ms, lr: 2.9999517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:02,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43982 samples/s/p 5:57:30 } +2024-07-25 19:10:05,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 41/ 1625], loss: 1.074, per_step_time: 1470ms, lr: 2.9999464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:05,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.44026 samples/s/p 5:57:26 } +2024-07-25 19:10:07,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 43/ 1625], loss: 1.150, per_step_time: 1473ms, lr: 2.9999408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:07,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 
5.43105 samples/s/p 5:57:59 } +2024-07-25 19:10:10,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 45/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 2.9999354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:10,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.43973 samples/s/p 5:57:22 } +2024-07-25 19:10:13,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 47/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.999929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:13,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.43609 samples/s/p 5:57:33 } +2024-07-25 19:10:16,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 49/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.9999228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:16,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.43653 samples/s/p 5:57:28 } +2024-07-25 19:10:19,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 51/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.9999163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:19,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.43487 samples/s/p 5:57:32 } +2024-07-25 19:10:22,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 53/ 1625], loss: 1.074, per_step_time: 1474ms, lr: 2.9999095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:22,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.42413 samples/s/p 5:58:12 } +2024-07-25 19:10:25,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 55/ 1625], loss: 1.008, per_step_time: 1470ms, lr: 2.9999024e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 19:10:25,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.44215 samples/s/p 5:56:58 } +2024-07-25 19:10:28,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 57/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 2.999895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:28,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43260 samples/s/p 5:57:32 } +2024-07-25 19:10:31,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 59/ 1625], loss: 1.166, per_step_time: 1470ms, lr: 2.9998875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:31,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43870 samples/s/p 5:57:05 } +2024-07-25 19:10:34,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 61/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 2.9998797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:34,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.42923 samples/s/p 5:57:40 } +2024-07-25 19:10:37,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 63/ 1625], loss: 1.290, per_step_time: 1472ms, lr: 2.9998713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:37,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43249 samples/s/p 5:57:24 } +2024-07-25 19:10:40,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 65/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 2.999863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:40,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.42817 samples/s/p 5:57:38 } +2024-07-25 19:10:43,404 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 67/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 2.9998542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:43,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43180 samples/s/p 5:57:21 } +2024-07-25 19:10:46,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 69/ 1625], loss: 1.280, per_step_time: 1473ms, lr: 2.9998453e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:46,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.42868 samples/s/p 5:57:30 } +2024-07-25 19:10:49,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 71/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.999836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:49,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43671 samples/s/p 5:56:55 } +2024-07-25 19:10:52,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 73/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.9998266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:52,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43479 samples/s/p 5:57:00 } +2024-07-25 19:10:55,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 75/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.9998168e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:55,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43821 samples/s/p 5:56:44 } +2024-07-25 19:10:58,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 77/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.9998067e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:58,159 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43576 samples/s/p 5:56:50 } +2024-07-25 19:11:01,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 79/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 2.9997964e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:01,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43645 samples/s/p 5:56:45 } +2024-07-25 19:11:04,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 81/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.9997858e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:04,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43316 samples/s/p 5:56:55 } +2024-07-25 19:11:07,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 83/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 2.999775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:07,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.42752 samples/s/p 5:57:14 } +2024-07-25 19:11:09,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 85/ 1625], loss: 1.437, per_step_time: 1471ms, lr: 2.9997638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:09,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43570 samples/s/p 5:56:39 } +2024-07-25 19:11:12,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 87/ 1625], loss: 1.165, per_step_time: 1474ms, lr: 2.9997524e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:12,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.42652 samples/s/p 5:57:12 } +2024-07-25 19:11:15,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], 
step:[ 89/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.9997409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:15,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43713 samples/s/p 5:56:27 } +2024-07-25 19:11:18,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 91/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 2.9997289e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:18,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43397 samples/s/p 5:56:37 } +2024-07-25 19:11:21,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 93/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 2.9997167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:21,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43092 samples/s/p 5:56:46 } +2024-07-25 19:11:24,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 95/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 2.9997043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:24,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43357 samples/s/p 5:56:32 } +2024-07-25 19:11:27,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 97/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 2.9996916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:27,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43301 samples/s/p 5:56:32 } +2024-07-25 19:11:30,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 99/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.9996787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:30,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 
5.43278 samples/s/p 5:56:30 } +2024-07-25 19:11:33,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 101/ 1625], loss: 1.156, per_step_time: 1469ms, lr: 2.9996652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:33,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.44321 samples/s/p 5:55:46 } +2024-07-25 19:11:36,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 103/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 2.9996518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:36,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43134 samples/s/p 5:56:29 } +2024-07-25 19:11:39,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 105/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 2.9996381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:39,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43744 samples/s/p 5:56:02 } +2024-07-25 19:11:42,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 107/ 1625], loss: 1.100, per_step_time: 1474ms, lr: 2.9996241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:42,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.42409 samples/s/p 5:56:52 } +2024-07-25 19:11:45,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 109/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 2.9996096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:45,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43735 samples/s/p 5:55:57 } +2024-07-25 19:11:48,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 111/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 2.999595e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:48,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43595 samples/s/p 5:56:00 } +2024-07-25 19:11:51,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 113/ 1625], loss: 1.277, per_step_time: 1473ms, lr: 2.9995803e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:51,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43081 samples/s/p 5:56:17 } +2024-07-25 19:11:54,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 115/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 2.9995652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:54,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43606 samples/s/p 5:55:53 } +2024-07-25 19:11:57,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 117/ 1625], loss: 1.277, per_step_time: 1472ms, lr: 2.9995497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:57,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43346 samples/s/p 5:56:00 } +2024-07-25 19:12:00,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 119/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.9995343e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:00,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43192 samples/s/p 5:56:04 } +2024-07-25 19:12:03,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 121/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 2.9995184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:03,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.42993 samples/s/p 5:56:08 } +2024-07-25 19:12:06,054 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 123/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 2.999502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:06,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43155 samples/s/p 5:55:59 } +2024-07-25 19:12:09,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 125/ 1625], loss: 0.999, per_step_time: 1470ms, lr: 2.9994857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:09,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.44015 samples/s/p 5:55:22 } +2024-07-25 19:12:11,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 127/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 2.9994688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:11,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43387 samples/s/p 5:55:44 } +2024-07-25 19:12:14,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 129/ 1625], loss: 1.293, per_step_time: 1473ms, lr: 2.999452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:14,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.42946 samples/s/p 5:55:59 } +2024-07-25 19:12:17,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 131/ 1625], loss: 1.050, per_step_time: 1470ms, lr: 2.9994346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:17,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43879 samples/s/p 5:55:19 } +2024-07-25 19:12:20,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 133/ 1625], loss: 1.331, per_step_time: 1471ms, lr: 2.9994171e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:12:20,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43777 samples/s/p 5:55:20 } +2024-07-25 19:12:23,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 135/ 1625], loss: 1.199, per_step_time: 1473ms, lr: 2.9993993e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:23,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.42818 samples/s/p 5:55:55 } +2024-07-25 19:12:26,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 137/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 2.9993813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:26,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43187 samples/s/p 5:55:37 } +2024-07-25 19:12:29,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 139/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 2.9993627e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:29,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43265 samples/s/p 5:55:31 } +2024-07-25 19:12:32,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 141/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 2.9993444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:32,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43370 samples/s/p 5:55:24 } +2024-07-25 19:12:35,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 143/ 1625], loss: 1.100, per_step_time: 1473ms, lr: 2.9993254e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:35,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.42940 samples/s/p 5:55:38 } +2024-07-25 19:12:38,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 2/ 10], step:[ 145/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 2.9993065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:38,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43072 samples/s/p 5:55:30 } +2024-07-25 19:12:41,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 147/ 1625], loss: 1.284, per_step_time: 1469ms, lr: 2.9992867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:41,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.44326 samples/s/p 5:54:38 } +2024-07-25 19:12:44,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 149/ 1625], loss: 1.372, per_step_time: 1473ms, lr: 2.9992674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:44,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.42845 samples/s/p 5:55:33 } +2024-07-25 19:12:47,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 151/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 2.9992474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:47,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43382 samples/s/p 5:55:09 } +2024-07-25 19:12:50,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 153/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 2.9992269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:50,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43441 samples/s/p 5:55:04 } +2024-07-25 19:12:53,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 155/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 2.9992065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:53,281 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 11.0% |█████ | 5.43334 samples/s/p 5:55:05 } +2024-07-25 19:12:56,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 157/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 2.9991857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:56,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43352 samples/s/p 5:55:01 } +2024-07-25 19:12:59,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 159/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 2.9991646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:59,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43330 samples/s/p 5:54:59 } +2024-07-25 19:13:02,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 161/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.9991435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:02,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43681 samples/s/p 5:54:43 } +2024-07-25 19:13:05,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 163/ 1625], loss: 1.258, per_step_time: 1471ms, lr: 2.9991223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:05,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43516 samples/s/p 5:54:46 } +2024-07-25 19:13:08,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 165/ 1625], loss: 1.290, per_step_time: 1473ms, lr: 2.9991003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:08,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43059 samples/s/p 5:55:01 } +2024-07-25 19:13:10,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 167/ 1625], loss: 1.218, per_step_time: 
1472ms, lr: 2.999078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:10,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43209 samples/s/p 5:54:52 } +2024-07-25 19:13:13,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 169/ 1625], loss: 1.446, per_step_time: 1471ms, lr: 2.9990559e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:13,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43842 samples/s/p 5:54:25 } +2024-07-25 19:13:16,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 171/ 1625], loss: 1.354, per_step_time: 1472ms, lr: 2.9990333e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:16,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.43248 samples/s/p 5:54:45 } +2024-07-25 19:13:19,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 173/ 1625], loss: 1.360, per_step_time: 1472ms, lr: 2.9990104e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:19,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.43111 samples/s/p 5:54:47 } +2024-07-25 19:13:22,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 175/ 1625], loss: 1.309, per_step_time: 1471ms, lr: 2.9989871e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:22,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.43541 samples/s/p 5:54:27 } +2024-07-25 19:13:25,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 177/ 1625], loss: 0.964, per_step_time: 1472ms, lr: 2.9989636e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:25,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.43239 samples/s/p 5:54:36 } +2024-07-25 
19:13:28,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 179/ 1625], loss: 1.317, per_step_time: 1473ms, lr: 2.99894e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:28,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.42847 samples/s/p 5:54:49 } +2024-07-25 19:13:31,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 181/ 1625], loss: 1.043, per_step_time: 1471ms, lr: 2.9989162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:31,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.43791 samples/s/p 5:54:09 } +2024-07-25 19:13:34,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 183/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 2.998892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:34,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.44069 samples/s/p 5:53:55 } +2024-07-25 19:13:37,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 185/ 1625], loss: 1.213, per_step_time: 1473ms, lr: 2.9988674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:37,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.43098 samples/s/p 5:54:30 } +2024-07-25 19:13:40,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 187/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.9988425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:40,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43425 samples/s/p 5:54:14 } +2024-07-25 19:13:43,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 189/ 1625], loss: 1.393, per_step_time: 1472ms, lr: 2.9988176e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:13:43,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43123 samples/s/p 5:54:23 } +2024-07-25 19:13:46,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 191/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.9987923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:46,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43172 samples/s/p 5:54:18 } +2024-07-25 19:13:49,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 193/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 2.9987668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:49,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43372 samples/s/p 5:54:08 } +2024-07-25 19:13:52,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 195/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.9987412e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:52,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43185 samples/s/p 5:54:12 } +2024-07-25 19:13:55,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 197/ 1625], loss: 1.166, per_step_time: 1469ms, lr: 2.998715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:55,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.44224 samples/s/p 5:53:28 } +2024-07-25 19:13:58,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 199/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 2.9986886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:58,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43180 samples/s/p 5:54:06 } +2024-07-25 19:14:01,170 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 201/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 2.9986619e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:01,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43706 samples/s/p 5:53:43 } +2024-07-25 19:14:04,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 203/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.9986351e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:04,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43344 samples/s/p 5:53:54 } +2024-07-25 19:14:07,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 205/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 2.9986079e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:07,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43744 samples/s/p 5:53:35 } +2024-07-25 19:14:10,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 207/ 1625], loss: 1.261, per_step_time: 1474ms, lr: 2.9985804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:10,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.42717 samples/s/p 5:54:13 } +2024-07-25 19:14:12,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 209/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.9985527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:12,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43216 samples/s/p 5:53:50 } +2024-07-25 19:14:15,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 211/ 1625], loss: 1.136, per_step_time: 1474ms, lr: 2.9985247e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:14:15,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.42664 samples/s/p 5:54:09 } +2024-07-25 19:14:18,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 213/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 2.9984965e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:18,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43649 samples/s/p 5:53:27 } +2024-07-25 19:14:21,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 215/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 2.9984682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:21,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43309 samples/s/p 5:53:38 } +2024-07-25 19:14:24,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 217/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 2.9984394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:24,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43706 samples/s/p 5:53:19 } +2024-07-25 19:14:27,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 219/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 2.9984103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:27,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43099 samples/s/p 5:53:40 } +2024-07-25 19:14:30,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 221/ 1625], loss: 1.368, per_step_time: 1471ms, lr: 2.998381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:30,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43656 samples/s/p 5:53:15 } +2024-07-25 19:14:33,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 2/ 10], step:[ 223/ 1625], loss: 1.312, per_step_time: 1472ms, lr: 2.9983512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:33,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43351 samples/s/p 5:53:24 } +2024-07-25 19:14:36,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 225/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 2.9983215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:36,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43426 samples/s/p 5:53:18 } +2024-07-25 19:14:39,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 227/ 1625], loss: 1.310, per_step_time: 1472ms, lr: 2.9982915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:39,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43371 samples/s/p 5:53:18 } +2024-07-25 19:14:42,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 229/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 2.9982612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:42,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43847 samples/s/p 5:52:56 } +2024-07-25 19:14:45,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 231/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 2.9982306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:45,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.42873 samples/s/p 5:53:31 } +2024-07-25 19:14:48,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 233/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 2.9981999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:48,401 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 11.4% |█████ | 5.43323 samples/s/p 5:53:11 } +2024-07-25 19:14:51,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 235/ 1625], loss: 1.063, per_step_time: 1473ms, lr: 2.9981686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:51,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.42859 samples/s/p 5:53:26 } +2024-07-25 19:14:54,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 237/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 2.998137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:54,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.43583 samples/s/p 5:52:55 } +2024-07-25 19:14:57,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 239/ 1625], loss: 1.256, per_step_time: 1470ms, lr: 2.9981054e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:57,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.44132 samples/s/p 5:52:30 } +2024-07-25 19:15:00,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 241/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 2.9980733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:00,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.43754 samples/s/p 5:52:42 } +2024-07-25 19:15:03,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 243/ 1625], loss: 1.040, per_step_time: 1473ms, lr: 2.9980412e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:03,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.42812 samples/s/p 5:53:16 } +2024-07-25 19:15:06,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 245/ 1625], loss: 1.279, per_step_time: 1473ms, 
lr: 2.9980087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:06,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.42845 samples/s/p 5:53:12 } +2024-07-25 19:15:09,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 247/ 1625], loss: 1.204, per_step_time: 1473ms, lr: 2.997976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:09,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.42761 samples/s/p 5:53:12 } +2024-07-25 19:15:12,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 249/ 1625], loss: 1.375, per_step_time: 1472ms, lr: 2.9979428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:12,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.43263 samples/s/p 5:52:49 } +2024-07-25 19:15:14,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 251/ 1625], loss: 1.068, per_step_time: 1472ms, lr: 2.9979094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:14,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.43413 samples/s/p 5:52:41 } +2024-07-25 19:15:17,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 253/ 1625], loss: 1.250, per_step_time: 1470ms, lr: 2.9978759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:17,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.44089 samples/s/p 5:52:11 } +2024-07-25 19:15:20,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 255/ 1625], loss: 1.137, per_step_time: 1469ms, lr: 2.997842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:20,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.44225 samples/s/p 5:52:03 } +2024-07-25 
19:15:23,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 257/ 1625], loss: 1.338, per_step_time: 1472ms, lr: 2.9978082e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:23,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43309 samples/s/p 5:52:36 } +2024-07-25 19:15:26,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 259/ 1625], loss: 0.979, per_step_time: 1471ms, lr: 2.9977735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:26,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43810 samples/s/p 5:52:13 } +2024-07-25 19:15:29,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 261/ 1625], loss: 1.060, per_step_time: 1470ms, lr: 2.997739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:29,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.44029 samples/s/p 5:52:02 } +2024-07-25 19:15:32,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 263/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 2.997704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:32,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.44006 samples/s/p 5:52:00 } +2024-07-25 19:15:35,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 265/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 2.9976689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:35,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43441 samples/s/p 5:52:19 } +2024-07-25 19:15:38,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 267/ 1625], loss: 1.371, per_step_time: 1471ms, lr: 2.9976336e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:15:38,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43716 samples/s/p 5:52:05 } +2024-07-25 19:15:41,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 269/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 2.9975978e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:41,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43254 samples/s/p 5:52:20 } +2024-07-25 19:15:44,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 271/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 2.9975616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:44,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43898 samples/s/p 5:51:52 } +2024-07-25 19:15:47,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 273/ 1625], loss: 1.109, per_step_time: 1471ms, lr: 2.9975256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:47,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43645 samples/s/p 5:51:59 } +2024-07-25 19:15:50,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 275/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 2.997489e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:50,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43475 samples/s/p 5:52:03 } +2024-07-25 19:15:53,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 277/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 2.997452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:53,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43262 samples/s/p 5:52:08 } +2024-07-25 19:15:56,273 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 279/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 2.9974155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:56,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43299 samples/s/p 5:52:04 } +2024-07-25 19:15:59,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 281/ 1625], loss: 1.244, per_step_time: 1470ms, lr: 2.9973779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:59,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43890 samples/s/p 5:51:38 } +2024-07-25 19:16:02,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 283/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 2.9973404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:02,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43518 samples/s/p 5:51:49 } +2024-07-25 19:16:05,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 285/ 1625], loss: 1.124, per_step_time: 1470ms, lr: 2.9973024e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:05,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.44070 samples/s/p 5:51:25 } +2024-07-25 19:16:08,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 287/ 1625], loss: 1.245, per_step_time: 1471ms, lr: 2.9972643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:08,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43541 samples/s/p 5:51:43 } +2024-07-25 19:16:11,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 289/ 1625], loss: 1.221, per_step_time: 1473ms, lr: 2.997226e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:16:11,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.42817 samples/s/p 5:52:08 } +2024-07-25 19:16:13,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 291/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.9971872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:13,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43196 samples/s/p 5:51:50 } +2024-07-25 19:16:16,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 293/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.9971485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:16,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43189 samples/s/p 5:51:47 } +2024-07-25 19:16:19,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 295/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 2.9971094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:19,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43150 samples/s/p 5:51:46 } +2024-07-25 19:16:22,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 297/ 1625], loss: 0.980, per_step_time: 1470ms, lr: 2.9970697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:22,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43870 samples/s/p 5:51:15 } +2024-07-25 19:16:25,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 299/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 2.9970299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:25,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43831 samples/s/p 5:51:14 } +2024-07-25 19:16:28,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 2/ 10], step:[ 301/ 1625], loss: 1.029, per_step_time: 1472ms, lr: 2.9969902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:28,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.43132 samples/s/p 5:51:38 } +2024-07-25 19:16:31,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 303/ 1625], loss: 1.262, per_step_time: 1474ms, lr: 2.99695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:31,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.42664 samples/s/p 5:51:53 } +2024-07-25 19:16:34,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 305/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.9969093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:34,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.43579 samples/s/p 5:51:15 } +2024-07-25 19:16:37,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 307/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 2.9968685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:37,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.44151 samples/s/p 5:50:50 } +2024-07-25 19:16:40,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 309/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 2.9968276e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:40,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.43293 samples/s/p 5:51:20 } +2024-07-25 19:16:43,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 311/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 2.9967863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:43,492 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 11.9% |█████ | 5.43892 samples/s/p 5:50:54 } +2024-07-25 19:16:46,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 313/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 2.9967445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:46,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.43167 samples/s/p 5:51:19 } +2024-07-25 19:16:49,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 315/ 1625], loss: 1.219, per_step_time: 1469ms, lr: 2.9967028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:49,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.44379 samples/s/p 5:50:29 } +2024-07-25 19:16:52,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 317/ 1625], loss: 1.065, per_step_time: 1473ms, lr: 2.9966604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:52,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.42961 samples/s/p 5:51:21 } +2024-07-25 19:16:55,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 319/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 2.9966182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:55,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.43536 samples/s/p 5:50:56 } +2024-07-25 19:16:58,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 321/ 1625], loss: 1.310, per_step_time: 1472ms, lr: 2.9965757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:58,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.43349 samples/s/p 5:51:00 } +2024-07-25 19:17:01,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 323/ 1625], loss: 1.159, per_step_time: 
1473ms, lr: 2.9965326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:01,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.43024 samples/s/p 5:51:10 } +2024-07-25 19:17:04,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 325/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 2.9964896e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:04,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.44032 samples/s/p 5:50:28 } +2024-07-25 19:17:07,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 327/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.996446e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:07,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.42776 samples/s/p 5:51:13 } +2024-07-25 19:17:10,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 329/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.9964021e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:10,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.43757 samples/s/p 5:50:32 } +2024-07-25 19:17:13,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 331/ 1625], loss: 0.962, per_step_time: 1472ms, lr: 2.9963583e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:13,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.43406 samples/s/p 5:50:43 } +2024-07-25 19:17:15,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 333/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 2.996314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:15,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.43367 samples/s/p 5:50:42 } 
+2024-07-25 19:17:18,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 335/ 1625], loss: 1.274, per_step_time: 1471ms, lr: 2.9962694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:18,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43509 samples/s/p 5:50:33 } +2024-07-25 19:17:21,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 337/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 2.9962248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:21,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43104 samples/s/p 5:50:46 } +2024-07-25 19:17:24,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 339/ 1625], loss: 1.010, per_step_time: 1470ms, lr: 2.9961797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:24,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43930 samples/s/p 5:50:11 } +2024-07-25 19:17:27,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 341/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 2.9961344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:27,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43989 samples/s/p 5:50:06 } +2024-07-25 19:17:30,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 343/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.9960887e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:30,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43344 samples/s/p 5:50:28 } +2024-07-25 19:17:33,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 345/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 2.9960429e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:17:33,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43741 samples/s/p 5:50:10 } +2024-07-25 19:17:36,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 347/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.9959969e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:36,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43337 samples/s/p 5:50:22 } +2024-07-25 19:17:39,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 349/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 2.9959503e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:39,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43261 samples/s/p 5:50:22 } +2024-07-25 19:17:42,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 351/ 1625], loss: 1.294, per_step_time: 1470ms, lr: 2.9959036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:42,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43896 samples/s/p 5:49:55 } +2024-07-25 19:17:45,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 353/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.995857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:45,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43250 samples/s/p 5:50:17 } +2024-07-25 19:17:48,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 355/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 2.9958097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:48,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43532 samples/s/p 5:50:03 } +2024-07-25 19:17:51,363 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 357/ 1625], loss: 1.099, per_step_time: 1470ms, lr: 2.9957622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:51,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.44102 samples/s/p 5:49:38 } +2024-07-25 19:17:54,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 359/ 1625], loss: 1.313, per_step_time: 1472ms, lr: 2.9957146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:54,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43141 samples/s/p 5:50:12 } +2024-07-25 19:17:57,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 361/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.9956665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:57,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43682 samples/s/p 5:49:48 } +2024-07-25 19:18:00,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 363/ 1625], loss: 1.339, per_step_time: 1471ms, lr: 2.9956182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:00,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43534 samples/s/p 5:49:51 } +2024-07-25 19:18:03,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 365/ 1625], loss: 1.378, per_step_time: 1472ms, lr: 2.9955698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:03,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43215 samples/s/p 5:50:00 } +2024-07-25 19:18:06,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 367/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.995521e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:18:06,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43660 samples/s/p 5:49:40 } +2024-07-25 19:18:09,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 369/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.995472e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:09,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43361 samples/s/p 5:49:49 } +2024-07-25 19:18:12,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 371/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 2.9954224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:12,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43300 samples/s/p 5:49:48 } +2024-07-25 19:18:14,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 373/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 2.9953728e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:14,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43308 samples/s/p 5:49:45 } +2024-07-25 19:18:17,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 375/ 1625], loss: 1.020, per_step_time: 1472ms, lr: 2.995323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:17,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43113 samples/s/p 5:49:50 } +2024-07-25 19:18:20,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 377/ 1625], loss: 1.340, per_step_time: 1472ms, lr: 2.9952727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:20,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43275 samples/s/p 5:49:40 } +2024-07-25 19:18:23,833 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 379/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 2.9952223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:23,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43182 samples/s/p 5:49:41 } +2024-07-25 19:18:26,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 381/ 1625], loss: 1.076, per_step_time: 1469ms, lr: 2.9951718e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:26,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.44404 samples/s/p 5:48:51 } +2024-07-25 19:18:29,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 383/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 2.995121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:29,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.43654 samples/s/p 5:49:17 } +2024-07-25 19:18:32,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 385/ 1625], loss: 1.209, per_step_time: 1473ms, lr: 2.9950697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:32,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.42874 samples/s/p 5:49:44 } +2024-07-25 19:18:35,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 387/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 2.9950183e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:35,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.43867 samples/s/p 5:49:03 } +2024-07-25 19:18:38,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 389/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 2.9949666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:38,586 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.43111 samples/s/p 5:49:29 } +2024-07-25 19:18:41,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 391/ 1625], loss: 0.983, per_step_time: 1472ms, lr: 2.9949146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:41,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.43210 samples/s/p 5:49:22 } +2024-07-25 19:18:44,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 393/ 1625], loss: 1.274, per_step_time: 1473ms, lr: 2.9948624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:44,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.42833 samples/s/p 5:49:34 } +2024-07-25 19:18:47,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 395/ 1625], loss: 1.141, per_step_time: 1469ms, lr: 2.9948098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:47,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.44253 samples/s/p 5:48:36 } +2024-07-25 19:18:50,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 397/ 1625], loss: 1.052, per_step_time: 1473ms, lr: 2.9947569e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:50,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.42750 samples/s/p 5:49:31 } +2024-07-25 19:18:53,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 399/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.9947041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:53,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43584 samples/s/p 5:48:56 } +2024-07-25 19:18:56,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 2/ 10], step:[ 401/ 1625], loss: 1.027, per_step_time: 1471ms, lr: 2.9946505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:56,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43538 samples/s/p 5:48:55 } +2024-07-25 19:18:59,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 403/ 1625], loss: 1.221, per_step_time: 1470ms, lr: 2.994597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:59,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.44018 samples/s/p 5:48:33 } +2024-07-25 19:19:02,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 405/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.994543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:02,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.42799 samples/s/p 5:49:18 } +2024-07-25 19:19:05,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 407/ 1625], loss: 1.243, per_step_time: 1470ms, lr: 2.994489e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:05,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43911 samples/s/p 5:48:32 } +2024-07-25 19:19:08,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 409/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 2.9944347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:08,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43335 samples/s/p 5:48:51 } +2024-07-25 19:19:11,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 411/ 1625], loss: 1.018, per_step_time: 1470ms, lr: 2.9943802e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:11,048 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 12.5% |██████ | 5.43973 samples/s/p 5:48:23 } +2024-07-25 19:19:13,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 413/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 2.9943252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:14,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43305 samples/s/p 5:48:46 } +2024-07-25 19:19:16,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 415/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 2.9942697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:16,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.43722 samples/s/p 5:48:27 } +2024-07-25 19:19:19,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 417/ 1625], loss: 0.937, per_step_time: 1472ms, lr: 2.994214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:19,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.43459 samples/s/p 5:48:34 } +2024-07-25 19:19:22,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 419/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 2.9941586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:22,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.42920 samples/s/p 5:48:52 } +2024-07-25 19:19:25,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 421/ 1625], loss: 1.013, per_step_time: 1470ms, lr: 2.9941026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:25,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.43931 samples/s/p 5:48:10 } +2024-07-25 19:19:28,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 423/ 1625], loss: 1.266, per_step_time: 
1469ms, lr: 2.9940466e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:28,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.44459 samples/s/p 5:47:47 } +2024-07-25 19:19:31,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 425/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.9939898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:31,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.43627 samples/s/p 5:48:16 } +2024-07-25 19:19:34,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 427/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 2.9939329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:34,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.43031 samples/s/p 5:48:36 } +2024-07-25 19:19:37,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 429/ 1625], loss: 1.238, per_step_time: 1473ms, lr: 2.9938761e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:37,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.42952 samples/s/p 5:48:36 } +2024-07-25 19:19:40,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 431/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 2.9938186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:40,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43492 samples/s/p 5:48:13 } +2024-07-25 19:19:43,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 433/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.9937613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:43,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43775 samples/s/p 5:47:59 } 
+2024-07-25 19:19:46,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 435/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 2.9937031e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:46,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43364 samples/s/p 5:48:12 } +2024-07-25 19:19:49,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 437/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.9936451e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:49,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43623 samples/s/p 5:47:59 } +2024-07-25 19:19:52,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 439/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 2.9935867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:52,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43553 samples/s/p 5:47:58 } +2024-07-25 19:19:55,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 441/ 1625], loss: 1.141, per_step_time: 1469ms, lr: 2.993528e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:55,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.44242 samples/s/p 5:47:29 } +2024-07-25 19:19:58,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 443/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 2.9934692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:58,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43405 samples/s/p 5:47:58 } +2024-07-25 19:20:01,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 445/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 2.9934099e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:20:01,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43505 samples/s/p 5:47:51 } +2024-07-25 19:20:04,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 447/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 2.9933506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:04,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43221 samples/s/p 5:47:59 } +2024-07-25 19:20:07,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 449/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 2.9932908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:07,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43306 samples/s/p 5:47:53 } +2024-07-25 19:20:10,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 451/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 2.9932306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:10,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43382 samples/s/p 5:47:47 } +2024-07-25 19:20:13,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 453/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.9931705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:13,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43122 samples/s/p 5:47:54 } +2024-07-25 19:20:15,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 455/ 1625], loss: 1.181, per_step_time: 1473ms, lr: 2.99311e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:15,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43097 samples/s/p 5:47:52 } +2024-07-25 19:20:18,924 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 457/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 2.9930492e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:18,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43618 samples/s/p 5:47:29 } +2024-07-25 19:20:21,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 459/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 2.992988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:21,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43158 samples/s/p 5:47:44 } +2024-07-25 19:20:24,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 461/ 1625], loss: 1.073, per_step_time: 1474ms, lr: 2.9929268e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:24,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.42486 samples/s/p 5:48:07 } +2024-07-25 19:20:27,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 463/ 1625], loss: 1.391, per_step_time: 1470ms, lr: 2.9928653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:27,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.44084 samples/s/p 5:47:03 } +2024-07-25 19:20:30,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 465/ 1625], loss: 1.084, per_step_time: 1473ms, lr: 2.9928033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:30,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.42965 samples/s/p 5:47:43 } +2024-07-25 19:20:33,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 467/ 1625], loss: 1.345, per_step_time: 1472ms, lr: 2.9927412e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:20:33,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43282 samples/s/p 5:47:28 } +2024-07-25 19:20:36,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 469/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.9926789e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:36,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43523 samples/s/p 5:47:15 } +2024-07-25 19:20:39,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 471/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 2.9926163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:39,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43555 samples/s/p 5:47:11 } +2024-07-25 19:20:42,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 473/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 2.9925533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:42,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43751 samples/s/p 5:47:01 } +2024-07-25 19:20:45,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 475/ 1625], loss: 1.206, per_step_time: 1469ms, lr: 2.99249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:45,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.44539 samples/s/p 5:46:28 } +2024-07-25 19:20:48,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 477/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.9924267e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:48,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43709 samples/s/p 5:46:57 } +2024-07-25 19:20:51,383 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 479/ 1625], loss: 1.109, per_step_time: 1471ms, lr: 2.9923629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:51,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43660 samples/s/p 5:46:55 } +2024-07-25 19:20:54,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 481/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 2.9922989e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:54,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43234 samples/s/p 5:47:09 } +2024-07-25 19:20:57,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 483/ 1625], loss: 1.255, per_step_time: 1472ms, lr: 2.9922347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:57,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43308 samples/s/p 5:47:03 } +2024-07-25 19:21:00,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 485/ 1625], loss: 1.120, per_step_time: 1470ms, lr: 2.9921703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:00,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43967 samples/s/p 5:46:35 } +2024-07-25 19:21:03,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 487/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 2.9921053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:03,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43173 samples/s/p 5:47:02 } +2024-07-25 19:21:06,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 489/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 2.9920404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:06,141 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43092 samples/s/p 5:47:03 } +2024-07-25 19:21:09,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 491/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 2.991975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:09,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43549 samples/s/p 5:46:42 } +2024-07-25 19:21:12,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 493/ 1625], loss: 1.121, per_step_time: 1469ms, lr: 2.9919096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:12,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.44295 samples/s/p 5:46:11 } +2024-07-25 19:21:14,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 495/ 1625], loss: 1.365, per_step_time: 1473ms, lr: 2.9918436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:14,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43071 samples/s/p 5:46:54 } +2024-07-25 19:21:17,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 497/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 2.9917775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:17,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43842 samples/s/p 5:46:22 } +2024-07-25 19:21:20,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 499/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 2.9917113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:20,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43633 samples/s/p 5:46:27 } +2024-07-25 19:21:23,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
2/ 10], step:[ 501/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 2.9916446e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:23,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43686 samples/s/p 5:46:22 } +2024-07-25 19:21:26,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 503/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 2.9915775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:26,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43366 samples/s/p 5:46:31 } +2024-07-25 19:21:29,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 505/ 1625], loss: 1.269, per_step_time: 1471ms, lr: 2.9915103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:29,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43609 samples/s/p 5:46:19 } +2024-07-25 19:21:32,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 507/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 2.991443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:32,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.42916 samples/s/p 5:46:43 } +2024-07-25 19:21:35,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 509/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.9913752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:35,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43816 samples/s/p 5:46:05 } +2024-07-25 19:21:38,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 511/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.9913072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:38,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
13.1% |██████ | 5.43572 samples/s/p 5:46:12 } +2024-07-25 19:21:41,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 513/ 1625], loss: 1.351, per_step_time: 1472ms, lr: 2.991239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:41,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43398 samples/s/p 5:46:15 } +2024-07-25 19:21:44,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 515/ 1625], loss: 1.298, per_step_time: 1471ms, lr: 2.9911704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:44,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43827 samples/s/p 5:45:56 } +2024-07-25 19:21:47,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 517/ 1625], loss: 1.050, per_step_time: 1473ms, lr: 2.9911018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:47,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.42950 samples/s/p 5:46:27 } +2024-07-25 19:21:50,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 519/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.9910327e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:50,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43527 samples/s/p 5:46:02 } +2024-07-25 19:21:53,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 521/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 2.9909634e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:53,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43397 samples/s/p 5:46:04 } +2024-07-25 19:21:56,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 523/ 1625], loss: 1.229, per_step_time: 1472ms, 
lr: 2.9908939e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:56,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43191 samples/s/p 5:46:09 } +2024-07-25 19:21:59,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 525/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.9908242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:59,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43556 samples/s/p 5:45:52 } +2024-07-25 19:22:02,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 527/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 2.9907538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:02,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.44082 samples/s/p 5:45:29 } +2024-07-25 19:22:05,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 529/ 1625], loss: 1.207, per_step_time: 1473ms, lr: 2.9906834e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:05,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43076 samples/s/p 5:46:04 } +2024-07-25 19:22:08,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 531/ 1625], loss: 1.259, per_step_time: 1472ms, lr: 2.9906128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:08,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43456 samples/s/p 5:45:47 } +2024-07-25 19:22:11,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 533/ 1625], loss: 1.311, per_step_time: 1473ms, lr: 2.990542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:11,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.42900 samples/s/p 5:46:05 } +2024-07-25 
19:22:14,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 535/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 2.9904708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:14,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43289 samples/s/p 5:45:47 } +2024-07-25 19:22:16,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 537/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 2.9903993e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:16,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43620 samples/s/p 5:45:32 } +2024-07-25 19:22:19,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 539/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 2.9903278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:19,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43334 samples/s/p 5:45:40 } +2024-07-25 19:22:22,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 541/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 2.9902556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:22,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43266 samples/s/p 5:45:39 } +2024-07-25 19:22:25,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 543/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 2.9901834e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:25,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43499 samples/s/p 5:45:27 } +2024-07-25 19:22:28,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 545/ 1625], loss: 1.101, per_step_time: 1470ms, lr: 2.990111e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:22:28,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.44079 samples/s/p 5:45:02 } +2024-07-25 19:22:31,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 547/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 2.990038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:31,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43183 samples/s/p 5:45:34 } +2024-07-25 19:22:34,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 549/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 2.9899651e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:34,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43402 samples/s/p 5:45:22 } +2024-07-25 19:22:37,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 551/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 2.9898918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:37,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43097 samples/s/p 5:45:31 } +2024-07-25 19:22:40,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 553/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 2.9898185e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:40,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43820 samples/s/p 5:45:00 } +2024-07-25 19:22:43,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 555/ 1625], loss: 1.062, per_step_time: 1470ms, lr: 2.9897445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:43,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.44060 samples/s/p 5:44:48 } +2024-07-25 19:22:46,478 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 557/ 1625], loss: 1.245, per_step_time: 1473ms, lr: 2.9896704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:46,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43032 samples/s/p 5:45:25 } +2024-07-25 19:22:49,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 559/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 2.9895962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:49,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.42918 samples/s/p 5:45:26 } +2024-07-25 19:22:52,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 561/ 1625], loss: 1.331, per_step_time: 1471ms, lr: 2.9895215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:52,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43594 samples/s/p 5:44:57 } +2024-07-25 19:22:55,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 563/ 1625], loss: 1.104, per_step_time: 1470ms, lr: 2.9894465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:55,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.44038 samples/s/p 5:44:37 } +2024-07-25 19:22:58,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 565/ 1625], loss: 1.060, per_step_time: 1473ms, lr: 2.9893716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:58,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43048 samples/s/p 5:45:12 } +2024-07-25 19:23:01,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 567/ 1625], loss: 1.273, per_step_time: 1471ms, lr: 2.9892959e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:23:01,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43540 samples/s/p 5:44:51 } +2024-07-25 19:23:04,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 569/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 2.9892202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:04,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43703 samples/s/p 5:44:41 } +2024-07-25 19:23:07,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 571/ 1625], loss: 0.978, per_step_time: 1471ms, lr: 2.9891444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:07,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43574 samples/s/p 5:44:43 } +2024-07-25 19:23:10,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 573/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.9890682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:10,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43773 samples/s/p 5:44:33 } +2024-07-25 19:23:13,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 575/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 2.9889916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:13,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43427 samples/s/p 5:44:43 } +2024-07-25 19:23:15,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 577/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 2.9889148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:15,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43200 samples/s/p 5:44:49 } +2024-07-25 19:23:18,938 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 579/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 2.9888379e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:18,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43873 samples/s/p 5:44:20 } +2024-07-25 19:23:21,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 581/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.9887606e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:21,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43459 samples/s/p 5:44:33 } +2024-07-25 19:23:24,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 583/ 1625], loss: 1.335, per_step_time: 1471ms, lr: 2.988683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:24,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43586 samples/s/p 5:44:25 } +2024-07-25 19:23:27,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 585/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 2.9886052e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:27,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43634 samples/s/p 5:44:20 } +2024-07-25 19:23:30,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 587/ 1625], loss: 1.113, per_step_time: 1473ms, lr: 2.9885274e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:30,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43038 samples/s/p 5:44:40 } +2024-07-25 19:23:33,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 589/ 1625], loss: 1.420, per_step_time: 1472ms, lr: 2.9884488e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:33,697 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43386 samples/s/p 5:44:24 } +2024-07-25 19:23:36,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 591/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 2.9883704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:36,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43229 samples/s/p 5:44:27 } +2024-07-25 19:23:39,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 593/ 1625], loss: 1.284, per_step_time: 1473ms, lr: 2.988291e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:39,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.42781 samples/s/p 5:44:41 } +2024-07-25 19:23:42,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 595/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 2.988212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:42,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43723 samples/s/p 5:44:02 } +2024-07-25 19:23:45,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 597/ 1625], loss: 1.282, per_step_time: 1473ms, lr: 2.9881328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:45,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43095 samples/s/p 5:44:23 } +2024-07-25 19:23:48,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 599/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 2.9880532e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:48,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.44023 samples/s/p 5:43:45 } +2024-07-25 19:23:51,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
2/ 10], step:[ 601/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 2.9879731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:51,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43605 samples/s/p 5:43:58 } +2024-07-25 19:23:54,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 603/ 1625], loss: 1.055, per_step_time: 1471ms, lr: 2.9878931e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:54,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43562 samples/s/p 5:43:57 } +2024-07-25 19:23:57,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 605/ 1625], loss: 1.333, per_step_time: 1472ms, lr: 2.9878125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:57,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43373 samples/s/p 5:44:01 } +2024-07-25 19:24:00,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 607/ 1625], loss: 1.182, per_step_time: 1473ms, lr: 2.9877318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:00,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43015 samples/s/p 5:44:12 } +2024-07-25 19:24:03,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 609/ 1625], loss: 1.312, per_step_time: 1472ms, lr: 2.987651e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:03,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43162 samples/s/p 5:44:03 } +2024-07-25 19:24:06,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 611/ 1625], loss: 1.324, per_step_time: 1472ms, lr: 2.9875695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:06,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
13.8% |██████ | 5.43126 samples/s/p 5:44:01 } +2024-07-25 19:24:09,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 613/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 2.9874882e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:09,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43588 samples/s/p 5:43:41 } +2024-07-25 19:24:12,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 615/ 1625], loss: 1.271, per_step_time: 1473ms, lr: 2.9874062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:12,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.42742 samples/s/p 5:44:10 } +2024-07-25 19:24:15,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 617/ 1625], loss: 1.331, per_step_time: 1471ms, lr: 2.9873243e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:15,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43492 samples/s/p 5:43:39 } +2024-07-25 19:24:17,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 619/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 2.9872419e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:17,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43690 samples/s/p 5:43:28 } +2024-07-25 19:24:20,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 621/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 2.9871593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:20,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43530 samples/s/p 5:43:31 } +2024-07-25 19:24:23,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 623/ 1625], loss: 1.162, per_step_time: 1472ms, 
lr: 2.9870764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:23,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43342 samples/s/p 5:43:36 } +2024-07-25 19:24:26,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 625/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 2.9869934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:26,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43216 samples/s/p 5:43:37 } +2024-07-25 19:24:29,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 627/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.9869097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:29,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43317 samples/s/p 5:43:31 } +2024-07-25 19:24:32,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 629/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.986826e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:32,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43469 samples/s/p 5:43:22 } +2024-07-25 19:24:35,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 631/ 1625], loss: 1.349, per_step_time: 1473ms, lr: 2.9867424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:35,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.42952 samples/s/p 5:43:39 } +2024-07-25 19:24:38,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 633/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.986658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:38,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43518 samples/s/p 5:43:14 } +2024-07-25 
19:24:41,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 635/ 1625], loss: 1.105, per_step_time: 1470ms, lr: 2.9865738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:41,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43935 samples/s/p 5:42:55 } +2024-07-25 19:24:44,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 637/ 1625], loss: 1.286, per_step_time: 1471ms, lr: 2.986489e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:44,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43715 samples/s/p 5:43:01 } +2024-07-25 19:24:47,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 639/ 1625], loss: 1.244, per_step_time: 1470ms, lr: 2.9864039e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:47,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.44097 samples/s/p 5:42:43 } +2024-07-25 19:24:50,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 641/ 1625], loss: 1.287, per_step_time: 1474ms, lr: 2.9863188e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:50,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.42405 samples/s/p 5:43:45 } +2024-07-25 19:24:53,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 643/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.9862333e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:53,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.43256 samples/s/p 5:43:09 } +2024-07-25 19:24:56,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 645/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.9861474e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:24:56,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.43542 samples/s/p 5:42:56 } +2024-07-25 19:24:59,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 647/ 1625], loss: 1.180, per_step_time: 1470ms, lr: 2.9860614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:59,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.44163 samples/s/p 5:42:29 } +2024-07-25 19:25:02,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 649/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 2.9859752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:02,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.43709 samples/s/p 5:42:43 } +2024-07-25 19:25:05,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 651/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.9858886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:05,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.43486 samples/s/p 5:42:49 } +2024-07-25 19:25:08,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 653/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 2.9858018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:08,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.43409 samples/s/p 5:42:49 } +2024-07-25 19:25:11,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 655/ 1625], loss: 1.277, per_step_time: 1471ms, lr: 2.9857147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:11,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.43844 samples/s/p 5:42:30 } +2024-07-25 19:25:14,051 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 657/ 1625], loss: 1.191, per_step_time: 1476ms, lr: 2.9856272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:14,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.41957 samples/s/p 5:43:38 } +2024-07-25 19:25:17,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 659/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.9855397e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:17,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43612 samples/s/p 5:42:32 } +2024-07-25 19:25:19,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 661/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 2.9854516e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:19,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43334 samples/s/p 5:42:40 } +2024-07-25 19:25:22,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 663/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 2.9853638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:22,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.42792 samples/s/p 5:42:58 } +2024-07-25 19:25:25,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 665/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.9852752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:25,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43134 samples/s/p 5:42:42 } +2024-07-25 19:25:28,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 667/ 1625], loss: 1.036, per_step_time: 1471ms, lr: 2.9851866e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:25:28,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43636 samples/s/p 5:42:20 } +2024-07-25 19:25:31,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 669/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 2.9850975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:31,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43162 samples/s/p 5:42:35 } +2024-07-25 19:25:34,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 671/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 2.9850084e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:34,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43752 samples/s/p 5:42:09 } +2024-07-25 19:25:37,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 673/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.984919e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:37,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43318 samples/s/p 5:42:23 } +2024-07-25 19:25:40,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 675/ 1625], loss: 1.031, per_step_time: 1472ms, lr: 2.9848292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:40,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43435 samples/s/p 5:42:16 } +2024-07-25 19:25:43,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 677/ 1625], loss: 1.058, per_step_time: 1473ms, lr: 2.984739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:43,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43070 samples/s/p 5:42:26 } +2024-07-25 19:25:46,522 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 679/ 1625], loss: 1.279, per_step_time: 1471ms, lr: 2.9846487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:46,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43505 samples/s/p 5:42:07 } +2024-07-25 19:25:49,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 681/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 2.9845582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:49,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.42837 samples/s/p 5:42:29 } +2024-07-25 19:25:52,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 683/ 1625], loss: 1.056, per_step_time: 1472ms, lr: 2.9844676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:52,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43121 samples/s/p 5:42:16 } +2024-07-25 19:25:55,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 685/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 2.9843766e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:55,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43797 samples/s/p 5:41:47 } +2024-07-25 19:25:58,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 687/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 2.9842851e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:58,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43788 samples/s/p 5:41:45 } +2024-07-25 19:26:01,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 689/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 2.9841935e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:26:01,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43228 samples/s/p 5:42:03 } +2024-07-25 19:26:04,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 691/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 2.9841016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:04,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43076 samples/s/p 5:42:06 } +2024-07-25 19:26:07,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 693/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 2.9840096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:07,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43469 samples/s/p 5:41:48 } +2024-07-25 19:26:10,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 695/ 1625], loss: 1.242, per_step_time: 1473ms, lr: 2.9839173e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:10,140 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.42840 samples/s/p 5:42:09 } +2024-07-25 19:26:13,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 697/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 2.9838244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:13,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43300 samples/s/p 5:41:48 } +2024-07-25 19:26:16,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 699/ 1625], loss: 1.255, per_step_time: 1473ms, lr: 2.9837316e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:16,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.42954 samples/s/p 5:41:58 } +2024-07-25 19:26:18,996 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 701/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 2.9836385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:18,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43678 samples/s/p 5:41:28 } +2024-07-25 19:26:21,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 703/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 2.9835448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:21,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.44111 samples/s/p 5:41:09 } +2024-07-25 19:26:24,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 705/ 1625], loss: 1.054, per_step_time: 1472ms, lr: 2.9834513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:24,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43344 samples/s/p 5:41:35 } +2024-07-25 19:26:27,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 707/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 2.9833573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:27,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43294 samples/s/p 5:41:34 } +2024-07-25 19:26:30,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 709/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 2.9832629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:30,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43035 samples/s/p 5:41:41 } +2024-07-25 19:26:33,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 711/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 2.9831685e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:26:33,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43122 samples/s/p 5:41:34 } +2024-07-25 19:26:36,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 713/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.9830737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:36,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43330 samples/s/p 5:41:24 } +2024-07-25 19:26:39,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 715/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 2.9829787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:39,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43525 samples/s/p 5:41:13 } +2024-07-25 19:26:42,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 717/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.9828832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:42,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43498 samples/s/p 5:41:11 } +2024-07-25 19:26:45,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 719/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 2.982788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:45,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43346 samples/s/p 5:41:14 } +2024-07-25 19:26:48,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 721/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.982692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:48,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43183 samples/s/p 5:41:17 } +2024-07-25 19:26:51,464 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 723/ 1625], loss: 1.023, per_step_time: 1472ms, lr: 2.982596e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:51,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43207 samples/s/p 5:41:13 } +2024-07-25 19:26:54,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 725/ 1625], loss: 1.047, per_step_time: 1473ms, lr: 2.9824996e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:54,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43087 samples/s/p 5:41:15 } +2024-07-25 19:26:57,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 727/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 2.9824028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:57,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43270 samples/s/p 5:41:05 } +2024-07-25 19:27:00,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 729/ 1625], loss: 1.359, per_step_time: 1474ms, lr: 2.9823059e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:00,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.42660 samples/s/p 5:41:25 } +2024-07-25 19:27:03,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 731/ 1625], loss: 1.351, per_step_time: 1471ms, lr: 2.9822088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:03,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43556 samples/s/p 5:40:49 } +2024-07-25 19:27:06,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 733/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.9821114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:27:06,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43279 samples/s/p 5:40:56 } +2024-07-25 19:27:09,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 735/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 2.9820138e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:09,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43850 samples/s/p 5:40:32 } +2024-07-25 19:27:12,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 737/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.9819159e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:12,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43527 samples/s/p 5:40:41 } +2024-07-25 19:27:15,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 739/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 2.9818177e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:15,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43029 samples/s/p 5:40:57 } +2024-07-25 19:27:18,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 741/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.9817189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:18,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.43133 samples/s/p 5:40:50 } +2024-07-25 19:27:20,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 743/ 1625], loss: 1.389, per_step_time: 1472ms, lr: 2.9816205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:20,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.43199 samples/s/p 5:40:44 } +2024-07-25 19:27:23,936 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 745/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 2.9815214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:23,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.44128 samples/s/p 5:40:06 } +2024-07-25 19:27:26,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 747/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.9814222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:26,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.43354 samples/s/p 5:40:33 } +2024-07-25 19:27:29,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 749/ 1625], loss: 1.235, per_step_time: 1473ms, lr: 2.9813224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:29,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.42751 samples/s/p 5:40:52 } +2024-07-25 19:27:32,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 751/ 1625], loss: 1.108, per_step_time: 1474ms, lr: 2.9812229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:32,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.42498 samples/s/p 5:40:59 } +2024-07-25 19:27:35,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 753/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.9811226e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:35,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.43167 samples/s/p 5:40:31 } +2024-07-25 19:27:38,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 755/ 1625], loss: 1.218, per_step_time: 1481ms, lr: 2.9810224e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:27:38,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.39867 samples/s/p 5:42:33 } +2024-07-25 19:27:41,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 757/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 2.9809218e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:41,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43061 samples/s/p 5:40:29 } +2024-07-25 19:27:44,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 759/ 1625], loss: 1.345, per_step_time: 1473ms, lr: 2.9808209e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:44,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43008 samples/s/p 5:40:28 } +2024-07-25 19:27:47,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 761/ 1625], loss: 1.106, per_step_time: 1473ms, lr: 2.98072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:47,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43043 samples/s/p 5:40:24 } +2024-07-25 19:27:50,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 763/ 1625], loss: 1.238, per_step_time: 1473ms, lr: 2.9806186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:50,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.42947 samples/s/p 5:40:24 } +2024-07-25 19:27:53,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 765/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 2.9805167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:53,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43512 samples/s/p 5:40:00 } +2024-07-25 19:27:56,439 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 767/ 1625], loss: 1.042, per_step_time: 1472ms, lr: 2.9804149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:56,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43387 samples/s/p 5:40:02 } +2024-07-25 19:27:59,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 769/ 1625], loss: 1.125, per_step_time: 1473ms, lr: 2.9803128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:59,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.42798 samples/s/p 5:40:21 } +2024-07-25 19:28:02,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 771/ 1625], loss: 1.234, per_step_time: 1473ms, lr: 2.9802102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:02,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43031 samples/s/p 5:40:09 } +2024-07-25 19:28:05,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 773/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 2.9801076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:05,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.43443 samples/s/p 5:39:51 } +2024-07-25 19:28:08,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 775/ 1625], loss: 1.220, per_step_time: 1469ms, lr: 2.9800045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:08,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.44266 samples/s/p 5:39:17 } +2024-07-25 19:28:11,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 777/ 1625], loss: 1.292, per_step_time: 1474ms, lr: 2.9799015e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:28:11,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.42644 samples/s/p 5:40:15 } +2024-07-25 19:28:14,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 779/ 1625], loss: 1.054, per_step_time: 1470ms, lr: 2.9797979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:14,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.43992 samples/s/p 5:39:22 } +2024-07-25 19:28:17,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 781/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 2.9796942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:17,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.43544 samples/s/p 5:39:35 } +2024-07-25 19:28:20,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 783/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 2.9795901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:20,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.43036 samples/s/p 5:39:52 } +2024-07-25 19:28:23,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 785/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.9794859e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:23,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.43427 samples/s/p 5:39:34 } +2024-07-25 19:28:25,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 787/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.9793813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:25,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.42859 samples/s/p 5:39:52 } +2024-07-25 19:28:28,910 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 789/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 2.9792765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:28,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43674 samples/s/p 5:39:19 } +2024-07-25 19:28:31,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 791/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 2.9791714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:31,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43298 samples/s/p 5:39:30 } +2024-07-25 19:28:34,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 793/ 1625], loss: 0.885, per_step_time: 1470ms, lr: 2.979066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:34,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.44195 samples/s/p 5:38:53 } +2024-07-25 19:28:37,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 795/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 2.9789604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:37,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43646 samples/s/p 5:39:11 } +2024-07-25 19:28:40,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 797/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 2.9788547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:40,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43664 samples/s/p 5:39:07 } +2024-07-25 19:28:43,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 799/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 2.9787485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:28:43,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43482 samples/s/p 5:39:11 } +2024-07-25 19:28:46,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 801/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 2.978642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:46,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43410 samples/s/p 5:39:11 } +2024-07-25 19:28:49,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 803/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 2.9785355e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:49,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43861 samples/s/p 5:38:51 } +2024-07-25 19:28:52,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 805/ 1625], loss: 1.279, per_step_time: 1471ms, lr: 2.9784285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:52,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43787 samples/s/p 5:38:51 } +2024-07-25 19:28:55,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 807/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 2.9783214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:55,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43662 samples/s/p 5:38:53 } +2024-07-25 19:28:58,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 809/ 1625], loss: 1.312, per_step_time: 1472ms, lr: 2.9782139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:58,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43278 samples/s/p 5:39:04 } +2024-07-25 19:29:01,364 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 811/ 1625], loss: 1.009, per_step_time: 1470ms, lr: 2.9781062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:01,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43879 samples/s/p 5:38:39 } +2024-07-25 19:29:04,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 813/ 1625], loss: 1.174, per_step_time: 1473ms, lr: 2.9779982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:04,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.42911 samples/s/p 5:39:12 } +2024-07-25 19:29:07,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 815/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 2.97789e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:07,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43436 samples/s/p 5:38:49 } +2024-07-25 19:29:10,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 817/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 2.9777813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:10,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43148 samples/s/p 5:38:57 } +2024-07-25 19:29:13,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 819/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 2.9776727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:13,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43420 samples/s/p 5:38:44 } +2024-07-25 19:29:16,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 821/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 2.9775636e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:29:16,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43483 samples/s/p 5:38:39 } +2024-07-25 19:29:19,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 823/ 1625], loss: 1.268, per_step_time: 1470ms, lr: 2.9774543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:19,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43904 samples/s/p 5:38:20 } +2024-07-25 19:29:22,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 825/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 2.9773448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:22,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.44069 samples/s/p 5:38:11 } +2024-07-25 19:29:24,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 827/ 1625], loss: 1.146, per_step_time: 1477ms, lr: 2.977235e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:24,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.41472 samples/s/p 5:39:45 } +2024-07-25 19:29:27,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 829/ 1625], loss: 1.279, per_step_time: 1470ms, lr: 2.9771249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:27,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43943 samples/s/p 5:38:10 } +2024-07-25 19:29:30,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 831/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 2.9770146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:30,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43611 samples/s/p 5:38:19 } +2024-07-25 19:29:33,836 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 833/ 1625], loss: 1.014, per_step_time: 1473ms, lr: 2.9769039e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:33,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.42993 samples/s/p 5:38:39 } +2024-07-25 19:29:36,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 835/ 1625], loss: 1.198, per_step_time: 1470ms, lr: 2.9767929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:36,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43912 samples/s/p 5:38:02 } +2024-07-25 19:29:39,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 837/ 1625], loss: 1.070, per_step_time: 1473ms, lr: 2.976682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:39,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.42865 samples/s/p 5:38:38 } +2024-07-25 19:29:42,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 839/ 1625], loss: 1.367, per_step_time: 1471ms, lr: 2.9765704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:42,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43598 samples/s/p 5:38:08 } +2024-07-25 19:29:45,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 841/ 1625], loss: 0.965, per_step_time: 1472ms, lr: 2.9764587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:45,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43253 samples/s/p 5:38:18 } +2024-07-25 19:29:48,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 843/ 1625], loss: 1.341, per_step_time: 1470ms, lr: 2.976347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:29:48,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43977 samples/s/p 5:37:48 } +2024-07-25 19:29:51,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 845/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 2.9762348e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:51,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43045 samples/s/p 5:38:20 } +2024-07-25 19:29:54,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 847/ 1625], loss: 1.444, per_step_time: 1471ms, lr: 2.9761222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:54,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43505 samples/s/p 5:38:00 } +2024-07-25 19:29:57,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 849/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 2.9760096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:57,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43321 samples/s/p 5:38:04 } +2024-07-25 19:30:00,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 851/ 1625], loss: 1.169, per_step_time: 1472ms, lr: 2.9758965e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:00,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43195 samples/s/p 5:38:05 } +2024-07-25 19:30:03,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 853/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 2.9757832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:03,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.42953 samples/s/p 5:38:11 } +2024-07-25 19:30:06,303 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 855/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 2.9756698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:06,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43620 samples/s/p 5:37:44 } +2024-07-25 19:30:09,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 857/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.975556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:09,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43410 samples/s/p 5:37:49 } +2024-07-25 19:30:12,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 859/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.975442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:12,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43604 samples/s/p 5:37:38 } +2024-07-25 19:30:15,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 861/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 2.9753279e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:15,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43558 samples/s/p 5:37:37 } +2024-07-25 19:30:18,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 863/ 1625], loss: 1.096, per_step_time: 1473ms, lr: 2.9752133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:18,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.42851 samples/s/p 5:38:01 } +2024-07-25 19:30:21,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 865/ 1625], loss: 1.202, per_step_time: 1474ms, lr: 2.9750983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:30:21,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.42497 samples/s/p 5:38:11 } +2024-07-25 19:30:24,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 867/ 1625], loss: 1.202, per_step_time: 1470ms, lr: 2.9749832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:24,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43904 samples/s/p 5:37:15 } +2024-07-25 19:30:26,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 869/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 2.9748679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:26,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43525 samples/s/p 5:37:27 } +2024-07-25 19:30:29,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 871/ 1625], loss: 1.134, per_step_time: 1470ms, lr: 2.9747522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:29,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.44180 samples/s/p 5:36:59 } +2024-07-25 19:30:32,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 873/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 2.9746365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:32,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43610 samples/s/p 5:37:18 } +2024-07-25 19:30:35,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 875/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 2.9745202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:35,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43842 samples/s/p 5:37:06 } +2024-07-25 19:30:38,766 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 877/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 2.9744038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:38,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43453 samples/s/p 5:37:18 } +2024-07-25 19:30:41,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 879/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.9742872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:41,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43421 samples/s/p 5:37:16 } +2024-07-25 19:30:44,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 881/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 2.9741705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:44,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43788 samples/s/p 5:36:59 } +2024-07-25 19:30:47,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 883/ 1625], loss: 1.387, per_step_time: 1471ms, lr: 2.9740533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:47,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43604 samples/s/p 5:37:03 } +2024-07-25 19:30:50,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 885/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 2.9739356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:50,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.44144 samples/s/p 5:36:40 } +2024-07-25 19:30:53,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 887/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 2.9738178e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:30:53,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.43498 samples/s/p 5:37:01 } +2024-07-25 19:30:56,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 889/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 2.9736999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:56,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.43787 samples/s/p 5:36:47 } +2024-07-25 19:30:59,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 891/ 1625], loss: 1.335, per_step_time: 1473ms, lr: 2.9735816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:59,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.42951 samples/s/p 5:37:16 } +2024-07-25 19:31:02,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 893/ 1625], loss: 1.258, per_step_time: 1474ms, lr: 2.973463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:02,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.42639 samples/s/p 5:37:24 } +2024-07-25 19:31:05,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 895/ 1625], loss: 1.282, per_step_time: 1470ms, lr: 2.9733445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:05,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.43891 samples/s/p 5:36:35 } +2024-07-25 19:31:08,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 897/ 1625], loss: 1.307, per_step_time: 1470ms, lr: 2.9732257e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:08,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.44003 samples/s/p 5:36:28 } +2024-07-25 19:31:11,224 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 899/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 2.973106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:11,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.43176 samples/s/p 5:36:55 } +2024-07-25 19:31:14,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 901/ 1625], loss: 1.169, per_step_time: 1473ms, lr: 2.9729865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:14,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.42885 samples/s/p 5:37:03 } +2024-07-25 19:31:17,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 903/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 2.9728668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:17,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43555 samples/s/p 5:36:35 } +2024-07-25 19:31:20,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 905/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 2.9727466e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:20,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43560 samples/s/p 5:36:32 } +2024-07-25 19:31:23,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 907/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.9726263e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:23,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43656 samples/s/p 5:36:26 } +2024-07-25 19:31:25,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 909/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.9725057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:31:25,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43261 samples/s/p 5:36:38 } +2024-07-25 19:31:28,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 911/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 2.972385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:28,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43959 samples/s/p 5:36:09 } +2024-07-25 19:31:31,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 913/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.9722638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:31,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43540 samples/s/p 5:36:21 } +2024-07-25 19:31:34,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 915/ 1625], loss: 1.150, per_step_time: 1473ms, lr: 2.9721425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:34,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43013 samples/s/p 5:36:38 } +2024-07-25 19:31:37,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 917/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 2.9720208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:37,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43737 samples/s/p 5:36:08 } +2024-07-25 19:31:40,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 919/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 2.9718987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:40,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.44083 samples/s/p 5:35:52 } +2024-07-25 19:31:43,683 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 921/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 2.9717767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:43,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43552 samples/s/p 5:36:09 } +2024-07-25 19:31:46,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 923/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 2.9716544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:46,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43530 samples/s/p 5:36:07 } +2024-07-25 19:31:49,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 925/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 2.9715315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:49,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43098 samples/s/p 5:36:20 } +2024-07-25 19:31:52,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 927/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.9714083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:52,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43495 samples/s/p 5:36:02 } +2024-07-25 19:31:55,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 929/ 1625], loss: 1.329, per_step_time: 1472ms, lr: 2.9712852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:55,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43384 samples/s/p 5:36:04 } +2024-07-25 19:31:58,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 931/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 2.9711617e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:31:58,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43400 samples/s/p 5:36:00 } +2024-07-25 19:32:01,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 933/ 1625], loss: 1.436, per_step_time: 1474ms, lr: 2.971038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:01,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.42738 samples/s/p 5:36:22 } +2024-07-25 19:32:04,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 935/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 2.9709141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:04,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43183 samples/s/p 5:36:02 } +2024-07-25 19:32:07,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 937/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 2.9707897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:07,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43726 samples/s/p 5:35:39 } +2024-07-25 19:32:10,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 939/ 1625], loss: 1.044, per_step_time: 1481ms, lr: 2.9706653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:10,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.39921 samples/s/p 5:37:58 } +2024-07-25 19:32:13,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 941/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.9705405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:13,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43797 samples/s/p 5:35:31 } +2024-07-25 19:32:16,171 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 943/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 2.9704153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:16,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43414 samples/s/p 5:35:42 } +2024-07-25 19:32:19,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 945/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.9702898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:19,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43528 samples/s/p 5:35:35 } +2024-07-25 19:32:22,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 947/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 2.9701643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:22,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43857 samples/s/p 5:35:19 } +2024-07-25 19:32:25,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 949/ 1625], loss: 0.999, per_step_time: 1472ms, lr: 2.9700386e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:25,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43358 samples/s/p 5:35:35 } +2024-07-25 19:32:27,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 951/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.9699124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:27,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43310 samples/s/p 5:35:34 } +2024-07-25 19:32:30,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 953/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 2.9697861e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:32:30,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43564 samples/s/p 5:35:22 } +2024-07-25 19:32:33,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 955/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 2.9696595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:33,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.42860 samples/s/p 5:35:45 } +2024-07-25 19:32:36,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 957/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 2.9695326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:36,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.42963 samples/s/p 5:35:38 } +2024-07-25 19:32:39,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 959/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 2.9694054e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:39,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43252 samples/s/p 5:35:24 } +2024-07-25 19:32:42,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 961/ 1625], loss: 1.044, per_step_time: 1473ms, lr: 2.969278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:42,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43047 samples/s/p 5:35:29 } +2024-07-25 19:32:45,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 963/ 1625], loss: 1.204, per_step_time: 1473ms, lr: 2.9691504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:45,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43024 samples/s/p 5:35:27 } +2024-07-25 19:32:48,669 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 965/ 1625], loss: 1.397, per_step_time: 1483ms, lr: 2.9690224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:48,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.39168 samples/s/p 5:37:48 } +2024-07-25 19:32:51,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 967/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.9688941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:51,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.43627 samples/s/p 5:34:59 } +2024-07-25 19:32:54,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 969/ 1625], loss: 0.999, per_step_time: 1471ms, lr: 2.9687657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:54,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.43524 samples/s/p 5:34:59 } +2024-07-25 19:32:57,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 971/ 1625], loss: 1.005, per_step_time: 1472ms, lr: 2.9686367e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:57,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.43364 samples/s/p 5:35:02 } +2024-07-25 19:33:00,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 973/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.9685078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:00,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.43362 samples/s/p 5:35:00 } +2024-07-25 19:33:03,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 975/ 1625], loss: 1.261, per_step_time: 1470ms, lr: 2.9683788e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:33:03,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.43940 samples/s/p 5:34:35 } +2024-07-25 19:33:06,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 977/ 1625], loss: 1.140, per_step_time: 1474ms, lr: 2.9682491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:06,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.42569 samples/s/p 5:35:23 } +2024-07-25 19:33:09,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 979/ 1625], loss: 1.144, per_step_time: 1470ms, lr: 2.9681194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:09,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.43860 samples/s/p 5:34:32 } +2024-07-25 19:33:12,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 981/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 2.9679892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:12,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.43738 samples/s/p 5:34:34 } +2024-07-25 19:33:15,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 983/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.967859e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:15,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.43219 samples/s/p 5:34:50 } +2024-07-25 19:33:18,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 985/ 1625], loss: 0.980, per_step_time: 1472ms, lr: 2.9677285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:18,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43239 samples/s/p 5:34:46 } +2024-07-25 19:33:21,134 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 987/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 2.9675975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:21,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43315 samples/s/p 5:34:41 } +2024-07-25 19:33:24,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 989/ 1625], loss: 1.337, per_step_time: 1472ms, lr: 2.9674666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:24,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43247 samples/s/p 5:34:40 } +2024-07-25 19:33:27,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 991/ 1625], loss: 1.347, per_step_time: 1471ms, lr: 2.967335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:27,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43816 samples/s/p 5:34:16 } +2024-07-25 19:33:29,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 993/ 1625], loss: 1.390, per_step_time: 1472ms, lr: 2.9672035e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:29,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43372 samples/s/p 5:34:30 } +2024-07-25 19:33:32,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 995/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 2.9670717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:32,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.44049 samples/s/p 5:34:02 } +2024-07-25 19:33:35,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 997/ 1625], loss: 1.206, per_step_time: 1472ms, lr: 2.9669396e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:33:35,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43290 samples/s/p 5:34:27 } +2024-07-25 19:33:38,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 999/ 1625], loss: 1.359, per_step_time: 1471ms, lr: 2.9668072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:38,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43744 samples/s/p 5:34:07 } +2024-07-25 19:33:41,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1001/ 1625], loss: 0.931, per_step_time: 1471ms, lr: 2.9666744e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:41,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43598 samples/s/p 5:34:10 } +2024-07-25 19:33:44,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1003/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.9665418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:44,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43583 samples/s/p 5:34:07 } +2024-07-25 19:33:47,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1005/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 2.9664083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:47,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.42817 samples/s/p 5:34:33 } +2024-07-25 19:33:50,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1007/ 1625], loss: 1.099, per_step_time: 1469ms, lr: 2.966275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:50,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.44355 samples/s/p 5:33:33 } +2024-07-25 19:33:53,591 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1009/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.9661414e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:53,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43517 samples/s/p 5:34:01 } +2024-07-25 19:33:56,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1011/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.9660072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:56,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43527 samples/s/p 5:33:58 } +2024-07-25 19:33:59,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1013/ 1625], loss: 1.163, per_step_time: 1473ms, lr: 2.9658731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:59,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43025 samples/s/p 5:34:13 } +2024-07-25 19:34:02,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1015/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 2.9657387e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:02,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43432 samples/s/p 5:33:55 } +2024-07-25 19:34:05,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1017/ 1625], loss: 1.266, per_step_time: 1474ms, lr: 2.9656037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:05,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.42619 samples/s/p 5:34:22 } +2024-07-25 19:34:08,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1019/ 1625], loss: 1.044, per_step_time: 1470ms, lr: 2.9654688e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:34:08,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.44035 samples/s/p 5:33:27 } +2024-07-25 19:34:11,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1021/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 2.9653334e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:11,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43149 samples/s/p 5:33:57 } +2024-07-25 19:34:14,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1023/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 2.9651981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:14,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43150 samples/s/p 5:33:54 } +2024-07-25 19:34:17,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1025/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.965062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:17,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43419 samples/s/p 5:33:41 } +2024-07-25 19:34:20,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1027/ 1625], loss: 1.127, per_step_time: 1473ms, lr: 2.964926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:20,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43038 samples/s/p 5:33:52 } +2024-07-25 19:34:23,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1029/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 2.9647897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:23,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43427 samples/s/p 5:33:35 } +2024-07-25 19:34:26,066 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1031/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.9646533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:26,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43201 samples/s/p 5:33:40 } +2024-07-25 19:34:29,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1033/ 1625], loss: 1.294, per_step_time: 1472ms, lr: 2.9645162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:29,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43250 samples/s/p 5:33:35 } +2024-07-25 19:34:31,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1035/ 1625], loss: 1.417, per_step_time: 1473ms, lr: 2.9643794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:31,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43009 samples/s/p 5:33:41 } +2024-07-25 19:34:34,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1037/ 1625], loss: 1.258, per_step_time: 1471ms, lr: 2.964242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:34,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43501 samples/s/p 5:33:20 } +2024-07-25 19:34:37,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1039/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 2.9641044e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:37,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43226 samples/s/p 5:33:27 } +2024-07-25 19:34:40,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1041/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.9639665e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:34:40,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43266 samples/s/p 5:33:23 } +2024-07-25 19:34:43,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1043/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 2.9638284e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:43,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43559 samples/s/p 5:33:09 } +2024-07-25 19:34:46,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1045/ 1625], loss: 1.303, per_step_time: 1473ms, lr: 2.96369e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:46,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.42897 samples/s/p 5:33:31 } +2024-07-25 19:34:49,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1047/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.9635514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:49,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43511 samples/s/p 5:33:05 } +2024-07-25 19:34:52,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1049/ 1625], loss: 0.921, per_step_time: 1471ms, lr: 2.9634124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:52,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43789 samples/s/p 5:32:52 } +2024-07-25 19:34:55,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1051/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 2.963273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:55,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43484 samples/s/p 5:33:00 } +2024-07-25 19:34:58,534 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1053/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 2.9631337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:58,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43654 samples/s/p 5:32:51 } +2024-07-25 19:35:01,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1055/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 2.962994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:01,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.44174 samples/s/p 5:32:29 } +2024-07-25 19:35:04,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1057/ 1625], loss: 1.247, per_step_time: 1470ms, lr: 2.962854e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:04,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.44023 samples/s/p 5:32:32 } +2024-07-25 19:35:07,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1059/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 2.9627137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:07,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43449 samples/s/p 5:32:50 } +2024-07-25 19:35:10,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1061/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 2.9625733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:10,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43374 samples/s/p 5:32:50 } +2024-07-25 19:35:13,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1063/ 1625], loss: 1.144, per_step_time: 1470ms, lr: 2.9624325e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:35:13,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43926 samples/s/p 5:32:26 } +2024-07-25 19:35:16,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1065/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 2.9622914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:16,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43384 samples/s/p 5:32:43 } +2024-07-25 19:35:19,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1067/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 2.9621502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:19,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43439 samples/s/p 5:32:38 } +2024-07-25 19:35:22,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1069/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.9620089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:22,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43360 samples/s/p 5:32:38 } +2024-07-25 19:35:25,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1071/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.961867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:25,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43591 samples/s/p 5:32:27 } +2024-07-25 19:35:28,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1073/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.961725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:28,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43559 samples/s/p 5:32:25 } +2024-07-25 19:35:30,991 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1075/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.9615825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:30,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43346 samples/s/p 5:32:30 } +2024-07-25 19:35:33,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1077/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 2.9614399e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:33,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.44164 samples/s/p 5:31:57 } +2024-07-25 19:35:36,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1079/ 1625], loss: 1.244, per_step_time: 1475ms, lr: 2.961297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:36,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.42110 samples/s/p 5:33:10 } +2024-07-25 19:35:39,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1081/ 1625], loss: 1.100, per_step_time: 1473ms, lr: 2.9611541e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:39,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43107 samples/s/p 5:32:30 } +2024-07-25 19:35:42,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1083/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.9610108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:42,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43607 samples/s/p 5:32:09 } +2024-07-25 19:35:45,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1085/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 2.960867e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:35:45,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43366 samples/s/p 5:32:14 } +2024-07-25 19:35:48,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1087/ 1625], loss: 1.018, per_step_time: 1471ms, lr: 2.9607232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:48,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43788 samples/s/p 5:31:56 } +2024-07-25 19:35:51,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1089/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 2.960579e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:51,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43645 samples/s/p 5:31:58 } +2024-07-25 19:35:54,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1091/ 1625], loss: 1.055, per_step_time: 1471ms, lr: 2.9604347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:54,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43651 samples/s/p 5:31:55 } +2024-07-25 19:35:57,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1093/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 2.96029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:57,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.42802 samples/s/p 5:32:23 } +2024-07-25 19:36:00,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1095/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 2.9601451e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:00,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43285 samples/s/p 5:32:03 } +2024-07-25 19:36:03,462 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1097/ 1625], loss: 1.317, per_step_time: 1472ms, lr: 2.96e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:03,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43347 samples/s/p 5:31:58 } +2024-07-25 19:36:06,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1099/ 1625], loss: 1.249, per_step_time: 1474ms, lr: 2.9598543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:06,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.42689 samples/s/p 5:32:19 } +2024-07-25 19:36:09,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1101/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 2.9597088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:09,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43955 samples/s/p 5:31:29 } +2024-07-25 19:36:12,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1103/ 1625], loss: 1.110, per_step_time: 1474ms, lr: 2.9595627e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:12,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.42713 samples/s/p 5:32:12 } +2024-07-25 19:36:15,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1105/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 2.9594165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:15,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43508 samples/s/p 5:31:40 } +2024-07-25 19:36:18,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1107/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.9592702e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:36:18,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43123 samples/s/p 5:31:51 } +2024-07-25 19:36:21,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1109/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 2.9591232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:21,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.42933 samples/s/p 5:31:55 } +2024-07-25 19:36:24,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1111/ 1625], loss: 1.093, per_step_time: 1473ms, lr: 2.9589763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:24,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43078 samples/s/p 5:31:47 } +2024-07-25 19:36:27,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1113/ 1625], loss: 1.123, per_step_time: 1473ms, lr: 2.958829e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:27,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.42962 samples/s/p 5:31:48 } +2024-07-25 19:36:30,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1115/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 2.9586816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:30,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43935 samples/s/p 5:31:10 } +2024-07-25 19:36:32,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1117/ 1625], loss: 1.110, per_step_time: 1473ms, lr: 2.9585337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:32,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43075 samples/s/p 5:31:38 } +2024-07-25 19:36:35,940 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1119/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 2.9583858e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:35,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43327 samples/s/p 5:31:26 } +2024-07-25 19:36:38,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1121/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.9582376e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:38,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43383 samples/s/p 5:31:21 } +2024-07-25 19:36:41,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1123/ 1625], loss: 1.430, per_step_time: 1471ms, lr: 2.9580888e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:41,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43621 samples/s/p 5:31:09 } +2024-07-25 19:36:44,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1125/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 2.95794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:44,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43495 samples/s/p 5:31:11 } +2024-07-25 19:36:47,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1127/ 1625], loss: 1.177, per_step_time: 1469ms, lr: 2.9577908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:47,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.44529 samples/s/p 5:30:30 } +2024-07-25 19:36:50,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1129/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.9576418e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:36:50,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43112 samples/s/p 5:31:19 } +2024-07-25 19:36:53,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1131/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.9574921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:53,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43535 samples/s/p 5:31:01 } +2024-07-25 19:36:56,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1133/ 1625], loss: 1.323, per_step_time: 1473ms, lr: 2.957342e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:56,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43065 samples/s/p 5:31:15 } +2024-07-25 19:36:59,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1135/ 1625], loss: 1.307, per_step_time: 1471ms, lr: 2.957192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:59,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43720 samples/s/p 5:30:48 } +2024-07-25 19:37:02,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1137/ 1625], loss: 1.078, per_step_time: 1470ms, lr: 2.9570418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:02,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43902 samples/s/p 5:30:38 } +2024-07-25 19:37:05,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1139/ 1625], loss: 1.414, per_step_time: 1471ms, lr: 2.9568911e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:05,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43499 samples/s/p 5:30:50 } +2024-07-25 19:37:08,397 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1141/ 1625], loss: 1.430, per_step_time: 1472ms, lr: 2.9567402e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:08,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43360 samples/s/p 5:30:52 } +2024-07-25 19:37:11,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1143/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 2.9565892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:11,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43457 samples/s/p 5:30:46 } +2024-07-25 19:37:14,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1145/ 1625], loss: 1.254, per_step_time: 1470ms, lr: 2.9564375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:14,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.44078 samples/s/p 5:30:20 } +2024-07-25 19:37:17,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1147/ 1625], loss: 1.299, per_step_time: 1471ms, lr: 2.956286e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:17,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43572 samples/s/p 5:30:36 } +2024-07-25 19:37:20,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1149/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 2.9561339e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:20,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43036 samples/s/p 5:30:52 } +2024-07-25 19:37:23,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1151/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 2.9559818e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:37:23,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43435 samples/s/p 5:30:35 } +2024-07-25 19:37:26,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1153/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 2.9558292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:26,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.42947 samples/s/p 5:30:50 } +2024-07-25 19:37:29,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1155/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 2.9556764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:29,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43502 samples/s/p 5:30:26 } +2024-07-25 19:37:32,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1157/ 1625], loss: 1.392, per_step_time: 1473ms, lr: 2.9555236e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:32,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43016 samples/s/p 5:30:41 } +2024-07-25 19:37:34,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1159/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 2.9553703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:34,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43647 samples/s/p 5:30:15 } +2024-07-25 19:37:37,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1161/ 1625], loss: 1.114, per_step_time: 1473ms, lr: 2.955217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:37,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.42892 samples/s/p 5:30:40 } +2024-07-25 19:37:40,862 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1163/ 1625], loss: 1.184, per_step_time: 1469ms, lr: 2.9550632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:40,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.44250 samples/s/p 5:29:47 } +2024-07-25 19:37:43,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1165/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 2.954909e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:43,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.42953 samples/s/p 5:30:32 } +2024-07-25 19:37:46,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1167/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.954755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:46,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43436 samples/s/p 5:30:11 } +2024-07-25 19:37:49,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1169/ 1625], loss: 1.284, per_step_time: 1471ms, lr: 2.9546003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:49,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43531 samples/s/p 5:30:05 } +2024-07-25 19:37:52,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1171/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 2.9544455e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:52,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43428 samples/s/p 5:30:06 } +2024-07-25 19:37:55,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1173/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 2.9542905e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:37:55,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43340 samples/s/p 5:30:06 } +2024-07-25 19:37:58,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1175/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 2.954135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:58,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43442 samples/s/p 5:29:59 } +2024-07-25 19:37:58,573 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-25 19:38:34,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1177/ 1625], loss: 1.273, per_step_time: 1993ms, lr: 2.9539795e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:34,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 4.01359 samples/s/p 7:26:44 } +2024-07-25 19:38:37,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1179/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.9538238e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:37,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43598 samples/s/p 5:29:48 } +2024-07-25 19:38:40,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1181/ 1625], loss: 1.283, per_step_time: 1473ms, lr: 2.9536677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:40,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.42994 samples/s/p 5:30:07 } +2024-07-25 19:38:43,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1183/ 1625], loss: 1.303, per_step_time: 1474ms, lr: 2.9535113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:43,064 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.42603 samples/s/p 5:30:18 } +2024-07-25 19:38:46,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1185/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 2.9533547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:46,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43303 samples/s/p 5:29:50 } +2024-07-25 19:38:48,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1187/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 2.9531979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:48,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43390 samples/s/p 5:29:43 } +2024-07-25 19:38:51,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1189/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 2.9530409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:51,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43849 samples/s/p 5:29:24 } +2024-07-25 19:38:54,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1191/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 2.9528832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:54,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43692 samples/s/p 5:29:27 } +2024-07-25 19:38:57,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1193/ 1625], loss: 1.278, per_step_time: 1473ms, lr: 2.9527255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:57,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.42854 samples/s/p 5:29:54 } +2024-07-25 19:39:00,775 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 2/ 10], step:[ 1195/ 1625], loss: 1.164, per_step_time: 1473ms, lr: 2.952568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:00,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.42940 samples/s/p 5:29:48 } +2024-07-25 19:39:03,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1197/ 1625], loss: 1.303, per_step_time: 1473ms, lr: 2.9524095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:03,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.43099 samples/s/p 5:29:39 } +2024-07-25 19:39:06,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1199/ 1625], loss: 1.061, per_step_time: 1473ms, lr: 2.9522513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:06,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.43093 samples/s/p 5:29:37 } +2024-07-25 19:39:09,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1201/ 1625], loss: 1.146, per_step_time: 1475ms, lr: 2.9520925e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:09,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.42292 samples/s/p 5:30:03 } +2024-07-25 19:39:12,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1203/ 1625], loss: 1.131, per_step_time: 1470ms, lr: 2.9519335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:12,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.44043 samples/s/p 5:28:56 } +2024-07-25 19:39:15,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1205/ 1625], loss: 1.057, per_step_time: 1472ms, lr: 2.9517743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:15,541 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.43260 samples/s/p 5:29:22 } +2024-07-25 19:39:18,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1207/ 1625], loss: 1.056, per_step_time: 1474ms, lr: 2.951615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:18,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.42554 samples/s/p 5:29:44 } +2024-07-25 19:39:21,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1209/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.9514551e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:21,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.43269 samples/s/p 5:29:15 } +2024-07-25 19:39:24,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1211/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 2.9512954e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:24,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43222 samples/s/p 5:29:14 } +2024-07-25 19:39:27,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1213/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 2.951135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:27,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43612 samples/s/p 5:28:57 } +2024-07-25 19:39:30,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1215/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 2.9509745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:30,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43684 samples/s/p 5:28:52 } +2024-07-25 19:39:33,254 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 1217/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 2.9508139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:33,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43580 samples/s/p 5:28:52 } +2024-07-25 19:39:36,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1219/ 1625], loss: 1.112, per_step_time: 1474ms, lr: 2.950653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:36,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.42591 samples/s/p 5:29:25 } +2024-07-25 19:39:39,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1221/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 2.9504916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:39,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.42899 samples/s/p 5:29:11 } +2024-07-25 19:39:42,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1223/ 1625], loss: 1.106, per_step_time: 1473ms, lr: 2.95033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:42,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43026 samples/s/p 5:29:04 } +2024-07-25 19:39:45,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1225/ 1625], loss: 1.107, per_step_time: 1474ms, lr: 2.9501683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:45,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.42668 samples/s/p 5:29:14 } +2024-07-25 19:39:48,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1227/ 1625], loss: 1.176, per_step_time: 1475ms, lr: 2.9500063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:48,033 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.42260 samples/s/p 5:29:26 } +2024-07-25 19:39:50,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1229/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.9498437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:50,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.43236 samples/s/p 5:28:47 } +2024-07-25 19:39:53,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1231/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.9496812e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:53,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.43279 samples/s/p 5:28:43 } +2024-07-25 19:39:56,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1233/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.9495186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:56,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.43337 samples/s/p 5:28:38 } +2024-07-25 19:39:59,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1235/ 1625], loss: 1.037, per_step_time: 1474ms, lr: 2.9493556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:59,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.42711 samples/s/p 5:28:57 } +2024-07-25 19:40:02,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1237/ 1625], loss: 1.073, per_step_time: 1474ms, lr: 2.9491921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:02,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.42586 samples/s/p 5:28:59 } +2024-07-25 19:40:05,783 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 2/ 10], step:[ 1239/ 1625], loss: 1.031, per_step_time: 1487ms, lr: 2.9490286e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:05,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.37823 samples/s/p 5:31:51 } +2024-07-25 19:40:08,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1241/ 1625], loss: 1.136, per_step_time: 1474ms, lr: 2.9488647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:08,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.42637 samples/s/p 5:28:51 } +2024-07-25 19:40:11,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1243/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 2.9487004e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:11,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.43727 samples/s/p 5:28:09 } +2024-07-25 19:40:14,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1245/ 1625], loss: 1.206, per_step_time: 1474ms, lr: 2.9485363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:14,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42530 samples/s/p 5:28:49 } +2024-07-25 19:40:17,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1247/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 2.9483715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:17,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42785 samples/s/p 5:28:37 } +2024-07-25 19:40:20,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1249/ 1625], loss: 1.202, per_step_time: 1474ms, lr: 2.9482066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:20,559 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42459 samples/s/p 5:28:46 } +2024-07-25 19:40:23,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1251/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 2.9480416e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:23,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.43481 samples/s/p 5:28:06 } +2024-07-25 19:40:26,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1253/ 1625], loss: 1.152, per_step_time: 1474ms, lr: 2.9478762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:26,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42702 samples/s/p 5:28:31 } +2024-07-25 19:40:29,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1255/ 1625], loss: 1.260, per_step_time: 1474ms, lr: 2.9477103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:29,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42511 samples/s/p 5:28:35 } +2024-07-25 19:40:32,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1257/ 1625], loss: 1.254, per_step_time: 1473ms, lr: 2.9475446e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:32,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42743 samples/s/p 5:28:24 } +2024-07-25 19:40:35,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1259/ 1625], loss: 1.303, per_step_time: 1472ms, lr: 2.9473786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:35,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.43321 samples/s/p 5:28:00 } +2024-07-25 19:40:38,283 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 2/ 10], step:[ 1261/ 1625], loss: 1.050, per_step_time: 1472ms, lr: 2.947212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:38,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43141 samples/s/p 5:28:04 } +2024-07-25 19:40:41,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1263/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 2.9470451e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:41,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43644 samples/s/p 5:27:42 } +2024-07-25 19:40:44,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1265/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 2.9468785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:44,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43673 samples/s/p 5:27:38 } +2024-07-25 19:40:47,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1267/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.9467114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:47,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43352 samples/s/p 5:27:47 } +2024-07-25 19:40:50,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1269/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.9465436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:50,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43118 samples/s/p 5:27:53 } +2024-07-25 19:40:53,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1271/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.9463761e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:53,041 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43208 samples/s/p 5:27:46 } +2024-07-25 19:40:55,991 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1273/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.9462082e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:55,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43717 samples/s/p 5:27:25 } +2024-07-25 19:40:58,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1275/ 1625], loss: 1.209, per_step_time: 1474ms, lr: 2.94604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:58,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.42390 samples/s/p 5:28:10 } +2024-07-25 19:41:01,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1277/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 2.9458712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:01,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.44028 samples/s/p 5:27:08 } +2024-07-25 19:41:04,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1279/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.9457025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:04,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43122 samples/s/p 5:27:38 } +2024-07-25 19:41:07,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1281/ 1625], loss: 1.315, per_step_time: 1474ms, lr: 2.9455336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:07,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.42576 samples/s/p 5:27:55 } +2024-07-25 19:41:10,760 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 1283/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 2.9453642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:10,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43168 samples/s/p 5:27:30 } +2024-07-25 19:41:13,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1285/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 2.9451949e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:13,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43928 samples/s/p 5:27:00 } +2024-07-25 19:41:16,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1287/ 1625], loss: 1.305, per_step_time: 1470ms, lr: 2.945025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:16,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.44050 samples/s/p 5:26:52 } +2024-07-25 19:41:19,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1289/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 2.944855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:19,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43087 samples/s/p 5:27:24 } +2024-07-25 19:41:22,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1291/ 1625], loss: 1.329, per_step_time: 1469ms, lr: 2.9446848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:22,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.44261 samples/s/p 5:26:39 } +2024-07-25 19:41:25,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1293/ 1625], loss: 1.257, per_step_time: 1473ms, lr: 2.9445142e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:25,512 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.43071 samples/s/p 5:27:19 } +2024-07-25 19:41:28,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1295/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.9443434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:28,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.43559 samples/s/p 5:26:58 } +2024-07-25 19:41:31,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1297/ 1625], loss: 1.246, per_step_time: 1473ms, lr: 2.9441722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:31,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.42816 samples/s/p 5:27:22 } +2024-07-25 19:41:34,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1299/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 2.9440009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:34,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.43385 samples/s/p 5:26:59 } +2024-07-25 19:41:37,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1301/ 1625], loss: 1.187, per_step_time: 1470ms, lr: 2.9438293e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:37,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.43961 samples/s/p 5:26:35 } +2024-07-25 19:41:40,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1303/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.9436576e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:40,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.42809 samples/s/p 5:27:14 } +2024-07-25 19:41:43,223 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1305/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.9434856e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:43,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.43803 samples/s/p 5:26:35 } +2024-07-25 19:41:46,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1307/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 2.943313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:46,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.43627 samples/s/p 5:26:38 } +2024-07-25 19:41:49,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1309/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 2.9431405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:49,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.44111 samples/s/p 5:26:18 } +2024-07-25 19:41:52,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1311/ 1625], loss: 1.217, per_step_time: 1469ms, lr: 2.9429677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:52,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.44376 samples/s/p 5:26:05 } +2024-07-25 19:41:55,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1313/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 2.9427943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:55,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43334 samples/s/p 5:26:40 } +2024-07-25 19:41:57,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1315/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.9426212e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:41:57,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43516 samples/s/p 5:26:30 } +2024-07-25 19:42:00,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1317/ 1625], loss: 1.212, per_step_time: 1473ms, lr: 2.9424475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:00,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.42923 samples/s/p 5:26:49 } +2024-07-25 19:42:03,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1319/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 2.9422736e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:03,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43882 samples/s/p 5:26:11 } +2024-07-25 19:42:06,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1321/ 1625], loss: 1.306, per_step_time: 1472ms, lr: 2.9420993e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:06,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43275 samples/s/p 5:26:30 } +2024-07-25 19:42:09,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1323/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 2.941925e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:09,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43045 samples/s/p 5:26:36 } +2024-07-25 19:42:12,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1325/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.9417504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:12,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43469 samples/s/p 5:26:17 } +2024-07-25 19:42:15,682 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1327/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 2.9415754e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:15,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43161 samples/s/p 5:26:26 } +2024-07-25 19:42:18,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1329/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 2.9414003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:18,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43611 samples/s/p 5:26:06 } +2024-07-25 19:42:21,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1331/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 2.941225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:21,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43653 samples/s/p 5:26:02 } +2024-07-25 19:42:24,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1333/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.941049e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:24,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43380 samples/s/p 5:26:09 } +2024-07-25 19:42:27,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1335/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.9408731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:27,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43279 samples/s/p 5:26:10 } +2024-07-25 19:42:30,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1337/ 1625], loss: 1.186, per_step_time: 1480ms, lr: 2.940697e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:42:30,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.40299 samples/s/p 5:27:55 } +2024-07-25 19:42:33,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1339/ 1625], loss: 1.294, per_step_time: 1472ms, lr: 2.9405206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:33,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43378 samples/s/p 5:26:00 } +2024-07-25 19:42:36,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1341/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 2.9403436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:36,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.43485 samples/s/p 5:25:53 } +2024-07-25 19:42:39,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1343/ 1625], loss: 1.110, per_step_time: 1474ms, lr: 2.9401668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:39,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.42569 samples/s/p 5:26:23 } +2024-07-25 19:42:42,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1345/ 1625], loss: 1.262, per_step_time: 1473ms, lr: 2.9399896e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:42,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.43021 samples/s/p 5:26:04 } +2024-07-25 19:42:45,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1347/ 1625], loss: 1.154, per_step_time: 1477ms, lr: 2.939812e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:45,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.41513 samples/s/p 5:26:56 } +2024-07-25 19:42:48,182 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1349/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 2.9396344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:48,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.43285 samples/s/p 5:25:49 } +2024-07-25 19:42:51,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1351/ 1625], loss: 1.387, per_step_time: 1474ms, lr: 2.9394563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:51,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.42635 samples/s/p 5:26:09 } +2024-07-25 19:42:54,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1353/ 1625], loss: 1.204, per_step_time: 1474ms, lr: 2.939278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:54,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.42579 samples/s/p 5:26:08 } +2024-07-25 19:42:57,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1355/ 1625], loss: 1.093, per_step_time: 1472ms, lr: 2.9390996e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:57,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.43131 samples/s/p 5:25:45 } +2024-07-25 19:42:59,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1357/ 1625], loss: 1.159, per_step_time: 1469ms, lr: 2.9389208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:59,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.44246 samples/s/p 5:25:02 } +2024-07-25 19:43:02,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1359/ 1625], loss: 1.142, per_step_time: 1473ms, lr: 2.9387418e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:43:02,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.42753 samples/s/p 5:25:53 } +2024-07-25 19:43:05,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1361/ 1625], loss: 1.349, per_step_time: 1472ms, lr: 2.9385625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:05,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43410 samples/s/p 5:25:27 } +2024-07-25 19:43:08,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1363/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.938383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:08,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43479 samples/s/p 5:25:21 } +2024-07-25 19:43:11,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1365/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 2.938203e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:11,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43584 samples/s/p 5:25:14 } +2024-07-25 19:43:14,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1367/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.9380231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:14,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.42929 samples/s/p 5:25:35 } +2024-07-25 19:43:17,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1369/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 2.9378429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:17,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43277 samples/s/p 5:25:20 } +2024-07-25 19:43:20,663 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1371/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.9376622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:20,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43271 samples/s/p 5:25:17 } +2024-07-25 19:43:23,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1373/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 2.9374814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:23,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43272 samples/s/p 5:25:14 } +2024-07-25 19:43:26,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1375/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 2.9373005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:26,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43467 samples/s/p 5:25:04 } +2024-07-25 19:43:29,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1377/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.937119e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:29,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43264 samples/s/p 5:25:08 } +2024-07-25 19:43:32,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1379/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 2.9369374e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:32,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43401 samples/s/p 5:25:00 } +2024-07-25 19:43:35,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1381/ 1625], loss: 1.282, per_step_time: 1474ms, lr: 2.9367557e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:43:35,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.42622 samples/s/p 5:25:25 } +2024-07-25 19:43:38,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1383/ 1625], loss: 1.317, per_step_time: 1473ms, lr: 2.9365734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:38,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.42845 samples/s/p 5:25:14 } +2024-07-25 19:43:41,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1385/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 2.9363911e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:41,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43690 samples/s/p 5:24:41 } +2024-07-25 19:43:44,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1387/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.9362083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:44,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43155 samples/s/p 5:24:57 } +2024-07-25 19:43:47,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1389/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.9360255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:47,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43607 samples/s/p 5:24:38 } +2024-07-25 19:43:50,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1391/ 1625], loss: 1.398, per_step_time: 1473ms, lr: 2.9358425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:50,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.43098 samples/s/p 5:24:54 } +2024-07-25 19:43:53,149 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1393/ 1625], loss: 1.107, per_step_time: 1477ms, lr: 2.9356592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:53,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.41425 samples/s/p 5:25:51 } +2024-07-25 19:43:56,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1395/ 1625], loss: 1.090, per_step_time: 1473ms, lr: 2.9354755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:56,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.42862 samples/s/p 5:24:56 } +2024-07-25 19:43:59,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1397/ 1625], loss: 1.022, per_step_time: 1473ms, lr: 2.9352916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:59,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.42988 samples/s/p 5:24:49 } +2024-07-25 19:44:02,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1399/ 1625], loss: 1.191, per_step_time: 1473ms, lr: 2.9351077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:02,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.43096 samples/s/p 5:24:42 } +2024-07-25 19:44:04,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1401/ 1625], loss: 1.078, per_step_time: 1476ms, lr: 2.934923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:04,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.41853 samples/s/p 5:25:24 } +2024-07-25 19:44:07,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1403/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.9347384e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:44:07,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.43582 samples/s/p 5:24:19 } +2024-07-25 19:44:10,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1405/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.9345534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:10,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.43146 samples/s/p 5:24:31 } +2024-07-25 19:44:13,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1407/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 2.9343682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:13,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.42797 samples/s/p 5:24:41 } +2024-07-25 19:44:16,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1409/ 1625], loss: 1.185, per_step_time: 1469ms, lr: 2.9341829e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:16,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.44355 samples/s/p 5:23:42 } +2024-07-25 19:44:19,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1411/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.9339972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:19,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.43318 samples/s/p 5:24:16 } +2024-07-25 19:44:22,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1413/ 1625], loss: 1.118, per_step_time: 1474ms, lr: 2.9338113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:22,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.42400 samples/s/p 5:24:46 } +2024-07-25 19:44:25,642 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1415/ 1625], loss: 1.077, per_step_time: 1474ms, lr: 2.9336252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:25,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.42651 samples/s/p 5:24:34 } +2024-07-25 19:44:28,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1417/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 2.9334386e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:28,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.43375 samples/s/p 5:24:05 } +2024-07-25 19:44:31,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1419/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.933252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:31,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.42932 samples/s/p 5:24:18 } +2024-07-25 19:44:34,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1421/ 1625], loss: 1.141, per_step_time: 1474ms, lr: 2.9330648e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:34,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.42665 samples/s/p 5:24:25 } +2024-07-25 19:44:37,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1423/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.9328778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:37,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43343 samples/s/p 5:23:58 } +2024-07-25 19:44:40,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1425/ 1625], loss: 1.198, per_step_time: 1473ms, lr: 2.9326904e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:44:40,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43021 samples/s/p 5:24:06 } +2024-07-25 19:44:43,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1427/ 1625], loss: 0.987, per_step_time: 1471ms, lr: 2.9325025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:43,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43516 samples/s/p 5:23:46 } +2024-07-25 19:44:46,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1429/ 1625], loss: 1.048, per_step_time: 1474ms, lr: 2.9323146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:46,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.42436 samples/s/p 5:24:21 } +2024-07-25 19:44:49,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1431/ 1625], loss: 1.013, per_step_time: 1471ms, lr: 2.9321263e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:49,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43714 samples/s/p 5:23:33 } +2024-07-25 19:44:52,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1433/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 2.9319379e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:52,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43616 samples/s/p 5:23:33 } +2024-07-25 19:44:55,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1435/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.931749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:55,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43758 samples/s/p 5:23:25 } +2024-07-25 19:44:58,118 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1437/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 2.9315599e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:58,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43559 samples/s/p 5:23:29 } +2024-07-25 19:45:01,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1439/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.931371e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:01,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43755 samples/s/p 5:23:19 } +2024-07-25 19:45:04,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1441/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 2.9311814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:04,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.42960 samples/s/p 5:23:45 } +2024-07-25 19:45:06,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1443/ 1625], loss: 1.247, per_step_time: 1475ms, lr: 2.9309916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:06,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.42058 samples/s/p 5:24:14 } +2024-07-25 19:45:09,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1445/ 1625], loss: 1.239, per_step_time: 1472ms, lr: 2.9308016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:09,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43377 samples/s/p 5:23:24 } +2024-07-25 19:45:12,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1447/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 2.9306113e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:45:12,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43567 samples/s/p 5:23:14 } +2024-07-25 19:45:15,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1449/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 2.9304209e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:15,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43369 samples/s/p 5:23:18 } +2024-07-25 19:45:18,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1451/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.93023e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:18,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43722 samples/s/p 5:23:03 } +2024-07-25 19:45:21,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1453/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 2.930039e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:21,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43001 samples/s/p 5:23:26 } +2024-07-25 19:45:24,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1455/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 2.9298477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:24,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.43446 samples/s/p 5:23:07 } +2024-07-25 19:45:27,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1457/ 1625], loss: 1.217, per_step_time: 1474ms, lr: 2.9296561e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:27,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.42475 samples/s/p 5:23:39 } +2024-07-25 19:45:30,595 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1459/ 1625], loss: 1.265, per_step_time: 1470ms, lr: 2.9294642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:30,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.43990 samples/s/p 5:22:42 } +2024-07-25 19:45:33,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1461/ 1625], loss: 1.182, per_step_time: 1474ms, lr: 2.9292723e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:33,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.42641 samples/s/p 5:23:27 } +2024-07-25 19:45:36,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1463/ 1625], loss: 1.388, per_step_time: 1474ms, lr: 2.9290799e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:36,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.42400 samples/s/p 5:23:32 } +2024-07-25 19:45:39,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1465/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 2.9288873e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:39,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.42860 samples/s/p 5:23:13 } +2024-07-25 19:45:42,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1467/ 1625], loss: 1.293, per_step_time: 1470ms, lr: 2.9286944e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:42,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.43882 samples/s/p 5:22:34 } +2024-07-25 19:45:45,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1469/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.9285015e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:45:45,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.43285 samples/s/p 5:22:52 } +2024-07-25 19:45:48,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1471/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 2.9283083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:48,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43525 samples/s/p 5:22:41 } +2024-07-25 19:45:51,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1473/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 2.9281146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:51,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43942 samples/s/p 5:22:23 } +2024-07-25 19:45:54,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1475/ 1625], loss: 1.410, per_step_time: 1472ms, lr: 2.9279207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:54,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43425 samples/s/p 5:22:38 } +2024-07-25 19:45:57,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1477/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 2.9277267e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:57,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43178 samples/s/p 5:22:44 } +2024-07-25 19:46:00,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1479/ 1625], loss: 1.365, per_step_time: 1473ms, lr: 2.9275321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:00,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43067 samples/s/p 5:22:45 } +2024-07-25 19:46:03,074 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1481/ 1625], loss: 1.300, per_step_time: 1472ms, lr: 2.9273377e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:03,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43261 samples/s/p 5:22:35 } +2024-07-25 19:46:06,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1483/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 2.9271429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:06,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43730 samples/s/p 5:22:16 } +2024-07-25 19:46:08,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1485/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.9269479e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:08,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43176 samples/s/p 5:22:32 } +2024-07-25 19:46:11,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1487/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 2.9267525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:11,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43800 samples/s/p 5:22:07 } +2024-07-25 19:46:14,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1489/ 1625], loss: 1.286, per_step_time: 1473ms, lr: 2.9265568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:14,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.42840 samples/s/p 5:22:38 } +2024-07-25 19:46:17,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1491/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 2.9263609e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:46:17,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43382 samples/s/p 5:22:16 } +2024-07-25 19:46:20,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1493/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 2.926165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:20,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43314 samples/s/p 5:22:16 } +2024-07-25 19:46:23,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1495/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 2.9259685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:23,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.42976 samples/s/p 5:22:25 } +2024-07-25 19:46:26,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1497/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.9257719e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:26,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.42812 samples/s/p 5:22:28 } +2024-07-25 19:46:29,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1499/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 2.9255749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:29,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43373 samples/s/p 5:22:05 } +2024-07-25 19:46:32,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1501/ 1625], loss: 1.293, per_step_time: 1472ms, lr: 2.9253777e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:32,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43204 samples/s/p 5:22:08 } +2024-07-25 19:46:35,548 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1503/ 1625], loss: 1.238, per_step_time: 1470ms, lr: 2.9251803e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:35,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43859 samples/s/p 5:21:42 } +2024-07-25 19:46:38,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1505/ 1625], loss: 1.197, per_step_time: 1474ms, lr: 2.9249826e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:38,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.42433 samples/s/p 5:22:29 } +2024-07-25 19:46:41,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1507/ 1625], loss: 0.925, per_step_time: 1474ms, lr: 2.9247849e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:41,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.42494 samples/s/p 5:22:24 } +2024-07-25 19:46:44,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1509/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 2.9245868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:44,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.43791 samples/s/p 5:21:35 } +2024-07-25 19:46:47,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1511/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 2.9243884e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:47,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.43068 samples/s/p 5:21:58 } +2024-07-25 19:46:50,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1513/ 1625], loss: 1.069, per_step_time: 1473ms, lr: 2.9241895e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:46:50,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.42871 samples/s/p 5:22:02 } +2024-07-25 19:46:53,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1515/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 2.9239907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:53,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.43266 samples/s/p 5:21:45 } +2024-07-25 19:46:56,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1517/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 2.9237914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:56,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.43628 samples/s/p 5:21:29 } +2024-07-25 19:46:59,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1519/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 2.923592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:59,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.43243 samples/s/p 5:21:40 } +2024-07-25 19:47:02,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1521/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.9233923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:02,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43478 samples/s/p 5:21:29 } +2024-07-25 19:47:05,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1523/ 1625], loss: 1.392, per_step_time: 1471ms, lr: 2.9231926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:05,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43633 samples/s/p 5:21:20 } +2024-07-25 19:47:08,027 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1525/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.9229921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:08,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43249 samples/s/p 5:21:31 } +2024-07-25 19:47:10,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1527/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.9227918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:10,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43699 samples/s/p 5:21:12 } +2024-07-25 19:47:13,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1529/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 2.922591e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:13,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43645 samples/s/p 5:21:11 } +2024-07-25 19:47:16,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1531/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 2.92239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:16,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43666 samples/s/p 5:21:07 } +2024-07-25 19:47:19,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1533/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 2.922189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:19,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43032 samples/s/p 5:21:27 } +2024-07-25 19:47:22,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1535/ 1625], loss: 1.117, per_step_time: 1473ms, lr: 2.9219877e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:47:22,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.42936 samples/s/p 5:21:27 } +2024-07-25 19:47:25,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1537/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 2.9217857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:25,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.42886 samples/s/p 5:21:26 } +2024-07-25 19:47:28,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1539/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 2.9215838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:28,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.43539 samples/s/p 5:21:00 } +2024-07-25 19:47:31,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1541/ 1625], loss: 1.073, per_step_time: 1472ms, lr: 2.9213817e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:31,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.43235 samples/s/p 5:21:08 } +2024-07-25 19:47:34,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1543/ 1625], loss: 1.185, per_step_time: 1473ms, lr: 2.9211793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:34,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.42962 samples/s/p 5:21:15 } +2024-07-25 19:47:37,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1545/ 1625], loss: 1.310, per_step_time: 1472ms, lr: 2.9209765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:37,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.43372 samples/s/p 5:20:57 } +2024-07-25 19:47:40,504 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1547/ 1625], loss: 1.248, per_step_time: 1473ms, lr: 2.9207737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:40,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.42789 samples/s/p 5:21:15 } +2024-07-25 19:47:43,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1549/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 2.9205703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:43,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.43137 samples/s/p 5:20:59 } +2024-07-25 19:47:46,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1551/ 1625], loss: 1.156, per_step_time: 1474ms, lr: 2.9203668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:46,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.42566 samples/s/p 5:21:17 } +2024-07-25 19:47:49,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1553/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 2.920163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:49,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.42857 samples/s/p 5:21:03 } +2024-07-25 19:47:52,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1555/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 2.9199591e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:52,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43241 samples/s/p 5:20:47 } +2024-07-25 19:47:55,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1557/ 1625], loss: 1.030, per_step_time: 1473ms, lr: 2.9197548e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:47:55,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43103 samples/s/p 5:20:49 } +2024-07-25 19:47:58,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1559/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 2.9195504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:58,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43292 samples/s/p 5:20:39 } +2024-07-25 19:48:01,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1561/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 2.9193456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:01,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43386 samples/s/p 5:20:33 } +2024-07-25 19:48:04,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1563/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 2.9191406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:04,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43723 samples/s/p 5:20:18 } +2024-07-25 19:48:07,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1565/ 1625], loss: 1.333, per_step_time: 1486ms, lr: 2.9189354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:07,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.38342 samples/s/p 5:23:27 } +2024-07-25 19:48:10,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1567/ 1625], loss: 1.139, per_step_time: 1470ms, lr: 2.9187298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:10,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43927 samples/s/p 5:20:05 } +2024-07-25 19:48:13,005 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1569/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 2.9185241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:13,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43941 samples/s/p 5:20:02 } +2024-07-25 19:48:15,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1571/ 1625], loss: 1.175, per_step_time: 1473ms, lr: 2.9183184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:15,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.42952 samples/s/p 5:20:34 } +2024-07-25 19:48:18,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1573/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 2.918112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:18,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43828 samples/s/p 5:20:00 } +2024-07-25 19:48:21,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1575/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 2.9179055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:21,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43377 samples/s/p 5:20:13 } +2024-07-25 19:48:24,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1577/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.9176985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:24,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43158 samples/s/p 5:20:17 } +2024-07-25 19:48:27,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1579/ 1625], loss: 1.100, per_step_time: 1478ms, lr: 2.9174918e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:48:27,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.41035 samples/s/p 5:21:30 } +2024-07-25 19:48:30,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1581/ 1625], loss: 1.237, per_step_time: 1475ms, lr: 2.9172843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:30,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.42298 samples/s/p 5:20:42 } +2024-07-25 19:48:33,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1583/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 2.917077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:33,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43378 samples/s/p 5:20:01 } +2024-07-25 19:48:36,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1585/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 2.9168692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:36,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.42988 samples/s/p 5:20:12 } +2024-07-25 19:48:39,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1587/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 2.9166611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:39,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43953 samples/s/p 5:19:35 } +2024-07-25 19:48:42,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1589/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 2.916453e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:42,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43206 samples/s/p 5:19:58 } +2024-07-25 19:48:45,492 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1591/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 2.9162444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:45,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43727 samples/s/p 5:19:37 } +2024-07-25 19:48:48,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1593/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 2.9160356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:48,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43323 samples/s/p 5:19:48 } +2024-07-25 19:48:51,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1595/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 2.9158266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:51,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.44076 samples/s/p 5:19:19 } +2024-07-25 19:48:54,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1597/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 2.915617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:54,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43467 samples/s/p 5:19:37 } +2024-07-25 19:48:57,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1599/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 2.9154075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:57,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43631 samples/s/p 5:19:28 } +2024-07-25 19:49:00,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1601/ 1625], loss: 1.158, per_step_time: 1474ms, lr: 2.9151977e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:49:00,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.42554 samples/s/p 5:20:04 } +2024-07-25 19:49:03,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1603/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 2.9149878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:03,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43132 samples/s/p 5:19:40 } +2024-07-25 19:49:06,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1605/ 1625], loss: 1.285, per_step_time: 1472ms, lr: 2.9147775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:06,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43227 samples/s/p 5:19:34 } +2024-07-25 19:49:09,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1607/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.9145669e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:09,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43281 samples/s/p 5:19:29 } +2024-07-25 19:49:12,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1609/ 1625], loss: 1.233, per_step_time: 1474ms, lr: 2.914356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:12,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.42575 samples/s/p 5:19:51 } +2024-07-25 19:49:15,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1611/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.914145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:15,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43477 samples/s/p 5:19:16 } +2024-07-25 19:49:17,971 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1613/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 2.9139337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:17,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43143 samples/s/p 5:19:25 } +2024-07-25 19:49:20,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1615/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 2.9137222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:20,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43668 samples/s/p 5:19:04 } +2024-07-25 19:49:23,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1617/ 1625], loss: 1.109, per_step_time: 1470ms, lr: 2.9135103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:23,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.44195 samples/s/p 5:18:42 } +2024-07-25 19:49:26,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1619/ 1625], loss: 1.271, per_step_time: 1473ms, lr: 2.9132983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:26,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.42868 samples/s/p 5:19:26 } +2024-07-25 19:49:29,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1621/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 2.913086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:29,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.43929 samples/s/p 5:18:46 } +2024-07-25 19:49:32,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1623/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.9128734e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:49:32,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.43396 samples/s/p 5:19:01 } +2024-07-25 19:49:35,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1625/ 1625], loss: 1.216, per_step_time: 1474ms, lr: 2.9126608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:35,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.42576 samples/s/p 5:19:27 } +2024-07-25 19:49:38,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 2/ 1625], loss: 1.136, per_step_time: 1475ms, lr: 2.9124476e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:38,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.42165 samples/s/p 5:19:39 } +2024-07-25 19:49:41,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 4/ 1625], loss: 1.202, per_step_time: 1472ms, lr: 2.9122342e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:41,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.43120 samples/s/p 5:19:02 } +2024-07-25 19:49:44,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 6/ 1625], loss: 1.088, per_step_time: 1473ms, lr: 2.9120209e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:44,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.42905 samples/s/p 5:19:07 } +2024-07-25 19:49:47,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 8/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 2.911807e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:47,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.43196 samples/s/p 5:18:54 } +2024-07-25 19:49:50,451 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 10/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 2.911593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:50,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43171 samples/s/p 5:18:52 } +2024-07-25 19:49:53,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 12/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.9113786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:53,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43350 samples/s/p 5:18:42 } +2024-07-25 19:49:56,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 14/ 1625], loss: 1.333, per_step_time: 1471ms, lr: 2.911164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:56,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43810 samples/s/p 5:18:23 } +2024-07-25 19:49:59,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 16/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 2.9109493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:59,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43002 samples/s/p 5:18:49 } +2024-07-25 19:50:02,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 18/ 1625], loss: 1.293, per_step_time: 1470ms, lr: 2.9107341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:02,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43955 samples/s/p 5:18:12 } +2024-07-25 19:50:05,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 20/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 2.910519e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:50:05,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43321 samples/s/p 5:18:32 } +2024-07-25 19:50:08,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 22/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.9103032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:08,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.42747 samples/s/p 5:18:49 } +2024-07-25 19:50:11,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 24/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 2.9100875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:11,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43414 samples/s/p 5:18:22 } +2024-07-25 19:50:14,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 26/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 2.9098714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:14,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43345 samples/s/p 5:18:22 } +2024-07-25 19:50:17,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 28/ 1625], loss: 1.206, per_step_time: 1470ms, lr: 2.9096549e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:17,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43974 samples/s/p 5:17:57 } +2024-07-25 19:50:19,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 30/ 1625], loss: 1.035, per_step_time: 1472ms, lr: 2.9094384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:19,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43279 samples/s/p 5:18:18 } +2024-07-25 19:50:22,925 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 32/ 1625], loss: 1.245, per_step_time: 1474ms, lr: 2.9092214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:22,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.42412 samples/s/p 5:18:46 } +2024-07-25 19:50:25,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 34/ 1625], loss: 1.247, per_step_time: 1474ms, lr: 2.9090043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:25,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.42564 samples/s/p 5:18:38 } +2024-07-25 19:50:28,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 36/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 2.9087872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:28,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43978 samples/s/p 5:17:45 } +2024-07-25 19:50:31,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 38/ 1625], loss: 1.103, per_step_time: 1471ms, lr: 2.9085697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:31,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43501 samples/s/p 5:17:59 } +2024-07-25 19:50:34,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 40/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.9083518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:34,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43208 samples/s/p 5:18:06 } +2024-07-25 19:50:37,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 42/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 2.9081337e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:50:37,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43412 samples/s/p 5:17:56 } +2024-07-25 19:50:40,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 44/ 1625], loss: 1.047, per_step_time: 1472ms, lr: 2.9079154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:40,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43320 samples/s/p 5:17:56 } +2024-07-25 19:50:43,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 46/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 2.9076968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:43,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.44057 samples/s/p 5:17:27 } +2024-07-25 19:50:46,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 48/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.9074781e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:46,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43144 samples/s/p 5:17:57 } +2024-07-25 19:50:49,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 50/ 1625], loss: 1.345, per_step_time: 1470ms, lr: 2.907259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:49,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.44163 samples/s/p 5:17:18 } +2024-07-25 19:50:52,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 52/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 2.9070396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:52,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43060 samples/s/p 5:17:54 } +2024-07-25 19:50:55,388 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 54/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 2.9068198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:55,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43602 samples/s/p 5:17:32 } +2024-07-25 19:50:58,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 56/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 2.9066001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:58,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43331 samples/s/p 5:17:38 } +2024-07-25 19:51:01,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 58/ 1625], loss: 1.227, per_step_time: 1474ms, lr: 2.9063798e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:01,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.42565 samples/s/p 5:18:02 } +2024-07-25 19:51:04,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 60/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 2.9061597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:04,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43310 samples/s/p 5:17:33 } +2024-07-25 19:51:07,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 62/ 1625], loss: 1.303, per_step_time: 1474ms, lr: 2.9059389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:07,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.42526 samples/s/p 5:17:58 } +2024-07-25 19:51:10,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 64/ 1625], loss: 1.251, per_step_time: 1473ms, lr: 2.9057182e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:51:10,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.42942 samples/s/p 5:17:40 } +2024-07-25 19:51:13,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 66/ 1625], loss: 1.296, per_step_time: 1473ms, lr: 2.905497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:13,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43104 samples/s/p 5:17:31 } +2024-07-25 19:51:16,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 68/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.9052757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:16,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43150 samples/s/p 5:17:27 } +2024-07-25 19:51:19,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 70/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.9050541e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:19,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43548 samples/s/p 5:17:10 } +2024-07-25 19:51:21,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 72/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 2.9048324e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:21,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43425 samples/s/p 5:17:11 } +2024-07-25 19:51:24,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 74/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 2.9046103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:24,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43142 samples/s/p 5:17:18 } +2024-07-25 19:51:27,875 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 76/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.9043878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:27,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43329 samples/s/p 5:17:09 } +2024-07-25 19:51:30,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 78/ 1625], loss: 1.312, per_step_time: 1471ms, lr: 2.9041654e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:30,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43560 samples/s/p 5:16:58 } +2024-07-25 19:51:33,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 80/ 1625], loss: 1.181, per_step_time: 1473ms, lr: 2.9039425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:33,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.42978 samples/s/p 5:17:15 } +2024-07-25 19:51:36,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 82/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 2.9037194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:36,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43154 samples/s/p 5:17:06 } +2024-07-25 19:51:39,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 84/ 1625], loss: 1.167, per_step_time: 1474ms, lr: 2.903496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:39,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.42611 samples/s/p 5:17:22 } +2024-07-25 19:51:42,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 86/ 1625], loss: 1.120, per_step_time: 1475ms, lr: 2.9032724e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:51:42,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.42241 samples/s/p 5:17:32 } +2024-07-25 19:51:45,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 88/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 2.9030487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:45,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43637 samples/s/p 5:16:40 } +2024-07-25 19:51:48,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 90/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.9028244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:48,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43293 samples/s/p 5:16:49 } +2024-07-25 19:51:51,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 92/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 2.9026001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:51,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43652 samples/s/p 5:16:34 } +2024-07-25 19:51:54,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 94/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 2.9023757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:54,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43408 samples/s/p 5:16:40 } +2024-07-25 19:51:57,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 96/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 2.9021508e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:57,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43559 samples/s/p 5:16:31 } +2024-07-25 19:52:00,352 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 98/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 2.9019258e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:00,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43744 samples/s/p 5:16:22 } +2024-07-25 19:52:03,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 100/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 2.9017005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:03,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.42918 samples/s/p 5:16:48 } +2024-07-25 19:52:06,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 102/ 1625], loss: 1.056, per_step_time: 1471ms, lr: 2.9014749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:06,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43710 samples/s/p 5:16:17 } +2024-07-25 19:52:09,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 104/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 2.9012492e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:09,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43348 samples/s/p 5:16:27 } +2024-07-25 19:52:12,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 106/ 1625], loss: 1.025, per_step_time: 1472ms, lr: 2.901023e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:12,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.43437 samples/s/p 5:16:21 } +2024-07-25 19:52:15,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 108/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.9007966e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:52:15,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.43509 samples/s/p 5:16:15 } +2024-07-25 19:52:18,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 110/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 2.90057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:18,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.43601 samples/s/p 5:16:09 } +2024-07-25 19:52:21,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 112/ 1625], loss: 1.142, per_step_time: 1473ms, lr: 2.900343e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:21,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.42841 samples/s/p 5:16:33 } +2024-07-25 19:52:23,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 114/ 1625], loss: 1.314, per_step_time: 1472ms, lr: 2.900116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:23,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.43168 samples/s/p 5:16:19 } +2024-07-25 19:52:26,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 116/ 1625], loss: 1.367, per_step_time: 1470ms, lr: 2.8998888e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:26,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.44086 samples/s/p 5:15:44 } +2024-07-25 19:52:29,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 118/ 1625], loss: 1.239, per_step_time: 1472ms, lr: 2.899661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:29,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.43431 samples/s/p 5:16:03 } +2024-07-25 19:52:32,824 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 120/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 2.8994333e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:32,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.42870 samples/s/p 5:16:20 } +2024-07-25 19:52:35,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 122/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 2.8992054e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:35,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43227 samples/s/p 5:16:05 } +2024-07-25 19:52:38,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 124/ 1625], loss: 1.321, per_step_time: 1471ms, lr: 2.898977e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:38,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43788 samples/s/p 5:15:42 } +2024-07-25 19:52:41,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 126/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.8987482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:41,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43375 samples/s/p 5:15:54 } +2024-07-25 19:52:44,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 128/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 2.8985194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:44,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43268 samples/s/p 5:15:54 } +2024-07-25 19:52:47,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 130/ 1625], loss: 1.372, per_step_time: 1473ms, lr: 2.8982906e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:52:47,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43053 samples/s/p 5:15:59 } +2024-07-25 19:52:50,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 132/ 1625], loss: 1.306, per_step_time: 1474ms, lr: 2.8980612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:50,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.42423 samples/s/p 5:16:18 } +2024-07-25 19:52:53,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 134/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 2.8978317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:53,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43094 samples/s/p 5:15:52 } +2024-07-25 19:52:56,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 136/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 2.8976017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:56,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.42966 samples/s/p 5:15:53 } +2024-07-25 19:52:59,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 138/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 2.8973716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:59,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43863 samples/s/p 5:15:19 } +2024-07-25 19:53:02,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 140/ 1625], loss: 1.080, per_step_time: 1473ms, lr: 2.8971413e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:02,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43058 samples/s/p 5:15:44 } +2024-07-25 19:53:05,305 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 142/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 2.8969109e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:05,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43288 samples/s/p 5:15:33 } +2024-07-25 19:53:08,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 144/ 1625], loss: 1.292, per_step_time: 1473ms, lr: 2.89668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:08,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.42959 samples/s/p 5:15:42 } +2024-07-25 19:53:11,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 146/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.8964489e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:11,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43515 samples/s/p 5:15:19 } +2024-07-25 19:53:14,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 148/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 2.8962177e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:14,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43358 samples/s/p 5:15:22 } +2024-07-25 19:53:17,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 150/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.8959861e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:17,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43194 samples/s/p 5:15:25 } +2024-07-25 19:53:20,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 152/ 1625], loss: 1.345, per_step_time: 1473ms, lr: 2.895754e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:53:20,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.42868 samples/s/p 5:15:33 } +2024-07-25 19:53:23,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 154/ 1625], loss: 1.245, per_step_time: 1475ms, lr: 2.895522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:23,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.42289 samples/s/p 5:15:50 } +2024-07-25 19:53:25,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 156/ 1625], loss: 1.165, per_step_time: 1470ms, lr: 2.8952898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:25,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.44039 samples/s/p 5:14:46 } +2024-07-25 19:53:28,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 158/ 1625], loss: 1.305, per_step_time: 1473ms, lr: 2.8950573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:28,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43086 samples/s/p 5:15:17 } +2024-07-25 19:53:31,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 160/ 1625], loss: 1.073, per_step_time: 1474ms, lr: 2.8948245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:31,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.42559 samples/s/p 5:15:32 } +2024-07-25 19:53:34,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 162/ 1625], loss: 1.076, per_step_time: 1470ms, lr: 2.8945915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:34,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.44077 samples/s/p 5:14:36 } +2024-07-25 19:53:37,786 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 164/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 2.8943581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:37,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43269 samples/s/p 5:15:01 } +2024-07-25 19:53:40,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 166/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 2.8941244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:40,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43667 samples/s/p 5:14:45 } +2024-07-25 19:53:43,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 168/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 2.8938906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:43,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43559 samples/s/p 5:14:45 } +2024-07-25 19:53:46,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 170/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 2.8936567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:46,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43185 samples/s/p 5:14:55 } +2024-07-25 19:53:49,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 172/ 1625], loss: 1.230, per_step_time: 1474ms, lr: 2.8934224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:49,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.42465 samples/s/p 5:15:18 } +2024-07-25 19:53:52,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 174/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 2.893188e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:53:52,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43571 samples/s/p 5:14:36 } +2024-07-25 19:53:55,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 176/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.8929531e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:55,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43406 samples/s/p 5:14:39 } +2024-07-25 19:53:58,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 178/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 2.8927181e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:58,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43359 samples/s/p 5:14:38 } +2024-07-25 19:54:01,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 180/ 1625], loss: 1.014, per_step_time: 1473ms, lr: 2.892483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:01,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.42928 samples/s/p 5:14:50 } +2024-07-25 19:54:04,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 182/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.8922472e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:04,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43009 samples/s/p 5:14:44 } +2024-07-25 19:54:07,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 184/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.8920114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:07,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43308 samples/s/p 5:14:31 } +2024-07-25 19:54:10,264 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 186/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 2.8917755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:10,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43434 samples/s/p 5:14:23 } +2024-07-25 19:54:13,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 188/ 1625], loss: 0.979, per_step_time: 1471ms, lr: 2.8915392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:13,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43770 samples/s/p 5:14:09 } +2024-07-25 19:54:16,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 190/ 1625], loss: 1.189, per_step_time: 1470ms, lr: 2.8913028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:16,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.44199 samples/s/p 5:13:51 } +2024-07-25 19:54:19,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 192/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 2.891066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:19,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43230 samples/s/p 5:14:21 } +2024-07-25 19:54:22,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 194/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 2.890829e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:22,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43623 samples/s/p 5:14:05 } +2024-07-25 19:54:25,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 196/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 2.8905917e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:54:25,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43934 samples/s/p 5:13:51 } +2024-07-25 19:54:27,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 198/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 2.8903542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:27,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43797 samples/s/p 5:13:53 } +2024-07-25 19:54:30,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 200/ 1625], loss: 0.977, per_step_time: 1471ms, lr: 2.8901162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:30,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43484 samples/s/p 5:14:01 } +2024-07-25 19:54:33,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 202/ 1625], loss: 0.911, per_step_time: 1472ms, lr: 2.8898783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:33,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43208 samples/s/p 5:14:08 } +2024-07-25 19:54:36,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 204/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.8896402e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.43158 samples/s/p 5:14:06 } +2024-07-25 19:54:39,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 206/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 2.8894017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:39,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.42886 samples/s/p 5:14:13 } +2024-07-25 19:54:42,723 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 208/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 2.8891629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:42,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.43866 samples/s/p 5:13:36 } +2024-07-25 19:54:45,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 210/ 1625], loss: 1.123, per_step_time: 1474ms, lr: 2.8889239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:45,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.42661 samples/s/p 5:14:15 } +2024-07-25 19:54:48,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 212/ 1625], loss: 1.042, per_step_time: 1471ms, lr: 2.8886847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:48,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.43610 samples/s/p 5:13:39 } +2024-07-25 19:54:51,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 214/ 1625], loss: 1.218, per_step_time: 1474ms, lr: 2.8884451e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:51,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.42587 samples/s/p 5:14:11 } +2024-07-25 19:54:54,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 216/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 2.8882056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:54,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.43781 samples/s/p 5:13:27 } +2024-07-25 19:54:57,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 218/ 1625], loss: 1.330, per_step_time: 1472ms, lr: 2.8879656e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:54:57,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.43340 samples/s/p 5:13:39 } +2024-07-25 19:55:00,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 220/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.8877253e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:00,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.43632 samples/s/p 5:13:26 } +2024-07-25 19:55:03,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 222/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.8874847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:03,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.43264 samples/s/p 5:13:36 } +2024-07-25 19:55:06,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 224/ 1625], loss: 1.312, per_step_time: 1473ms, lr: 2.8872442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:06,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.42776 samples/s/p 5:13:50 } +2024-07-25 19:55:09,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 226/ 1625], loss: 1.336, per_step_time: 1474ms, lr: 2.8870032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:09,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.42613 samples/s/p 5:13:53 } +2024-07-25 19:55:12,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 228/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 2.8867618e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:12,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.43366 samples/s/p 5:13:24 } +2024-07-25 19:55:15,206 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 230/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.8865205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:15,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.43242 samples/s/p 5:13:25 } +2024-07-25 19:55:18,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 232/ 1625], loss: 1.200, per_step_time: 1474ms, lr: 2.8862785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:18,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.42728 samples/s/p 5:13:40 } +2024-07-25 19:55:21,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 234/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 2.8860366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:21,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.42769 samples/s/p 5:13:36 } +2024-07-25 19:55:24,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 236/ 1625], loss: 1.114, per_step_time: 1475ms, lr: 2.8857945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:24,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.42370 samples/s/p 5:13:47 } +2024-07-25 19:55:27,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 238/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.8855518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:27,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43300 samples/s/p 5:13:11 } +2024-07-25 19:55:29,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 240/ 1625], loss: 1.296, per_step_time: 1472ms, lr: 2.8853092e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:55:29,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43317 samples/s/p 5:13:08 } +2024-07-25 19:55:32,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 242/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 2.8850664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:32,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43609 samples/s/p 5:12:55 } +2024-07-25 19:55:35,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 244/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 2.8848232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:35,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43481 samples/s/p 5:12:56 } +2024-07-25 19:55:38,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 246/ 1625], loss: 0.916, per_step_time: 1470ms, lr: 2.8845798e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:38,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43901 samples/s/p 5:12:39 } +2024-07-25 19:55:41,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 248/ 1625], loss: 1.535, per_step_time: 1470ms, lr: 2.884336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:41,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43913 samples/s/p 5:12:35 } +2024-07-25 19:55:44,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 250/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 2.884092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:44,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43355 samples/s/p 5:12:52 } +2024-07-25 19:55:47,680 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 252/ 1625], loss: 1.169, per_step_time: 1472ms, lr: 2.883848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:47,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43304 samples/s/p 5:12:51 } +2024-07-25 19:55:50,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 254/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 2.8836035e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:50,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43756 samples/s/p 5:12:32 } +2024-07-25 19:55:53,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 256/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 2.8833589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:53,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43762 samples/s/p 5:12:29 } +2024-07-25 19:55:56,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 258/ 1625], loss: 1.371, per_step_time: 1471ms, lr: 2.883114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:56,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43586 samples/s/p 5:12:32 } +2024-07-25 19:55:59,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 260/ 1625], loss: 1.411, per_step_time: 1474ms, lr: 2.8828688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:59,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.42662 samples/s/p 5:13:01 } +2024-07-25 19:56:02,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 262/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 2.8826234e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:56:02,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43257 samples/s/p 5:12:37 } +2024-07-25 19:56:05,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 264/ 1625], loss: 1.197, per_step_time: 1474ms, lr: 2.8823779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:05,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.42601 samples/s/p 5:12:57 } +2024-07-25 19:56:08,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 266/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.8821318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:08,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.42946 samples/s/p 5:12:42 } +2024-07-25 19:56:11,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 268/ 1625], loss: 1.161, per_step_time: 1470ms, lr: 2.8818857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:11,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43926 samples/s/p 5:12:06 } +2024-07-25 19:56:14,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 270/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 2.8816394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:14,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43793 samples/s/p 5:12:07 } +2024-07-25 19:56:17,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 272/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 2.8813927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:17,200 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43444 samples/s/p 5:12:16 } +2024-07-25 19:56:20,151 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 274/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.8811459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:20,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43448 samples/s/p 5:12:13 } +2024-07-25 19:56:23,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 276/ 1625], loss: 1.230, per_step_time: 1474ms, lr: 2.8808987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:23,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.42704 samples/s/p 5:12:36 } +2024-07-25 19:56:26,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 278/ 1625], loss: 1.214, per_step_time: 1474ms, lr: 2.8806513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:26,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.42672 samples/s/p 5:12:34 } +2024-07-25 19:56:29,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 280/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 2.8804037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:29,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43577 samples/s/p 5:12:00 } +2024-07-25 19:56:31,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 282/ 1625], loss: 1.205, per_step_time: 1473ms, lr: 2.8801558e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:31,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.42909 samples/s/p 5:12:20 } +2024-07-25 19:56:34,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 284/ 1625], loss: 1.280, per_step_time: 1471ms, lr: 2.8799077e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:56:34,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43700 samples/s/p 5:11:50 } +2024-07-25 19:56:37,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 286/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 2.8796594e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:37,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43746 samples/s/p 5:11:45 } +2024-07-25 19:56:40,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 288/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 2.8794107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:40,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43769 samples/s/p 5:11:42 } +2024-07-25 19:56:43,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 290/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 2.879162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:43,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43539 samples/s/p 5:11:47 } +2024-07-25 19:56:46,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 292/ 1625], loss: 0.990, per_step_time: 1471ms, lr: 2.8789127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:46,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43563 samples/s/p 5:11:43 } +2024-07-25 19:56:49,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 294/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 2.8786633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:49,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43545 samples/s/p 5:11:40 } +2024-07-25 19:56:52,619 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 296/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.8784138e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:52,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43597 samples/s/p 5:11:36 } +2024-07-25 19:56:55,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 298/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 2.8781642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:55,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43309 samples/s/p 5:11:43 } +2024-07-25 19:56:58,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 300/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 2.8779139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:58,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43900 samples/s/p 5:11:19 } +2024-07-25 19:57:01,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 302/ 1625], loss: 1.402, per_step_time: 1471ms, lr: 2.8776638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:01,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.43749 samples/s/p 5:11:22 } +2024-07-25 19:57:04,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 304/ 1625], loss: 1.081, per_step_time: 1474ms, lr: 2.8774133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:04,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.42736 samples/s/p 5:11:54 } +2024-07-25 19:57:07,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 306/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 2.8771623e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:57:07,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.43169 samples/s/p 5:11:36 } +2024-07-25 19:57:10,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 308/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.8769113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:10,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.43769 samples/s/p 5:11:12 } +2024-07-25 19:57:13,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 310/ 1625], loss: 1.234, per_step_time: 1473ms, lr: 2.87666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:13,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.42777 samples/s/p 5:11:43 } +2024-07-25 19:57:16,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 312/ 1625], loss: 1.311, per_step_time: 1472ms, lr: 2.8764085e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:16,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.43239 samples/s/p 5:11:24 } +2024-07-25 19:57:19,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 314/ 1625], loss: 1.183, per_step_time: 1474ms, lr: 2.8761566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:19,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.42432 samples/s/p 5:11:49 } +2024-07-25 19:57:22,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 316/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.8759046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:22,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.43363 samples/s/p 5:11:14 } +2024-07-25 19:57:25,096 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 318/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 2.8756524e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:25,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.43374 samples/s/p 5:11:11 } +2024-07-25 19:57:28,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 320/ 1625], loss: 1.310, per_step_time: 1471ms, lr: 2.8753999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:28,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.43578 samples/s/p 5:11:01 } +2024-07-25 19:57:30,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 322/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 2.875147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:31,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.43210 samples/s/p 5:11:11 } +2024-07-25 19:57:33,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 324/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.8748942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:33,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.43078 samples/s/p 5:11:12 } +2024-07-25 19:57:36,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 326/ 1625], loss: 1.234, per_step_time: 1470ms, lr: 2.8746406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:36,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.43925 samples/s/p 5:10:40 } +2024-07-25 19:57:39,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 328/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 2.8743872e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:57:39,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.43228 samples/s/p 5:11:01 } +2024-07-25 19:57:42,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 330/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 2.8741335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:42,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.43329 samples/s/p 5:10:55 } +2024-07-25 19:57:45,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 332/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 2.8738794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:45,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.43754 samples/s/p 5:10:37 } +2024-07-25 19:57:48,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 334/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.8736255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:48,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43372 samples/s/p 5:10:48 } +2024-07-25 19:57:51,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 336/ 1625], loss: 1.295, per_step_time: 1472ms, lr: 2.8733708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:51,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43183 samples/s/p 5:10:51 } +2024-07-25 19:57:54,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 338/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 2.8731161e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:54,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43316 samples/s/p 5:10:44 } +2024-07-25 19:57:57,566 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 340/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 2.8728611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:57,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43100 samples/s/p 5:10:48 } +2024-07-25 19:58:00,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 342/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.872606e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:00,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43737 samples/s/p 5:10:23 } +2024-07-25 19:58:03,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 344/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.8723503e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:03,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.42979 samples/s/p 5:10:46 } +2024-07-25 19:58:06,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 346/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 2.8720948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:06,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43111 samples/s/p 5:10:39 } +2024-07-25 19:58:09,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 348/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 2.871839e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:09,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43021 samples/s/p 5:10:39 } +2024-07-25 19:58:12,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 350/ 1625], loss: 1.091, per_step_time: 1470ms, lr: 2.8715825e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:58:12,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.44007 samples/s/p 5:10:02 } +2024-07-25 19:58:15,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 352/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.8713264e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:15,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43228 samples/s/p 5:10:26 } +2024-07-25 19:58:18,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 354/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 2.8710696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:18,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43706 samples/s/p 5:10:07 } +2024-07-25 19:58:21,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 356/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 2.8708128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:21,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43228 samples/s/p 5:10:20 } +2024-07-25 19:58:24,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 358/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 2.8705555e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:24,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43332 samples/s/p 5:10:14 } +2024-07-25 19:58:27,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 360/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 2.8702983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:27,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43808 samples/s/p 5:09:54 } +2024-07-25 19:58:30,030 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 362/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.8700404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:30,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43753 samples/s/p 5:09:53 } +2024-07-25 19:58:32,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 364/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 2.8697825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:32,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43989 samples/s/p 5:09:42 } +2024-07-25 19:58:35,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 366/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 2.8695245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:35,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43643 samples/s/p 5:09:51 } +2024-07-25 19:58:38,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 368/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.869266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:38,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43643 samples/s/p 5:09:48 } +2024-07-25 19:58:41,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 370/ 1625], loss: 1.045, per_step_time: 1473ms, lr: 2.8690074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:41,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.42904 samples/s/p 5:10:11 } +2024-07-25 19:58:44,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 372/ 1625], loss: 1.169, per_step_time: 1472ms, lr: 2.8687486e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:58:44,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43233 samples/s/p 5:09:56 } +2024-07-25 19:58:47,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 374/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.8684895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:47,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43818 samples/s/p 5:09:33 } +2024-07-25 19:58:50,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 376/ 1625], loss: 1.363, per_step_time: 1471ms, lr: 2.8682301e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:50,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43596 samples/s/p 5:09:38 } +2024-07-25 19:58:53,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 378/ 1625], loss: 1.099, per_step_time: 1475ms, lr: 2.8679706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:53,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.42091 samples/s/p 5:10:27 } +2024-07-25 19:58:56,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 380/ 1625], loss: 1.299, per_step_time: 1472ms, lr: 2.8677106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:56,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43216 samples/s/p 5:09:45 } +2024-07-25 19:58:59,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 382/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 2.8674505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:59,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43545 samples/s/p 5:09:31 } +2024-07-25 19:59:02,500 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 384/ 1625], loss: 1.025, per_step_time: 1473ms, lr: 2.8671904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:02,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43004 samples/s/p 5:09:46 } +2024-07-25 19:59:05,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 386/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.8669298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:05,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43371 samples/s/p 5:09:31 } +2024-07-25 19:59:08,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 388/ 1625], loss: 1.387, per_step_time: 1473ms, lr: 2.8666691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:08,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.42927 samples/s/p 5:09:43 } +2024-07-25 19:59:11,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 390/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.866408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:11,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43504 samples/s/p 5:09:21 } +2024-07-25 19:59:14,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 392/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 2.8661465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:14,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.44063 samples/s/p 5:08:59 } +2024-07-25 19:59:17,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 394/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.865885e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:59:17,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43256 samples/s/p 5:09:23 } +2024-07-25 19:59:20,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 396/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.8656234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:20,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43546 samples/s/p 5:09:10 } +2024-07-25 19:59:23,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 398/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 2.8653612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:23,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43417 samples/s/p 5:09:12 } +2024-07-25 19:59:26,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 400/ 1625], loss: 1.107, per_step_time: 1473ms, lr: 2.865099e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:26,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.42979 samples/s/p 5:09:24 } +2024-07-25 19:59:29,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 402/ 1625], loss: 0.941, per_step_time: 1470ms, lr: 2.8648365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:29,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.44006 samples/s/p 5:08:46 } +2024-07-25 19:59:32,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 404/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.8645738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:32,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43758 samples/s/p 5:08:51 } +2024-07-25 19:59:34,964 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 406/ 1625], loss: 0.998, per_step_time: 1472ms, lr: 2.8643106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:34,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43240 samples/s/p 5:09:06 } +2024-07-25 19:59:37,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 408/ 1625], loss: 1.095, per_step_time: 1473ms, lr: 2.8640474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:37,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.42745 samples/s/p 5:09:20 } +2024-07-25 19:59:40,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 410/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 2.863784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:40,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43523 samples/s/p 5:08:50 } +2024-07-25 19:59:43,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 412/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.8635202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:43,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43443 samples/s/p 5:08:50 } +2024-07-25 19:59:46,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 414/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.8632563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:46,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43123 samples/s/p 5:08:58 } +2024-07-25 19:59:49,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 416/ 1625], loss: 1.040, per_step_time: 1471ms, lr: 2.8629922e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:59:49,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43765 samples/s/p 5:08:33 } +2024-07-25 19:59:52,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 418/ 1625], loss: 1.035, per_step_time: 1472ms, lr: 2.8627277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:52,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43400 samples/s/p 5:08:43 } +2024-07-25 19:59:55,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 420/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 2.8624629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:55,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43799 samples/s/p 5:08:26 } +2024-07-25 19:59:58,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 422/ 1625], loss: 1.160, per_step_time: 1470ms, lr: 2.862198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:58,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.44019 samples/s/p 5:08:16 } +2024-07-25 20:00:01,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 424/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 2.8619328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:01,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.44058 samples/s/p 5:08:12 } +2024-07-25 20:00:04,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 426/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.8616674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:04,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43542 samples/s/p 5:08:26 } +2024-07-25 20:00:07,419 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 428/ 1625], loss: 1.231, per_step_time: 1470ms, lr: 2.8614015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:07,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.44012 samples/s/p 5:08:07 } +2024-07-25 20:00:10,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 430/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 2.8611357e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:10,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43395 samples/s/p 5:08:25 } +2024-07-25 20:00:13,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 432/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.8608694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:13,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43692 samples/s/p 5:08:12 } +2024-07-25 20:00:16,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 434/ 1625], loss: 1.255, per_step_time: 1469ms, lr: 2.8606033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:16,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.44228 samples/s/p 5:07:51 } +2024-07-25 20:00:19,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 436/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.8603366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:19,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43376 samples/s/p 5:08:17 } +2024-07-25 20:00:22,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 438/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 2.8600698e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:00:22,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43269 samples/s/p 5:08:18 } +2024-07-25 20:00:25,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 440/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 2.8598026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:25,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43816 samples/s/p 5:07:56 } +2024-07-25 20:00:28,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 442/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 2.8595354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:28,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43186 samples/s/p 5:08:15 } +2024-07-25 20:00:31,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 444/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 2.8592678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:31,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43290 samples/s/p 5:08:08 } +2024-07-25 20:00:33,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 446/ 1625], loss: 1.317, per_step_time: 1473ms, lr: 2.8589999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:33,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.42822 samples/s/p 5:08:21 } +2024-07-25 20:00:36,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 448/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.858732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:36,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.43358 samples/s/p 5:08:00 } +2024-07-25 20:00:39,883 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 450/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 2.8584634e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:39,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.43494 samples/s/p 5:07:53 } +2024-07-25 20:00:42,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 452/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 2.858195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:42,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.42924 samples/s/p 5:08:09 } +2024-07-25 20:00:45,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 454/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 2.8579261e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:45,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.44000 samples/s/p 5:07:29 } +2024-07-25 20:00:48,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 456/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 2.857657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:48,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.42871 samples/s/p 5:08:05 } +2024-07-25 20:00:51,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 458/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 2.8573877e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:51,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.43047 samples/s/p 5:07:56 } +2024-07-25 20:00:54,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 460/ 1625], loss: 1.174, per_step_time: 1473ms, lr: 2.8571181e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:00:54,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.42795 samples/s/p 5:08:02 } +2024-07-25 20:00:57,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 462/ 1625], loss: 1.415, per_step_time: 1471ms, lr: 2.8568486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:57,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.43488 samples/s/p 5:07:35 } +2024-07-25 20:01:00,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 464/ 1625], loss: 1.383, per_step_time: 1473ms, lr: 2.8565784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:00,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.43054 samples/s/p 5:07:47 } +2024-07-25 20:01:03,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 466/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 2.8563083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:03,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.44138 samples/s/p 5:07:07 } +2024-07-25 20:01:06,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 468/ 1625], loss: 1.058, per_step_time: 1471ms, lr: 2.8560375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:06,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.43743 samples/s/p 5:07:18 } +2024-07-25 20:01:09,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 470/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 2.8557668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:09,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.42868 samples/s/p 5:07:44 } +2024-07-25 20:01:12,357 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 472/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 2.855496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:12,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.43187 samples/s/p 5:07:31 } +2024-07-25 20:01:15,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 474/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 2.8552247e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:15,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.43819 samples/s/p 5:07:06 } +2024-07-25 20:01:18,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 476/ 1625], loss: 1.055, per_step_time: 1475ms, lr: 2.8549533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:18,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.42365 samples/s/p 5:07:53 } +2024-07-25 20:01:21,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 478/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.8546816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:21,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.43329 samples/s/p 5:07:17 } +2024-07-25 20:01:24,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 480/ 1625], loss: 0.999, per_step_time: 1471ms, lr: 2.8544096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:24,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43483 samples/s/p 5:07:09 } +2024-07-25 20:01:27,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 482/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.8541375e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:01:27,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43480 samples/s/p 5:07:06 } +2024-07-25 20:01:30,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 484/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 2.853865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:30,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43654 samples/s/p 5:06:57 } +2024-07-25 20:01:33,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 486/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.8535924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:33,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43546 samples/s/p 5:06:58 } +2024-07-25 20:01:35,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 488/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.8533195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:35,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43541 samples/s/p 5:06:55 } +2024-07-25 20:01:38,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 490/ 1625], loss: 1.221, per_step_time: 1473ms, lr: 2.8530465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:38,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43021 samples/s/p 5:07:10 } +2024-07-25 20:01:41,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 492/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 2.8527731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:41,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43322 samples/s/p 5:06:57 } +2024-07-25 20:01:44,824 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 494/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 2.8524992e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:44,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43633 samples/s/p 5:06:43 } +2024-07-25 20:01:47,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 496/ 1625], loss: 1.042, per_step_time: 1472ms, lr: 2.8522254e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:47,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43407 samples/s/p 5:06:48 } +2024-07-25 20:01:50,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 498/ 1625], loss: 1.339, per_step_time: 1471ms, lr: 2.8519513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:50,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43545 samples/s/p 5:06:40 } +2024-07-25 20:01:53,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 500/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 2.8516772e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:53,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43713 samples/s/p 5:06:32 } +2024-07-25 20:01:56,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 502/ 1625], loss: 1.412, per_step_time: 1474ms, lr: 2.8514025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:56,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.42570 samples/s/p 5:07:07 } +2024-07-25 20:01:59,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 504/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 2.8511276e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:01:59,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43552 samples/s/p 5:06:31 } +2024-07-25 20:02:02,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 506/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 2.8508526e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:02,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43184 samples/s/p 5:06:41 } +2024-07-25 20:02:05,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 508/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.8505772e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:05,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.44076 samples/s/p 5:06:08 } +2024-07-25 20:02:08,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 510/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.8503016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:08,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43228 samples/s/p 5:06:33 } +2024-07-25 20:02:11,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 512/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 2.8500259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:11,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43616 samples/s/p 5:06:17 } +2024-07-25 20:02:14,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 514/ 1625], loss: 1.138, per_step_time: 1473ms, lr: 2.8497498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:14,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.42844 samples/s/p 5:06:40 } +2024-07-25 20:02:17,289 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 516/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 2.8494736e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:17,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43668 samples/s/p 5:06:10 } +2024-07-25 20:02:20,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 518/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 2.849197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:20,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43339 samples/s/p 5:06:18 } +2024-07-25 20:02:23,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 520/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 2.8489203e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:23,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43713 samples/s/p 5:06:02 } +2024-07-25 20:02:26,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 522/ 1625], loss: 1.090, per_step_time: 1473ms, lr: 2.8486435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:26,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43065 samples/s/p 5:06:21 } +2024-07-25 20:02:29,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 524/ 1625], loss: 1.129, per_step_time: 1470ms, lr: 2.848366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:29,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43970 samples/s/p 5:05:48 } +2024-07-25 20:02:32,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 526/ 1625], loss: 1.340, per_step_time: 1471ms, lr: 2.8480888e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:02:32,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43576 samples/s/p 5:05:58 } +2024-07-25 20:02:34,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 528/ 1625], loss: 1.487, per_step_time: 1470ms, lr: 2.8478109e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:34,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43955 samples/s/p 5:05:42 } +2024-07-25 20:02:37,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 530/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 2.8475331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:37,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43123 samples/s/p 5:06:07 } +2024-07-25 20:02:40,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 532/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 2.8472548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:40,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43973 samples/s/p 5:05:36 } +2024-07-25 20:02:43,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 534/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.8469765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:43,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43349 samples/s/p 5:05:54 } +2024-07-25 20:02:46,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 536/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 2.8466979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:46,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43677 samples/s/p 5:05:40 } +2024-07-25 20:02:49,745 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 538/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 2.846419e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:49,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43750 samples/s/p 5:05:34 } +2024-07-25 20:02:52,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 540/ 1625], loss: 1.051, per_step_time: 1470ms, lr: 2.84614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:52,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43930 samples/s/p 5:05:25 } +2024-07-25 20:02:55,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 542/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.8458602e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:55,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43791 samples/s/p 5:05:27 } +2024-07-25 20:02:58,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 544/ 1625], loss: 1.299, per_step_time: 1471ms, lr: 2.845581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:58,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43706 samples/s/p 5:05:27 } +2024-07-25 20:03:01,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 546/ 1625], loss: 1.136, per_step_time: 1473ms, lr: 2.8453009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:01,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.42872 samples/s/p 5:05:52 } +2024-07-25 20:03:04,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 548/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 2.845021e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 20:03:04,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43997 samples/s/p 5:05:11 } +2024-07-25 20:03:07,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 550/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 2.8447404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:07,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43543 samples/s/p 5:05:24 } +2024-07-25 20:03:10,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 552/ 1625], loss: 1.030, per_step_time: 1472ms, lr: 2.8444598e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:10,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43241 samples/s/p 5:05:31 } +2024-07-25 20:03:13,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 554/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 2.8441791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:13,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43584 samples/s/p 5:05:16 } +2024-07-25 20:03:16,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 556/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 2.843898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:16,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43856 samples/s/p 5:05:04 } +2024-07-25 20:03:19,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 558/ 1625], loss: 1.013, per_step_time: 1469ms, lr: 2.8436167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:19,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.44320 samples/s/p 5:04:46 } +2024-07-25 20:03:22,199 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 560/ 1625], loss: 1.144, per_step_time: 1473ms, lr: 2.8433353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:22,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.42998 samples/s/p 5:05:27 } +2024-07-25 20:03:25,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 562/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 2.8430537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:25,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43133 samples/s/p 5:05:20 } +2024-07-25 20:03:28,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 564/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.8427714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:28,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43841 samples/s/p 5:04:53 } +2024-07-25 20:03:31,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 566/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 2.8424893e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:31,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43891 samples/s/p 5:04:48 } +2024-07-25 20:03:34,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 568/ 1625], loss: 1.203, per_step_time: 1476ms, lr: 2.8422068e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:34,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.41743 samples/s/p 5:05:58 } +2024-07-25 20:03:36,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 570/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 2.8419241e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:03:36,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43709 samples/s/p 5:04:49 } +2024-07-25 20:03:39,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 572/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 2.841641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:39,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43801 samples/s/p 5:04:43 } +2024-07-25 20:03:42,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 574/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 2.8413579e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:42,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43323 samples/s/p 5:04:56 } +2024-07-25 20:03:45,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 576/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 2.8410743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:45,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43566 samples/s/p 5:04:45 } +2024-07-25 20:03:48,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 578/ 1625], loss: 1.349, per_step_time: 1472ms, lr: 2.8407909e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:48,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43430 samples/s/p 5:04:46 } +2024-07-25 20:03:51,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 580/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.8405067e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:51,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43483 samples/s/p 5:04:42 } +2024-07-25 20:03:54,665 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 582/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 2.8402226e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:54,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43297 samples/s/p 5:04:45 } +2024-07-25 20:03:57,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 584/ 1625], loss: 1.113, per_step_time: 1474ms, lr: 2.8399383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:57,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.42475 samples/s/p 5:05:10 } +2024-07-25 20:04:00,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 586/ 1625], loss: 1.062, per_step_time: 1473ms, lr: 2.8396536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:00,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43023 samples/s/p 5:04:48 } +2024-07-25 20:04:03,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 588/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 2.8393688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:03,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43655 samples/s/p 5:04:24 } +2024-07-25 20:04:06,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 590/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 2.8390838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:06,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.44164 samples/s/p 5:04:04 } +2024-07-25 20:04:09,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 592/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 2.8387982e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:04:09,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43759 samples/s/p 5:04:15 } +2024-07-25 20:04:12,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 594/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 2.8385126e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:12,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43839 samples/s/p 5:04:09 } +2024-07-25 20:04:15,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 596/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 2.8382266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:15,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43508 samples/s/p 5:04:17 } +2024-07-25 20:04:18,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 598/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 2.8379409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:18,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43139 samples/s/p 5:04:27 } +2024-07-25 20:04:21,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 600/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 2.8376546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:21,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43486 samples/s/p 5:04:12 } +2024-07-25 20:04:24,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 602/ 1625], loss: 1.389, per_step_time: 1471ms, lr: 2.8373679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:24,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43588 samples/s/p 5:04:06 } +2024-07-25 20:04:27,126 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 604/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 2.8370812e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:27,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43853 samples/s/p 5:03:54 } +2024-07-25 20:04:30,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 606/ 1625], loss: 1.035, per_step_time: 1470ms, lr: 2.8367942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:30,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.44137 samples/s/p 5:03:41 } +2024-07-25 20:04:33,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 608/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 2.836507e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:33,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43663 samples/s/p 5:03:54 } +2024-07-25 20:04:35,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 610/ 1625], loss: 1.061, per_step_time: 1470ms, lr: 2.8362196e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:35,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.44114 samples/s/p 5:03:36 } +2024-07-25 20:04:38,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 612/ 1625], loss: 1.135, per_step_time: 1474ms, lr: 2.835932e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:38,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.42492 samples/s/p 5:04:28 } +2024-07-25 20:04:41,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 614/ 1625], loss: 1.297, per_step_time: 1474ms, lr: 2.8356437e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:04:41,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.42678 samples/s/p 5:04:19 } +2024-07-25 20:04:44,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 616/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 2.8353556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:44,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43454 samples/s/p 5:03:50 } +2024-07-25 20:04:47,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 618/ 1625], loss: 1.267, per_step_time: 1470ms, lr: 2.8350672e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:47,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43853 samples/s/p 5:03:33 } +2024-07-25 20:04:50,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 620/ 1625], loss: 1.351, per_step_time: 1471ms, lr: 2.8347786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:50,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43699 samples/s/p 5:03:35 } +2024-07-25 20:04:53,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 622/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.8344895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:53,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43775 samples/s/p 5:03:30 } +2024-07-25 20:04:56,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 624/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 2.8342007e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:56,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43966 samples/s/p 5:03:21 } +2024-07-25 20:04:59,583 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 626/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 2.8339113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:59,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.43047 samples/s/p 5:03:48 } +2024-07-25 20:05:02,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 628/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 2.8336215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:02,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.43282 samples/s/p 5:03:38 } +2024-07-25 20:05:05,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 630/ 1625], loss: 1.062, per_step_time: 1473ms, lr: 2.8333317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:05,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.42922 samples/s/p 5:03:47 } +2024-07-25 20:05:08,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 632/ 1625], loss: 1.066, per_step_time: 1473ms, lr: 2.8330414e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:08,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.42805 samples/s/p 5:03:48 } +2024-07-25 20:05:11,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 634/ 1625], loss: 1.235, per_step_time: 1473ms, lr: 2.8327513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:11,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.42925 samples/s/p 5:03:41 } +2024-07-25 20:05:14,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 636/ 1625], loss: 1.156, per_step_time: 1473ms, lr: 2.8324606e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:05:14,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.42927 samples/s/p 5:03:38 } +2024-07-25 20:05:17,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 638/ 1625], loss: 0.975, per_step_time: 1471ms, lr: 2.83217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:17,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.43591 samples/s/p 5:03:13 } +2024-07-25 20:05:20,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 640/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 2.831879e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:20,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.43467 samples/s/p 5:03:14 } +2024-07-25 20:05:23,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 642/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 2.8315875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:23,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.43809 samples/s/p 5:02:59 } +2024-07-25 20:05:26,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 644/ 1625], loss: 1.260, per_step_time: 1473ms, lr: 2.831296e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:26,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.42825 samples/s/p 5:03:29 } +2024-07-25 20:05:29,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 646/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 2.8310042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:29,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.43752 samples/s/p 5:02:55 } +2024-07-25 20:05:32,063 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 648/ 1625], loss: 1.377, per_step_time: 1474ms, lr: 2.8307122e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:32,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.42661 samples/s/p 5:03:29 } +2024-07-25 20:05:35,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 650/ 1625], loss: 1.391, per_step_time: 1470ms, lr: 2.8304199e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:35,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.44184 samples/s/p 5:02:35 } +2024-07-25 20:05:37,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 652/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 2.8301274e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:37,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.43741 samples/s/p 5:02:47 } +2024-07-25 20:05:40,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 654/ 1625], loss: 1.057, per_step_time: 1473ms, lr: 2.8298351e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:40,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.42843 samples/s/p 5:03:14 } +2024-07-25 20:05:43,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 656/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 2.829542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:43,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.43759 samples/s/p 5:02:40 } +2024-07-25 20:05:46,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 658/ 1625], loss: 1.197, per_step_time: 1470ms, lr: 2.829249e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:05:46,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.44068 samples/s/p 5:02:27 } +2024-07-25 20:05:49,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 660/ 1625], loss: 1.343, per_step_time: 1471ms, lr: 2.8289556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:49,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43627 samples/s/p 5:02:39 } +2024-07-25 20:05:52,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 662/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 2.828662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:52,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43577 samples/s/p 5:02:38 } +2024-07-25 20:05:55,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 664/ 1625], loss: 1.308, per_step_time: 1472ms, lr: 2.8283679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:55,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43175 samples/s/p 5:02:48 } +2024-07-25 20:05:58,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 666/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 2.8280738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:58,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43006 samples/s/p 5:02:51 } +2024-07-25 20:06:01,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 668/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 2.8277795e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:01,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43362 samples/s/p 5:02:36 } +2024-07-25 
20:06:04,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 670/ 1625], loss: 1.256, per_step_time: 1470ms, lr: 2.827485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:04,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43921 samples/s/p 5:02:14 } +2024-07-25 20:06:07,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 672/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 2.8271901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:07,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43708 samples/s/p 5:02:19 } +2024-07-25 20:06:10,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 674/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 2.826895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:10,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43497 samples/s/p 5:02:23 } +2024-07-25 20:06:13,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 676/ 1625], loss: 1.134, per_step_time: 1470ms, lr: 2.8265997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:13,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.44057 samples/s/p 5:02:01 } +2024-07-25 20:06:16,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 678/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 2.826304e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:16,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43208 samples/s/p 5:02:27 } +2024-07-25 20:06:19,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 680/ 1625], loss: 1.368, per_step_time: 1473ms, lr: 2.8260083e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:06:19,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.42876 samples/s/p 5:02:35 } +2024-07-25 20:06:22,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 682/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 2.8257125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:22,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43435 samples/s/p 5:02:13 } +2024-07-25 20:06:25,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 684/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 2.8254162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:25,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43518 samples/s/p 5:02:07 } +2024-07-25 20:06:28,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 686/ 1625], loss: 0.980, per_step_time: 1470ms, lr: 2.8251197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:28,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.44199 samples/s/p 5:01:42 } +2024-07-25 20:06:31,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 688/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 2.8248229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:31,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43162 samples/s/p 5:02:13 } +2024-07-25 20:06:34,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 690/ 1625], loss: 1.326, per_step_time: 1473ms, lr: 2.824526e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:34,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.42923 samples/s/p 5:02:18 } 
+2024-07-25 20:06:36,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 692/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.8242288e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:36,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43311 samples/s/p 5:02:02 } +2024-07-25 20:06:39,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 694/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.8239314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:39,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43137 samples/s/p 5:02:05 } +2024-07-25 20:06:42,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 696/ 1625], loss: 1.245, per_step_time: 1471ms, lr: 2.8236338e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:42,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43587 samples/s/p 5:01:47 } +2024-07-25 20:06:45,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 698/ 1625], loss: 1.226, per_step_time: 1473ms, lr: 2.823336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:45,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43054 samples/s/p 5:02:02 } +2024-07-25 20:06:48,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 700/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 2.8230377e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:48,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43376 samples/s/p 5:01:49 } +2024-07-25 20:06:51,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 702/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 
2.8227394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:51,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43296 samples/s/p 5:01:48 } +2024-07-25 20:06:54,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 704/ 1625], loss: 1.274, per_step_time: 1473ms, lr: 2.8224411e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:54,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.42976 samples/s/p 5:01:56 } +2024-07-25 20:06:57,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 706/ 1625], loss: 1.317, per_step_time: 1471ms, lr: 2.822142e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:57,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43654 samples/s/p 5:01:30 } +2024-07-25 20:07:00,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 708/ 1625], loss: 1.182, per_step_time: 1474ms, lr: 2.8218434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:00,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.42512 samples/s/p 5:02:06 } +2024-07-25 20:07:03,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 710/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 2.821544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:03,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43027 samples/s/p 5:01:45 } +2024-07-25 20:07:06,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 712/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.8212444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:06,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43485 
samples/s/p 5:01:27 } +2024-07-25 20:07:09,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 714/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.8209444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:09,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43582 samples/s/p 5:01:21 } +2024-07-25 20:07:12,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 716/ 1625], loss: 1.227, per_step_time: 1470ms, lr: 2.8206448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:12,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43972 samples/s/p 5:01:05 } +2024-07-25 20:07:15,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 718/ 1625], loss: 1.190, per_step_time: 1474ms, lr: 2.8203443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:15,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.42642 samples/s/p 5:01:46 } +2024-07-25 20:07:18,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 720/ 1625], loss: 1.027, per_step_time: 1473ms, lr: 2.8200438e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:18,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43063 samples/s/p 5:01:29 } +2024-07-25 20:07:21,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 722/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 2.8197432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:21,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43810 samples/s/p 5:01:02 } +2024-07-25 20:07:24,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 724/ 1625], loss: 1.173, per_step_time: 
1470ms, lr: 2.8194423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:24,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43943 samples/s/p 5:00:54 } +2024-07-25 20:07:27,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 726/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.819141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:27,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43561 samples/s/p 5:01:04 } +2024-07-25 20:07:30,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 728/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 2.8188399e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:30,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43018 samples/s/p 5:01:19 } +2024-07-25 20:07:33,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 730/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 2.818538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:33,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43083 samples/s/p 5:01:14 } +2024-07-25 20:07:36,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 732/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.8182361e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:36,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43597 samples/s/p 5:00:54 } +2024-07-25 20:07:38,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 734/ 1625], loss: 1.320, per_step_time: 1472ms, lr: 2.817934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:38,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 
5.43289 samples/s/p 5:01:01 } +2024-07-25 20:07:41,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 736/ 1625], loss: 1.435, per_step_time: 1471ms, lr: 2.8176317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:41,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43554 samples/s/p 5:00:50 } +2024-07-25 20:07:44,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 738/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 2.817329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:44,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43357 samples/s/p 5:00:53 } +2024-07-25 20:07:47,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 740/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 2.8170265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:47,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43841 samples/s/p 5:00:34 } +2024-07-25 20:07:50,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 742/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 2.8167233e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:50,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43650 samples/s/p 5:00:38 } +2024-07-25 20:07:53,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 744/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.8164202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:53,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43498 samples/s/p 5:00:40 } +2024-07-25 20:07:56,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 746/ 1625], loss: 1.239, 
per_step_time: 1471ms, lr: 2.8161166e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:56,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43686 samples/s/p 5:00:31 } +2024-07-25 20:07:59,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 748/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 2.8158129e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:59,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43188 samples/s/p 5:00:44 } +2024-07-25 20:08:02,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 750/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 2.815509e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:02,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43872 samples/s/p 5:00:18 } +2024-07-25 20:08:05,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 752/ 1625], loss: 1.284, per_step_time: 1473ms, lr: 2.8152048e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:05,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.42961 samples/s/p 5:00:46 } +2024-07-25 20:08:08,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 754/ 1625], loss: 1.219, per_step_time: 1470ms, lr: 2.8149003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:08,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43886 samples/s/p 5:00:12 } +2024-07-25 20:08:11,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 756/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.8145956e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:11,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% 
|████████████ | 5.43510 samples/s/p 5:00:22 } +2024-07-25 20:08:14,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 758/ 1625], loss: 1.360, per_step_time: 1471ms, lr: 2.8142907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:14,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43728 samples/s/p 5:00:11 } +2024-07-25 20:08:17,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 760/ 1625], loss: 1.331, per_step_time: 1473ms, lr: 2.8139855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:17,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43008 samples/s/p 5:00:32 } +2024-07-25 20:08:20,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 762/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.8136801e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:20,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43770 samples/s/p 5:00:04 } +2024-07-25 20:08:23,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 764/ 1625], loss: 1.074, per_step_time: 1473ms, lr: 2.8133745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:23,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43042 samples/s/p 5:00:25 } +2024-07-25 20:08:26,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 766/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.8130687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:26,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43813 samples/s/p 4:59:57 } +2024-07-25 20:08:29,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 768/ 1625], loss: 
1.185, per_step_time: 1472ms, lr: 2.8127626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:29,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43220 samples/s/p 5:00:14 } +2024-07-25 20:08:32,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 770/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.8124563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:32,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43217 samples/s/p 5:00:11 } +2024-07-25 20:08:35,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 772/ 1625], loss: 1.004, per_step_time: 1470ms, lr: 2.8121498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:35,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43920 samples/s/p 4:59:44 } +2024-07-25 20:08:37,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 774/ 1625], loss: 1.152, per_step_time: 1469ms, lr: 2.8118431e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:37,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.44256 samples/s/p 4:59:30 } +2024-07-25 20:08:40,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 776/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 2.811536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:40,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43920 samples/s/p 4:59:39 } +2024-07-25 20:08:43,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 778/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 2.8112287e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:43,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
24.8% |████████████ | 5.43963 samples/s/p 4:59:34 } +2024-07-25 20:08:46,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 780/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 2.8109214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:46,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43955 samples/s/p 4:59:32 } +2024-07-25 20:08:49,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 782/ 1625], loss: 1.063, per_step_time: 1473ms, lr: 2.8106135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:49,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.42974 samples/s/p 5:00:01 } +2024-07-25 20:08:52,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 784/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 2.8103057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:52,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43233 samples/s/p 4:59:50 } +2024-07-25 20:08:55,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 786/ 1625], loss: 1.206, per_step_time: 1469ms, lr: 2.8099974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:55,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.44562 samples/s/p 4:59:03 } +2024-07-25 20:08:58,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 788/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 2.8096889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:58,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43421 samples/s/p 4:59:37 } +2024-07-25 20:09:01,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 790/ 1625], 
loss: 1.223, per_step_time: 1470ms, lr: 2.8093804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:01,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43934 samples/s/p 4:59:18 } +2024-07-25 20:09:04,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 792/ 1625], loss: 1.290, per_step_time: 1471ms, lr: 2.8090715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:04,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43560 samples/s/p 4:59:27 } +2024-07-25 20:09:07,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 794/ 1625], loss: 1.017, per_step_time: 1470ms, lr: 2.8087625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:07,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43924 samples/s/p 4:59:12 } +2024-07-25 20:09:10,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 796/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.8084534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:10,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43303 samples/s/p 4:59:30 } +2024-07-25 20:09:13,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 798/ 1625], loss: 1.312, per_step_time: 1473ms, lr: 2.8081437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:13,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.42995 samples/s/p 4:59:37 } +2024-07-25 20:09:16,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 800/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 2.8078339e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:16,337 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 24.9% |████████████ | 5.43954 samples/s/p 4:59:02 } +2024-07-25 20:09:19,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 802/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 2.8075237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:19,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43127 samples/s/p 4:59:27 } +2024-07-25 20:09:22,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 804/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 2.8072136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:22,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43075 samples/s/p 4:59:25 } +2024-07-25 20:09:25,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 806/ 1625], loss: 1.049, per_step_time: 1472ms, lr: 2.8069033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:25,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43364 samples/s/p 4:59:13 } +2024-07-25 20:09:28,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 808/ 1625], loss: 1.130, per_step_time: 1469ms, lr: 2.8065924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:28,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.44277 samples/s/p 4:58:40 } +2024-07-25 20:09:31,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 810/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 2.8062814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:31,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43223 samples/s/p 4:59:12 } +2024-07-25 20:09:34,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 812/ 
1625], loss: 1.173, per_step_time: 1471ms, lr: 2.8059701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:34,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43844 samples/s/p 4:58:48 } +2024-07-25 20:09:36,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 814/ 1625], loss: 1.341, per_step_time: 1471ms, lr: 2.8056587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:36,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43622 samples/s/p 4:58:53 } +2024-07-25 20:09:39,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 816/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 2.8053471e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:39,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43806 samples/s/p 4:58:44 } +2024-07-25 20:09:42,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 818/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 2.8050354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:42,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43049 samples/s/p 4:59:06 } +2024-07-25 20:09:45,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 820/ 1625], loss: 1.054, per_step_time: 1470ms, lr: 2.8047232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:45,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.44101 samples/s/p 4:58:28 } +2024-07-25 20:09:48,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 822/ 1625], loss: 1.267, per_step_time: 1474ms, lr: 2.8044109e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:48,798 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.42701 samples/s/p 4:59:11 } +2024-07-25 20:09:51,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 824/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 2.8040982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:51,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43371 samples/s/p 4:58:46 } +2024-07-25 20:09:54,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 826/ 1625], loss: 1.193, per_step_time: 1471ms, lr: 2.8037857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:54,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43521 samples/s/p 4:58:38 } +2024-07-25 20:09:57,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 828/ 1625], loss: 1.145, per_step_time: 1470ms, lr: 2.8034725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:57,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43975 samples/s/p 4:58:20 } +2024-07-25 20:10:00,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 830/ 1625], loss: 1.069, per_step_time: 1473ms, lr: 2.8031593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:00,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.42811 samples/s/p 4:58:56 } +2024-07-25 20:10:03,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 832/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 2.8028457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:03,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43772 samples/s/p 4:58:21 } +2024-07-25 20:10:06,500 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 834/ 1625], loss: 1.221, per_step_time: 1470ms, lr: 2.802532e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:06,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43971 samples/s/p 4:58:12 } +2024-07-25 20:10:09,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 836/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.8022181e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:09,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43343 samples/s/p 4:58:29 } +2024-07-25 20:10:12,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 838/ 1625], loss: 1.223, per_step_time: 1474ms, lr: 2.8019038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:12,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.42686 samples/s/p 4:58:48 } +2024-07-25 20:10:15,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 840/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.8015895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:15,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.43765 samples/s/p 4:58:10 } +2024-07-25 20:10:18,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 842/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 2.8012748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:18,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.43536 samples/s/p 4:58:14 } +2024-07-25 20:10:21,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 844/ 1625], loss: 1.199, per_step_time: 1469ms, lr: 2.80096e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:10:21,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.44299 samples/s/p 4:57:46 } +2024-07-25 20:10:24,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 846/ 1625], loss: 1.312, per_step_time: 1472ms, lr: 2.8006447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:24,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.43181 samples/s/p 4:58:20 } +2024-07-25 20:10:27,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 848/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 2.8003293e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:27,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.43518 samples/s/p 4:58:06 } +2024-07-25 20:10:30,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 850/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.8000139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:30,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.43227 samples/s/p 4:58:13 } +2024-07-25 20:10:33,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 852/ 1625], loss: 1.193, per_step_time: 1469ms, lr: 2.799698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:33,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.44326 samples/s/p 4:57:34 } +2024-07-25 20:10:36,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 854/ 1625], loss: 1.300, per_step_time: 1470ms, lr: 2.7993821e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:36,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43986 samples/s/p 4:57:42 } +2024-07-25 
20:10:38,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 856/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 2.7990658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:38,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43417 samples/s/p 4:57:57 } +2024-07-25 20:10:41,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 858/ 1625], loss: 1.109, per_step_time: 1471ms, lr: 2.7987491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:41,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43498 samples/s/p 4:57:52 } +2024-07-25 20:10:44,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 860/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.7984324e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:44,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43265 samples/s/p 4:57:57 } +2024-07-25 20:10:47,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 862/ 1625], loss: 1.279, per_step_time: 1469ms, lr: 2.7981154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:47,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.44244 samples/s/p 4:57:21 } +2024-07-25 20:10:50,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 864/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 2.7977982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:50,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43280 samples/s/p 4:57:50 } +2024-07-25 20:10:53,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 866/ 1625], loss: 0.923, per_step_time: 1470ms, lr: 2.7974807e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:10:53,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.44037 samples/s/p 4:57:22 } +2024-07-25 20:10:56,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 868/ 1625], loss: 1.200, per_step_time: 1474ms, lr: 2.7971631e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:56,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.42735 samples/s/p 4:58:02 } +2024-07-25 20:10:59,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 870/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 2.7968452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:59,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43162 samples/s/p 4:57:45 } +2024-07-25 20:11:02,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 872/ 1625], loss: 1.453, per_step_time: 1471ms, lr: 2.7965272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:02,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43483 samples/s/p 4:57:32 } +2024-07-25 20:11:05,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 874/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.7962087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:05,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43244 samples/s/p 4:57:37 } +2024-07-25 20:11:08,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 876/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.7958902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:08,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43353 samples/s/p 4:57:30 } 
+2024-07-25 20:11:11,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 878/ 1625], loss: 1.262, per_step_time: 1472ms, lr: 2.7955713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:11,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43158 samples/s/p 4:57:34 } +2024-07-25 20:11:14,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 880/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 2.7952523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:14,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43550 samples/s/p 4:57:18 } +2024-07-25 20:11:17,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 882/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 2.794933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:17,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43665 samples/s/p 4:57:11 } +2024-07-25 20:11:20,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 884/ 1625], loss: 1.304, per_step_time: 1476ms, lr: 2.7946136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:20,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.41717 samples/s/p 4:58:12 } +2024-07-25 20:11:23,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 886/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.7942939e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:23,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43791 samples/s/p 4:57:01 } +2024-07-25 20:11:26,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 888/ 1625], loss: 1.280, per_step_time: 1473ms, lr: 
2.7939739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:26,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.42922 samples/s/p 4:57:27 } +2024-07-25 20:11:29,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 890/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.7936538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:29,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43431 samples/s/p 4:57:07 } +2024-07-25 20:11:32,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 892/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.7933336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:32,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43339 samples/s/p 4:57:07 } +2024-07-25 20:11:35,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 894/ 1625], loss: 1.138, per_step_time: 1469ms, lr: 2.7930128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:35,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.44248 samples/s/p 4:56:34 } +2024-07-25 20:11:37,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 896/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.7926919e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:37,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43229 samples/s/p 4:57:05 } +2024-07-25 20:11:40,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 898/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 2.7923708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:40,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43177 
samples/s/p 4:57:04 } +2024-07-25 20:11:43,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 900/ 1625], loss: 1.450, per_step_time: 1472ms, lr: 2.7920494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:43,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43410 samples/s/p 4:56:53 } +2024-07-25 20:11:46,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 902/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.7917278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:46,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43673 samples/s/p 4:56:41 } +2024-07-25 20:11:49,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 904/ 1625], loss: 1.411, per_step_time: 1472ms, lr: 2.791406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:49,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43321 samples/s/p 4:56:50 } +2024-07-25 20:11:52,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 906/ 1625], loss: 1.151, per_step_time: 1470ms, lr: 2.791084e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:52,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43918 samples/s/p 4:56:27 } +2024-07-25 20:11:55,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 908/ 1625], loss: 1.329, per_step_time: 1471ms, lr: 2.7907618e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:55,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43803 samples/s/p 4:56:28 } +2024-07-25 20:11:58,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 910/ 1625], loss: 1.191, per_step_time: 
1470ms, lr: 2.7904392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:58,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43894 samples/s/p 4:56:22 } +2024-07-25 20:12:01,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 912/ 1625], loss: 1.255, per_step_time: 1473ms, lr: 2.7901167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:01,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.42868 samples/s/p 4:56:53 } +2024-07-25 20:12:04,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 914/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.7897937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:04,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43714 samples/s/p 4:56:22 } +2024-07-25 20:12:07,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 916/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.7894706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:07,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43160 samples/s/p 4:56:38 } +2024-07-25 20:12:10,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 918/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 2.7891474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:10,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43257 samples/s/p 4:56:31 } +2024-07-25 20:12:13,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 920/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 2.7888234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:13,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 
5.43865 samples/s/p 4:56:09 } +2024-07-25 20:12:16,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 922/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 2.7884998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:16,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43214 samples/s/p 4:56:27 } +2024-07-25 20:12:19,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 924/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 2.7881757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:19,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43790 samples/s/p 4:56:05 } +2024-07-25 20:12:22,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 926/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.7878514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:22,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43640 samples/s/p 4:56:07 } +2024-07-25 20:12:25,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 928/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 2.7875269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:25,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43568 samples/s/p 4:56:07 } +2024-07-25 20:12:28,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 930/ 1625], loss: 1.020, per_step_time: 1471ms, lr: 2.7872022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:28,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43794 samples/s/p 4:55:56 } +2024-07-25 20:12:31,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 932/ 1625], loss: 1.220, 
per_step_time: 1471ms, lr: 2.7868771e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:31,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43564 samples/s/p 4:56:01 } +2024-07-25 20:12:34,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 934/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 2.7865519e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:34,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43983 samples/s/p 4:55:44 } +2024-07-25 20:12:36,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 936/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 2.7862265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:36,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43832 samples/s/p 4:55:46 } +2024-07-25 20:12:39,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 938/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 2.7859009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:39,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43345 samples/s/p 4:55:59 } +2024-07-25 20:12:42,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 940/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.7855749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:42,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43800 samples/s/p 4:55:41 } +2024-07-25 20:12:45,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 942/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 2.7852488e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:45,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% 
|████████████ | 5.43684 samples/s/p 4:55:42 } +2024-07-25 20:12:48,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 944/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 2.7849223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:48,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43644 samples/s/p 4:55:41 } +2024-07-25 20:12:51,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 946/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 2.7845957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:51,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43915 samples/s/p 4:55:29 } +2024-07-25 20:12:54,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 948/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 2.7842689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:54,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43177 samples/s/p 4:55:50 } +2024-07-25 20:12:57,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 950/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.7839418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:57,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43695 samples/s/p 4:55:30 } +2024-07-25 20:12:57,652 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 20:13:33,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 952/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 2.7836148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:33,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43009 samples/s/p 4:55:49 } +2024-07-25 20:13:35,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 954/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.783287e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:35,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43409 samples/s/p 4:55:33 } +2024-07-25 20:13:38,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 956/ 1625], loss: 1.364, per_step_time: 1472ms, lr: 2.7829592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:38,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43300 samples/s/p 4:55:34 } +2024-07-25 20:13:41,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 958/ 1625], loss: 1.083, per_step_time: 1470ms, lr: 2.7826314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:41,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.44027 samples/s/p 4:55:07 } +2024-07-25 20:13:44,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 960/ 1625], loss: 1.353, per_step_time: 1472ms, lr: 2.7823033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:44,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43437 samples/s/p 4:55:24 } +2024-07-25 20:13:47,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 962/ 1625], loss: 1.129, per_step_time: 1470ms, lr: 
2.7819746e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:47,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43947 samples/s/p 4:55:04 } +2024-07-25 20:13:50,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 964/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 2.7816463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:50,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43191 samples/s/p 4:55:26 } +2024-07-25 20:13:53,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 966/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 2.7813174e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:53,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43668 samples/s/p 4:55:07 } +2024-07-25 20:13:56,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 968/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 2.780988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:56,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.43949 samples/s/p 4:54:55 } +2024-07-25 20:13:59,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 970/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.7806589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:59,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.43638 samples/s/p 4:55:02 } +2024-07-25 20:14:02,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 972/ 1625], loss: 1.335, per_step_time: 1472ms, lr: 2.7803293e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:02,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.43208 
samples/s/p 4:55:14 } +2024-07-25 20:14:05,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 974/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 2.7799997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:05,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.43283 samples/s/p 4:55:08 } +2024-07-25 20:14:08,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 976/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 2.7796697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:08,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.43255 samples/s/p 4:55:06 } +2024-07-25 20:14:11,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 978/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.7793394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:11,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.43403 samples/s/p 4:54:58 } +2024-07-25 20:14:14,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 980/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 2.7790089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:14,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.43663 samples/s/p 4:54:47 } +2024-07-25 20:14:17,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 982/ 1625], loss: 0.806, per_step_time: 1471ms, lr: 2.7786784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:17,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.43542 samples/s/p 4:54:48 } +2024-07-25 20:14:20,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 984/ 1625], loss: 1.072, 
per_step_time: 1471ms, lr: 2.7783473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:20,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43672 samples/s/p 4:54:41 } +2024-07-25 20:14:23,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 986/ 1625], loss: 1.046, per_step_time: 1470ms, lr: 2.7780163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:23,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43981 samples/s/p 4:54:28 } +2024-07-25 20:14:26,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 988/ 1625], loss: 1.323, per_step_time: 1471ms, lr: 2.7776849e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:26,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43836 samples/s/p 4:54:30 } +2024-07-25 20:14:29,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 990/ 1625], loss: 1.321, per_step_time: 1470ms, lr: 2.7773533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:29,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43854 samples/s/p 4:54:26 } +2024-07-25 20:14:32,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 992/ 1625], loss: 1.147, per_step_time: 1473ms, lr: 2.7770213e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:32,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43080 samples/s/p 4:54:48 } +2024-07-25 20:14:35,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 994/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.7766893e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:35,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
26.1% |█████████████ | 5.43428 samples/s/p 4:54:34 } +2024-07-25 20:14:37,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 996/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 2.7763572e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:37,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43484 samples/s/p 4:54:29 } +2024-07-25 20:14:40,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 998/ 1625], loss: 0.991, per_step_time: 1470ms, lr: 2.7760247e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:40,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43877 samples/s/p 4:54:13 } +2024-07-25 20:14:43,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1000/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.7756918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:43,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43229 samples/s/p 4:54:32 } +2024-07-25 20:14:46,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1002/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 2.775359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:46,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43900 samples/s/p 4:54:07 } +2024-07-25 20:14:49,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1004/ 1625], loss: 1.410, per_step_time: 1470ms, lr: 2.775026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:49,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.44039 samples/s/p 4:53:59 } +2024-07-25 20:14:52,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 
1006/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 2.7746924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:52,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43955 samples/s/p 4:53:59 } +2024-07-25 20:14:55,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1008/ 1625], loss: 1.236, per_step_time: 1473ms, lr: 2.7743588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:55,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.42769 samples/s/p 4:54:35 } +2024-07-25 20:14:58,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1010/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 2.774025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:58,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43906 samples/s/p 4:53:55 } +2024-07-25 20:15:01,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1012/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 2.7736909e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:01,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43213 samples/s/p 4:54:14 } +2024-07-25 20:15:04,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1014/ 1625], loss: 1.027, per_step_time: 1470ms, lr: 2.7733566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:04,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43881 samples/s/p 4:53:50 } +2024-07-25 20:15:07,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1016/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 2.7730222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:07,459 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43136 samples/s/p 4:54:11 } +2024-07-25 20:15:10,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1018/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 2.7726874e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:10,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43373 samples/s/p 4:54:00 } +2024-07-25 20:15:13,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1020/ 1625], loss: 0.972, per_step_time: 1470ms, lr: 2.7723525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:13,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43918 samples/s/p 4:53:40 } +2024-07-25 20:15:16,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1022/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.7720173e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:16,310 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43476 samples/s/p 4:53:51 } +2024-07-25 20:15:19,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1024/ 1625], loss: 1.382, per_step_time: 1474ms, lr: 2.7716818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:19,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.42564 samples/s/p 4:54:18 } +2024-07-25 20:15:22,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1026/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 2.771346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:22,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43132 samples/s/p 4:53:56 } +2024-07-25 20:15:25,170 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1028/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 2.7710103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:25,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43513 samples/s/p 4:53:41 } +2024-07-25 20:15:28,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1030/ 1625], loss: 1.203, per_step_time: 1473ms, lr: 2.7706741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:28,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.42857 samples/s/p 4:53:59 } +2024-07-25 20:15:31,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1032/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 2.7703378e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:31,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.44177 samples/s/p 4:53:14 } +2024-07-25 20:15:34,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1034/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.7700013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:34,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43711 samples/s/p 4:53:26 } +2024-07-25 20:15:36,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1036/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 2.7696644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:36,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43949 samples/s/p 4:53:15 } +2024-07-25 20:15:39,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1038/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 2.7693275e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:15:39,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43531 samples/s/p 4:53:26 } +2024-07-25 20:15:42,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1040/ 1625], loss: 1.193, per_step_time: 1474ms, lr: 2.7689903e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:42,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.42392 samples/s/p 4:54:00 } +2024-07-25 20:15:45,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1042/ 1625], loss: 0.997, per_step_time: 1470ms, lr: 2.7686527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:45,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43934 samples/s/p 4:53:07 } +2024-07-25 20:15:48,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1044/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 2.768315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:48,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43107 samples/s/p 4:53:31 } +2024-07-25 20:15:51,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1046/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.7679771e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:51,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43550 samples/s/p 4:53:13 } +2024-07-25 20:15:54,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1048/ 1625], loss: 1.017, per_step_time: 1471ms, lr: 2.7676391e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:54,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43823 samples/s/p 4:53:02 
} +2024-07-25 20:15:57,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1050/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.7673008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:57,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43620 samples/s/p 4:53:05 } +2024-07-25 20:16:00,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1052/ 1625], loss: 1.420, per_step_time: 1472ms, lr: 2.766962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:00,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43309 samples/s/p 4:53:12 } +2024-07-25 20:16:03,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1054/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.7666232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:03,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43797 samples/s/p 4:52:54 } +2024-07-25 20:16:06,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1056/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.766284e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:06,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43023 samples/s/p 4:53:16 } +2024-07-25 20:16:09,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1058/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.765945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:09,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43819 samples/s/p 4:52:47 } +2024-07-25 20:16:12,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1060/ 1625], loss: 1.163, per_step_time: 1473ms, lr: 
2.7656057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:12,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.42823 samples/s/p 4:53:16 } +2024-07-25 20:16:15,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1062/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 2.7652659e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:15,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43138 samples/s/p 4:53:03 } +2024-07-25 20:16:18,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1064/ 1625], loss: 1.122, per_step_time: 1473ms, lr: 2.764926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:18,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.42994 samples/s/p 4:53:05 } +2024-07-25 20:16:21,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1066/ 1625], loss: 1.355, per_step_time: 1471ms, lr: 2.764586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:21,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43731 samples/s/p 4:52:38 } +2024-07-25 20:16:24,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1068/ 1625], loss: 1.314, per_step_time: 1474ms, lr: 2.7642454e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:24,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.42731 samples/s/p 4:53:08 } +2024-07-25 20:16:27,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1070/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 2.763905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:27,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 
5.43708 samples/s/p 4:52:33 } +2024-07-25 20:16:30,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1072/ 1625], loss: 1.266, per_step_time: 1484ms, lr: 2.763564e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:30,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.39069 samples/s/p 4:55:01 } +2024-07-25 20:16:33,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1074/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 2.7632228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:33,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43953 samples/s/p 4:52:19 } +2024-07-25 20:16:36,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1076/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 2.7628816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:36,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43447 samples/s/p 4:52:33 } +2024-07-25 20:16:38,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1078/ 1625], loss: 1.014, per_step_time: 1471ms, lr: 2.7625401e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:38,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43811 samples/s/p 4:52:18 } +2024-07-25 20:16:41,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1080/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 2.7621985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:41,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43889 samples/s/p 4:52:12 } +2024-07-25 20:16:44,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1082/ 1625], loss: 
1.135, per_step_time: 1471ms, lr: 2.7618566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:44,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.43531 samples/s/p 4:52:21 } +2024-07-25 20:16:47,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1084/ 1625], loss: 1.050, per_step_time: 1473ms, lr: 2.7615144e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:47,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.42937 samples/s/p 4:52:37 } +2024-07-25 20:16:50,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1086/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 2.7611719e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:50,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.43398 samples/s/p 4:52:20 } +2024-07-25 20:16:53,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1088/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 2.7608294e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:53,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.43771 samples/s/p 4:52:05 } +2024-07-25 20:16:56,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1090/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 2.7604865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:56,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.43612 samples/s/p 4:52:07 } +2024-07-25 20:16:59,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1092/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 2.7601433e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:59,639 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 26.7% |█████████████ | 5.43464 samples/s/p 4:52:09 } +2024-07-25 20:17:02,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1094/ 1625], loss: 1.117, per_step_time: 1475ms, lr: 2.7598004e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:02,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.42285 samples/s/p 4:52:44 } +2024-07-25 20:17:05,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1096/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 2.7594568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:05,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.43398 samples/s/p 4:52:05 } +2024-07-25 20:17:08,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1098/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 2.759113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:08,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43493 samples/s/p 4:51:59 } +2024-07-25 20:17:11,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1100/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 2.758769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:11,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43821 samples/s/p 4:51:45 } +2024-07-25 20:17:14,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1102/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 2.7584249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:14,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43119 samples/s/p 4:52:05 } +2024-07-25 20:17:17,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], 
step:[ 1104/ 1625], loss: 1.382, per_step_time: 1471ms, lr: 2.7580805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:17,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43618 samples/s/p 4:51:46 } +2024-07-25 20:17:20,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1106/ 1625], loss: 1.127, per_step_time: 1483ms, lr: 2.7577358e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:20,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.39350 samples/s/p 4:54:01 } +2024-07-25 20:17:23,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1108/ 1625], loss: 1.325, per_step_time: 1473ms, lr: 2.7573911e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:23,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.42955 samples/s/p 4:52:01 } +2024-07-25 20:17:26,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1110/ 1625], loss: 1.201, per_step_time: 1471ms, lr: 2.7570459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:26,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43820 samples/s/p 4:51:31 } +2024-07-25 20:17:29,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1112/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 2.7567006e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:29,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43575 samples/s/p 4:51:36 } +2024-07-25 20:17:32,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1114/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 2.756355e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:32,131 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.43750 samples/s/p 4:51:27 } +2024-07-25 20:17:35,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1116/ 1625], loss: 1.316, per_step_time: 1470ms, lr: 2.7560092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:35,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.44070 samples/s/p 4:51:14 } +2024-07-25 20:17:38,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1118/ 1625], loss: 1.126, per_step_time: 1473ms, lr: 2.7556633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:38,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.42921 samples/s/p 4:51:48 } +2024-07-25 20:17:40,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1120/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 2.7553173e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:40,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.43441 samples/s/p 4:51:28 } +2024-07-25 20:17:43,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1122/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 2.7549708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:43,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.42769 samples/s/p 4:51:47 } +2024-07-25 20:17:46,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1124/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.754624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:46,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.43003 samples/s/p 4:51:36 } +2024-07-25 20:17:49,847 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1126/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 2.7542774e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:49,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.42979 samples/s/p 4:51:34 } +2024-07-25 20:17:52,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1128/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.7539303e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:52,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.43464 samples/s/p 4:51:16 } +2024-07-25 20:17:55,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1130/ 1625], loss: 1.198, per_step_time: 1470ms, lr: 2.7535827e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:55,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.44014 samples/s/p 4:50:55 } +2024-07-25 20:17:58,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1132/ 1625], loss: 1.112, per_step_time: 1469ms, lr: 2.7532353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:58,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.44255 samples/s/p 4:50:44 } +2024-07-25 20:18:01,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1134/ 1625], loss: 1.421, per_step_time: 1471ms, lr: 2.7528875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:01,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43734 samples/s/p 4:50:58 } +2024-07-25 20:18:04,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1136/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.7525399e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:18:04,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43443 samples/s/p 4:51:04 } +2024-07-25 20:18:07,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1138/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 2.7521915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:07,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43217 samples/s/p 4:51:09 } +2024-07-25 20:18:10,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1140/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.751843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:10,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43574 samples/s/p 4:50:54 } +2024-07-25 20:18:13,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1142/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 2.7514943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:13,448 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43654 samples/s/p 4:50:49 } +2024-07-25 20:18:16,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1144/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.7511456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:16,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43276 samples/s/p 4:50:58 } +2024-07-25 20:18:19,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1146/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 2.7507964e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:19,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.44030 samples/s/p 4:50:31 
} +2024-07-25 20:18:22,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1148/ 1625], loss: 1.348, per_step_time: 1472ms, lr: 2.7504475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:22,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43478 samples/s/p 4:50:46 } +2024-07-25 20:18:25,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1150/ 1625], loss: 1.358, per_step_time: 1473ms, lr: 2.7500977e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:25,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43006 samples/s/p 4:50:58 } +2024-07-25 20:18:28,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1152/ 1625], loss: 1.253, per_step_time: 1470ms, lr: 2.7497483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:28,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.44153 samples/s/p 4:50:18 } +2024-07-25 20:18:31,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1154/ 1625], loss: 1.227, per_step_time: 1470ms, lr: 2.749398e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:31,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.44097 samples/s/p 4:50:17 } +2024-07-25 20:18:34,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1156/ 1625], loss: 1.280, per_step_time: 1470ms, lr: 2.7490478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:34,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.44031 samples/s/p 4:50:16 } +2024-07-25 20:18:37,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1158/ 1625], loss: 1.337, per_step_time: 1473ms, lr: 
2.7486976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:37,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.42979 samples/s/p 4:50:47 } +2024-07-25 20:18:40,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1160/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 2.7483471e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:40,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43755 samples/s/p 4:50:19 } +2024-07-25 20:18:42,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1162/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.7479962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:42,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43292 samples/s/p 4:50:31 } +2024-07-25 20:18:45,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1164/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 2.747645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:45,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43039 samples/s/p 4:50:36 } +2024-07-25 20:18:48,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1166/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.7472937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:48,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43512 samples/s/p 4:50:18 } +2024-07-25 20:18:51,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1168/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 2.7469421e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:51,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 
5.42922 samples/s/p 4:50:34 } +2024-07-25 20:18:54,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1170/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 2.7465905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:54,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43581 samples/s/p 4:50:10 } +2024-07-25 20:18:57,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1172/ 1625], loss: 1.286, per_step_time: 1475ms, lr: 2.7462385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:57,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.42324 samples/s/p 4:50:47 } +2024-07-25 20:19:00,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1174/ 1625], loss: 1.341, per_step_time: 1473ms, lr: 2.7458864e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:00,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43005 samples/s/p 4:50:23 } +2024-07-25 20:19:03,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1176/ 1625], loss: 1.062, per_step_time: 1473ms, lr: 2.745534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:03,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.42897 samples/s/p 4:50:23 } +2024-07-25 20:19:06,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1178/ 1625], loss: 1.042, per_step_time: 1473ms, lr: 2.7451813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:06,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.42930 samples/s/p 4:50:19 } +2024-07-25 20:19:09,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1180/ 1625], loss: 
1.292, per_step_time: 1472ms, lr: 2.7448285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:09,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43285 samples/s/p 4:50:05 } +2024-07-25 20:19:12,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1182/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.7444756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:12,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43226 samples/s/p 4:50:04 } +2024-07-25 20:19:15,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1184/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 2.7441221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:15,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43560 samples/s/p 4:49:50 } +2024-07-25 20:19:18,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1186/ 1625], loss: 1.384, per_step_time: 1471ms, lr: 2.7437689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:18,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43658 samples/s/p 4:49:44 } +2024-07-25 20:19:21,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1188/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 2.7434153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:21,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43714 samples/s/p 4:49:39 } +2024-07-25 20:19:24,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1190/ 1625], loss: 1.260, per_step_time: 1470ms, lr: 2.7430611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:24,284 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 27.3% |█████████████ | 5.44065 samples/s/p 4:49:25 } +2024-07-25 20:19:27,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1192/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.742707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:27,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43148 samples/s/p 4:49:51 } +2024-07-25 20:19:30,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1194/ 1625], loss: 1.374, per_step_time: 1473ms, lr: 2.7423526e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:30,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.42981 samples/s/p 4:49:54 } +2024-07-25 20:19:33,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1196/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.7419981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:33,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43416 samples/s/p 4:49:37 } +2024-07-25 20:19:36,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1198/ 1625], loss: 1.360, per_step_time: 1474ms, lr: 2.7416432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:36,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.42619 samples/s/p 4:50:00 } +2024-07-25 20:19:39,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1200/ 1625], loss: 1.175, per_step_time: 1473ms, lr: 2.7412882e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:39,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43094 samples/s/p 4:49:41 } +2024-07-25 20:19:42,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], 
step:[ 1202/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 2.740933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:42,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43531 samples/s/p 4:49:24 } +2024-07-25 20:19:44,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1204/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.7405775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:44,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43563 samples/s/p 4:49:21 } +2024-07-25 20:19:47,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1206/ 1625], loss: 1.005, per_step_time: 1472ms, lr: 2.7402219e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:47,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43307 samples/s/p 4:49:26 } +2024-07-25 20:19:50,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1208/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 2.7398659e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:50,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43375 samples/s/p 4:49:21 } +2024-07-25 20:19:53,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1210/ 1625], loss: 1.316, per_step_time: 1473ms, lr: 2.7395097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:53,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.42934 samples/s/p 4:49:32 } +2024-07-25 20:19:56,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1212/ 1625], loss: 0.947, per_step_time: 1471ms, lr: 2.7391534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:56,761 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43803 samples/s/p 4:49:01 } +2024-07-25 20:19:59,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1214/ 1625], loss: 1.312, per_step_time: 1473ms, lr: 2.7387967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:59,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.42847 samples/s/p 4:49:29 } +2024-07-25 20:20:02,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1216/ 1625], loss: 0.958, per_step_time: 1469ms, lr: 2.73844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:02,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.44432 samples/s/p 4:48:35 } +2024-07-25 20:20:05,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1218/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.7380831e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:05,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43412 samples/s/p 4:49:05 } +2024-07-25 20:20:08,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1220/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.7377257e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:08,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43713 samples/s/p 4:48:52 } +2024-07-25 20:20:11,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1222/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 2.7373682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:11,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43384 samples/s/p 4:49:00 } +2024-07-25 20:20:14,465 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1224/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 2.7370106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:14,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43588 samples/s/p 4:48:50 } +2024-07-25 20:20:17,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1226/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 2.7366526e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:17,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43282 samples/s/p 4:48:57 } +2024-07-25 20:20:20,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1228/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 2.7362947e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:20,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43506 samples/s/p 4:48:47 } +2024-07-25 20:20:23,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1230/ 1625], loss: 1.338, per_step_time: 1470ms, lr: 2.7359361e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:23,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.44214 samples/s/p 4:48:22 } +2024-07-25 20:20:26,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1232/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 2.7355776e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:26,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43450 samples/s/p 4:48:43 } +2024-07-25 20:20:29,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1234/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 2.735219e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:20:29,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43896 samples/s/p 4:48:26 } +2024-07-25 20:20:32,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1236/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 2.73486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:32,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43552 samples/s/p 4:48:34 } +2024-07-25 20:20:35,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1238/ 1625], loss: 1.128, per_step_time: 1474ms, lr: 2.734501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:35,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.42676 samples/s/p 4:48:59 } +2024-07-25 20:20:38,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1240/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 2.7341417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:38,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43413 samples/s/p 4:48:32 } +2024-07-25 20:20:41,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1242/ 1625], loss: 1.274, per_step_time: 1471ms, lr: 2.733782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:41,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43723 samples/s/p 4:48:19 } +2024-07-25 20:20:43,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1244/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 2.7334221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:43,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43216 samples/s/p 4:48:33 } 
+2024-07-25 20:20:46,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1246/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.733062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:46,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43657 samples/s/p 4:48:16 } +2024-07-25 20:20:49,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1248/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 2.7327018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:49,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.42997 samples/s/p 4:48:34 } +2024-07-25 20:20:52,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1250/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.732341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:52,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43293 samples/s/p 4:48:21 } +2024-07-25 20:20:55,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1252/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.7319802e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:55,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43769 samples/s/p 4:48:03 } +2024-07-25 20:20:58,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1254/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 2.7316195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:58,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43412 samples/s/p 4:48:12 } +2024-07-25 20:21:01,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1256/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 
2.7312582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:01,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43667 samples/s/p 4:48:01 } +2024-07-25 20:21:04,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1258/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.7308968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:04,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43735 samples/s/p 4:47:56 } +2024-07-25 20:21:07,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1260/ 1625], loss: 1.322, per_step_time: 1470ms, lr: 2.7305352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:07,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.43999 samples/s/p 4:47:44 } +2024-07-25 20:21:10,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1262/ 1625], loss: 0.940, per_step_time: 1470ms, lr: 2.7301734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:10,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.43965 samples/s/p 4:47:42 } +2024-07-25 20:21:13,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1264/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 2.7298112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:13,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.43944 samples/s/p 4:47:40 } +2024-07-25 20:21:16,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1266/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.729449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:16,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 
5.43541 samples/s/p 4:47:50 } +2024-07-25 20:21:19,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1268/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 2.729087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:19,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.43879 samples/s/p 4:47:36 } +2024-07-25 20:21:22,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1270/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.728724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:22,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.43336 samples/s/p 4:47:51 } +2024-07-25 20:21:25,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1272/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 2.7283611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:25,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.43615 samples/s/p 4:47:39 } +2024-07-25 20:21:28,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1274/ 1625], loss: 1.105, per_step_time: 1482ms, lr: 2.727998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:28,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.39485 samples/s/p 4:49:48 } +2024-07-25 20:21:31,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1276/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 2.7276346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:31,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43698 samples/s/p 4:47:30 } +2024-07-25 20:21:34,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1278/ 1625], loss: 1.097, 
per_step_time: 1471ms, lr: 2.7272712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:34,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43504 samples/s/p 4:47:33 } +2024-07-25 20:21:37,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1280/ 1625], loss: 1.093, per_step_time: 1472ms, lr: 2.7269074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:37,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43417 samples/s/p 4:47:33 } +2024-07-25 20:21:40,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1282/ 1625], loss: 0.872, per_step_time: 1471ms, lr: 2.7265432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:40,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43763 samples/s/p 4:47:19 } +2024-07-25 20:21:43,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1284/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 2.7261793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:43,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43650 samples/s/p 4:47:20 } +2024-07-25 20:21:45,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1286/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.725815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:45,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43190 samples/s/p 4:47:32 } +2024-07-25 20:21:48,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1288/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 2.7254502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:48,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
27.9% |█████████████ | 5.42982 samples/s/p 4:47:35 } +2024-07-25 20:21:51,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1290/ 1625], loss: 1.158, per_step_time: 1470ms, lr: 2.7250853e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:51,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.44120 samples/s/p 4:46:56 } +2024-07-25 20:21:54,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1292/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 2.72472e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:54,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.42785 samples/s/p 4:47:36 } +2024-07-25 20:21:57,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1294/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 2.7243548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:57,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.43116 samples/s/p 4:47:22 } +2024-07-25 20:22:00,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1296/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.7239892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:00,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.43532 samples/s/p 4:47:06 } +2024-07-25 20:22:03,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1298/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 2.7236234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:03,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.43962 samples/s/p 4:46:50 } +2024-07-25 20:22:06,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 
1300/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 2.7232578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:06,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.43404 samples/s/p 4:47:04 } +2024-07-25 20:22:09,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1302/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 2.7228914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:09,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.43889 samples/s/p 4:46:46 } +2024-07-25 20:22:12,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1304/ 1625], loss: 1.342, per_step_time: 1477ms, lr: 2.7225251e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:12,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.41555 samples/s/p 4:47:57 } +2024-07-25 20:22:15,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1306/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 2.7221586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:15,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.43680 samples/s/p 4:46:47 } +2024-07-25 20:22:18,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1308/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.7217915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:18,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.43340 samples/s/p 4:46:54 } +2024-07-25 20:22:21,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1310/ 1625], loss: 1.328, per_step_time: 1471ms, lr: 2.7214248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:21,384 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43548 samples/s/p 4:46:45 } +2024-07-25 20:22:24,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1312/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 2.7210575e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:24,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43339 samples/s/p 4:46:49 } +2024-07-25 20:22:27,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1314/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 2.7206897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:27,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43914 samples/s/p 4:46:28 } +2024-07-25 20:22:30,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1316/ 1625], loss: 1.173, per_step_time: 1474ms, lr: 2.7203223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:30,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.42504 samples/s/p 4:47:09 } +2024-07-25 20:22:33,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1318/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 2.7199543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:33,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43674 samples/s/p 4:46:29 } +2024-07-25 20:22:36,140 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1320/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 2.7195862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:36,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43747 samples/s/p 4:46:24 } +2024-07-25 20:22:39,092 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1322/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 2.7192178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:39,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43296 samples/s/p 4:46:35 } +2024-07-25 20:22:42,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1324/ 1625], loss: 1.350, per_step_time: 1473ms, lr: 2.7188493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:42,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.42797 samples/s/p 4:46:48 } +2024-07-25 20:22:44,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1326/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 2.7184808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:44,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43742 samples/s/p 4:46:15 } +2024-07-25 20:22:47,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1328/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 2.7181119e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:47,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43845 samples/s/p 4:46:09 } +2024-07-25 20:22:50,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1330/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 2.7177426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:50,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43362 samples/s/p 4:46:21 } +2024-07-25 20:22:53,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1332/ 1625], loss: 1.136, per_step_time: 1470ms, lr: 2.7173732e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:53,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.44084 samples/s/p 4:45:56 } +2024-07-25 20:22:56,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1334/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 2.7170036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:56,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43627 samples/s/p 4:46:07 } +2024-07-25 20:22:59,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1336/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 2.7166338e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:59,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43561 samples/s/p 4:46:06 } +2024-07-25 20:23:02,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1338/ 1625], loss: 1.249, per_step_time: 1473ms, lr: 2.7162638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:02,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.42809 samples/s/p 4:46:27 } +2024-07-25 20:23:05,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1340/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 2.7158934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:05,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43700 samples/s/p 4:45:56 } +2024-07-25 20:23:08,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1342/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.7155229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:08,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43613 
samples/s/p 4:45:56 } +2024-07-25 20:23:11,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1344/ 1625], loss: 1.254, per_step_time: 1470ms, lr: 2.7151524e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:11,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43869 samples/s/p 4:45:45 } +2024-07-25 20:23:14,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1346/ 1625], loss: 0.929, per_step_time: 1471ms, lr: 2.7147813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:14,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43514 samples/s/p 4:45:53 } +2024-07-25 20:23:17,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1348/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 2.7144102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:17,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43511 samples/s/p 4:45:50 } +2024-07-25 20:23:20,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1350/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.7140388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:20,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43415 samples/s/p 4:45:50 } +2024-07-25 20:23:23,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1352/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 2.7136673e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:23,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43431 samples/s/p 4:45:47 } +2024-07-25 20:23:26,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1354/ 1625], loss: 1.323, 
per_step_time: 1471ms, lr: 2.7132955e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:26,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43623 samples/s/p 4:45:38 } +2024-07-25 20:23:29,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1356/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 2.7129236e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:29,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43099 samples/s/p 4:45:51 } +2024-07-25 20:23:32,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1358/ 1625], loss: 1.182, per_step_time: 1470ms, lr: 2.7125512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:32,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.44196 samples/s/p 4:45:14 } +2024-07-25 20:23:35,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1360/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 2.712179e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:35,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.43072 samples/s/p 4:45:46 } +2024-07-25 20:23:38,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1362/ 1625], loss: 1.262, per_step_time: 1473ms, lr: 2.7118065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:38,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.42960 samples/s/p 4:45:47 } +2024-07-25 20:23:41,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1364/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 2.7114334e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:41,070 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 28.4% |██████████████ | 5.43082 samples/s/p 4:45:40 } +2024-07-25 20:23:44,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1366/ 1625], loss: 1.283, per_step_time: 1473ms, lr: 2.7110606e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:44,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.42867 samples/s/p 4:45:44 } +2024-07-25 20:23:46,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1368/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.7106873e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:46,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.43224 samples/s/p 4:45:30 } +2024-07-25 20:23:49,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1370/ 1625], loss: 1.202, per_step_time: 1481ms, lr: 2.7103139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:49,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.40092 samples/s/p 4:47:06 } +2024-07-25 20:23:52,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1372/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 2.70994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:52,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.43628 samples/s/p 4:45:11 } +2024-07-25 20:23:55,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1374/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.709566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:55,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43655 samples/s/p 4:45:07 } +2024-07-25 20:23:58,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 
10], step:[ 1376/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 2.7091919e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:58,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.42946 samples/s/p 4:45:27 } +2024-07-25 20:24:01,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1378/ 1625], loss: 1.026, per_step_time: 1471ms, lr: 2.7088177e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:01,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43563 samples/s/p 4:45:04 } +2024-07-25 20:24:04,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1380/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 2.7084432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:04,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.42992 samples/s/p 4:45:19 } +2024-07-25 20:24:07,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1382/ 1625], loss: 1.086, per_step_time: 1483ms, lr: 2.7080683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:07,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.39268 samples/s/p 4:47:15 } +2024-07-25 20:24:10,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1384/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.7076932e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:10,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43502 samples/s/p 4:44:58 } +2024-07-25 20:24:13,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1386/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.7073182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:13,582 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43611 samples/s/p 4:44:51 } +2024-07-25 20:24:16,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1388/ 1625], loss: 1.118, per_step_time: 1473ms, lr: 2.7069427e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:16,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43063 samples/s/p 4:45:05 } +2024-07-25 20:24:19,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1390/ 1625], loss: 1.202, per_step_time: 1473ms, lr: 2.706567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:19,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43107 samples/s/p 4:45:01 } +2024-07-25 20:24:22,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1392/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 2.7061913e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:22,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.42917 samples/s/p 4:45:04 } +2024-07-25 20:24:25,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1394/ 1625], loss: 1.308, per_step_time: 1474ms, lr: 2.7058151e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:25,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.42556 samples/s/p 4:45:13 } +2024-07-25 20:24:28,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1396/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 2.705439e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:28,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43742 samples/s/p 4:44:32 } +2024-07-25 20:24:31,304 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1398/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 2.7050624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:31,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.42900 samples/s/p 4:44:56 } +2024-07-25 20:24:34,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1400/ 1625], loss: 1.187, per_step_time: 1470ms, lr: 2.7046857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:34,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43977 samples/s/p 4:44:19 } +2024-07-25 20:24:37,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1402/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 2.7043088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:37,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43542 samples/s/p 4:44:30 } +2024-07-25 20:24:40,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1404/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 2.7039318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:40,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43772 samples/s/p 4:44:20 } +2024-07-25 20:24:43,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1406/ 1625], loss: 1.244, per_step_time: 1473ms, lr: 2.7035543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:43,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.42862 samples/s/p 4:44:45 } +2024-07-25 20:24:46,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1408/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 2.703177e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:24:46,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43229 samples/s/p 4:44:31 } +2024-07-25 20:24:49,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1410/ 1625], loss: 1.049, per_step_time: 1473ms, lr: 2.702799e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:49,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.42763 samples/s/p 4:44:42 } +2024-07-25 20:24:51,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1412/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 2.7024213e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:51,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43266 samples/s/p 4:44:24 } +2024-07-25 20:24:54,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1414/ 1625], loss: 1.319, per_step_time: 1471ms, lr: 2.702043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:54,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43800 samples/s/p 4:44:04 } +2024-07-25 20:24:57,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1416/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 2.7016647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:57,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43604 samples/s/p 4:44:07 } +2024-07-25 20:25:00,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1418/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.7012862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:00,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43667 samples/s/p 
4:44:02 } +2024-07-25 20:25:03,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1420/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 2.7009073e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:03,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43180 samples/s/p 4:44:15 } +2024-07-25 20:25:06,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1422/ 1625], loss: 1.319, per_step_time: 1472ms, lr: 2.7005282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:06,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43323 samples/s/p 4:44:07 } +2024-07-25 20:25:09,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1424/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 2.700149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:09,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43424 samples/s/p 4:44:01 } +2024-07-25 20:25:12,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1426/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.6997694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:12,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43756 samples/s/p 4:43:48 } +2024-07-25 20:25:15,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1428/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 2.6993897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:15,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43226 samples/s/p 4:44:01 } +2024-07-25 20:25:18,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1430/ 1625], loss: 1.155, 
per_step_time: 1471ms, lr: 2.69901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:18,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43552 samples/s/p 4:43:48 } +2024-07-25 20:25:21,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1432/ 1625], loss: 1.159, per_step_time: 1475ms, lr: 2.69863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:21,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.42252 samples/s/p 4:44:26 } +2024-07-25 20:25:24,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1434/ 1625], loss: 1.324, per_step_time: 1472ms, lr: 2.6982496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:24,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43358 samples/s/p 4:43:48 } +2024-07-25 20:25:27,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1436/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 2.697869e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:27,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.42889 samples/s/p 4:44:00 } +2024-07-25 20:25:30,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1438/ 1625], loss: 1.206, per_step_time: 1470ms, lr: 2.6974883e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:30,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.44055 samples/s/p 4:43:21 } +2024-07-25 20:25:33,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1440/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 2.6971074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:33,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 28.9% |██████████████ | 5.43357 samples/s/p 4:43:40 } +2024-07-25 20:25:36,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1442/ 1625], loss: 1.039, per_step_time: 1471ms, lr: 2.6967262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:36,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43797 samples/s/p 4:43:23 } +2024-07-25 20:25:39,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1444/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 2.6963447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:39,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43163 samples/s/p 4:43:40 } +2024-07-25 20:25:42,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1446/ 1625], loss: 1.299, per_step_time: 1471ms, lr: 2.6959635e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:42,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43504 samples/s/p 4:43:26 } +2024-07-25 20:25:45,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1448/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 2.6955817e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:45,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43437 samples/s/p 4:43:25 } +2024-07-25 20:25:48,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1450/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.6951997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:48,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43714 samples/s/p 4:43:14 } +2024-07-25 20:25:50,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], 
step:[ 1452/ 1625], loss: 1.267, per_step_time: 1470ms, lr: 2.6948175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:50,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.44021 samples/s/p 4:43:01 } +2024-07-25 20:25:53,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1454/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 2.6944352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:53,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43572 samples/s/p 4:43:12 } +2024-07-25 20:25:56,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1456/ 1625], loss: 1.285, per_step_time: 1469ms, lr: 2.6940525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:56,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.44350 samples/s/p 4:42:45 } +2024-07-25 20:25:59,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1458/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.6936696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:59,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43238 samples/s/p 4:43:17 } +2024-07-25 20:26:02,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1460/ 1625], loss: 1.337, per_step_time: 1471ms, lr: 2.6932865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:02,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43653 samples/s/p 4:43:01 } +2024-07-25 20:26:05,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1462/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 2.6929032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:05,746 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43840 samples/s/p 4:42:52 } +2024-07-25 20:26:08,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1464/ 1625], loss: 1.191, per_step_time: 1473ms, lr: 2.69252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:08,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.42842 samples/s/p 4:43:20 } +2024-07-25 20:26:11,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1466/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 2.6921361e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:11,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43022 samples/s/p 4:43:12 } +2024-07-25 20:26:14,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1468/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 2.6917522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:14,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43441 samples/s/p 4:42:56 } +2024-07-25 20:26:17,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1470/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 2.691368e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:17,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43442 samples/s/p 4:42:53 } +2024-07-25 20:26:20,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1472/ 1625], loss: 1.258, per_step_time: 1473ms, lr: 2.6909836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:20,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.42955 samples/s/p 4:43:05 } +2024-07-25 20:26:23,460 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1474/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 2.6905991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:23,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43663 samples/s/p 4:42:40 } +2024-07-25 20:26:26,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1476/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 2.6902144e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:26,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43326 samples/s/p 4:42:48 } +2024-07-25 20:26:29,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1478/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 2.6898295e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:29,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43069 samples/s/p 4:42:53 } +2024-07-25 20:26:32,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1480/ 1625], loss: 1.109, per_step_time: 1469ms, lr: 2.6894442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:32,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.44267 samples/s/p 4:42:12 } +2024-07-25 20:26:35,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1482/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.689059e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:35,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43464 samples/s/p 4:42:34 } +2024-07-25 20:26:38,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1484/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 2.6886732e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:26:38,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43493 samples/s/p 4:42:31 } +2024-07-25 20:26:41,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1486/ 1625], loss: 1.278, per_step_time: 1470ms, lr: 2.6882875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:41,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43969 samples/s/p 4:42:13 } +2024-07-25 20:26:44,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1488/ 1625], loss: 1.294, per_step_time: 1471ms, lr: 2.6879015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:44,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43541 samples/s/p 4:42:23 } +2024-07-25 20:26:47,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1490/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 2.6875154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:47,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43376 samples/s/p 4:42:25 } +2024-07-25 20:26:50,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1492/ 1625], loss: 1.266, per_step_time: 1473ms, lr: 2.687129e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:50,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43091 samples/s/p 4:42:31 } +2024-07-25 20:26:52,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1494/ 1625], loss: 1.088, per_step_time: 1471ms, lr: 2.6867421e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:52,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43663 samples/s/p 
4:42:11 } +2024-07-25 20:26:55,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1496/ 1625], loss: 1.056, per_step_time: 1470ms, lr: 2.6863554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:55,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43956 samples/s/p 4:41:59 } +2024-07-25 20:26:58,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1498/ 1625], loss: 1.029, per_step_time: 1472ms, lr: 2.6859683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:58,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43425 samples/s/p 4:42:12 } +2024-07-25 20:27:01,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1500/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 2.685581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:01,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43638 samples/s/p 4:42:03 } +2024-07-25 20:27:04,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1502/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 2.6851938e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:04,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43647 samples/s/p 4:41:59 } +2024-07-25 20:27:07,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1504/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 2.6848062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:07,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43482 samples/s/p 4:42:01 } +2024-07-25 20:27:10,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1506/ 1625], loss: 1.120, 
per_step_time: 1471ms, lr: 2.6844182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:10,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43589 samples/s/p 4:41:55 } +2024-07-25 20:27:13,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1508/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 2.68403e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:13,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43661 samples/s/p 4:41:50 } +2024-07-25 20:27:16,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1510/ 1625], loss: 1.010, per_step_time: 1473ms, lr: 2.6836418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:16,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.42995 samples/s/p 4:42:08 } +2024-07-25 20:27:19,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1512/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 2.6832533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:19,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43050 samples/s/p 4:42:03 } +2024-07-25 20:27:22,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1514/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 2.6828646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:22,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43545 samples/s/p 4:41:45 } +2024-07-25 20:27:25,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1516/ 1625], loss: 1.383, per_step_time: 1469ms, lr: 2.6824755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:25,425 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 29.3% |██████████████ | 5.44307 samples/s/p 4:41:18 } +2024-07-25 20:27:28,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1518/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.6820864e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:28,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43777 samples/s/p 4:41:32 } +2024-07-25 20:27:31,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1520/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 2.6816972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:31,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.43342 samples/s/p 4:41:42 } +2024-07-25 20:27:34,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1522/ 1625], loss: 1.282, per_step_time: 1474ms, lr: 2.6813075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:34,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.42684 samples/s/p 4:42:00 } +2024-07-25 20:27:37,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1524/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 2.6809177e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:37,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.42804 samples/s/p 4:41:53 } +2024-07-25 20:27:40,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1526/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.6805277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:40,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.43399 samples/s/p 4:41:32 } +2024-07-25 20:27:43,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 
10], step:[ 1528/ 1625], loss: 1.012, per_step_time: 1470ms, lr: 2.6801375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:43,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.43901 samples/s/p 4:41:13 } +2024-07-25 20:27:46,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1530/ 1625], loss: 1.238, per_step_time: 1473ms, lr: 2.679747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:46,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.42893 samples/s/p 4:41:42 } +2024-07-25 20:27:49,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1532/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 2.6793565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:49,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.43449 samples/s/p 4:41:21 } +2024-07-25 20:27:51,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1534/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 2.6789658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:51,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.43500 samples/s/p 4:41:17 } +2024-07-25 20:27:54,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1536/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 2.6785747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:54,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43205 samples/s/p 4:41:23 } +2024-07-25 20:27:57,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1538/ 1625], loss: 1.277, per_step_time: 1474ms, lr: 2.6781836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:57,904 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.42537 samples/s/p 4:41:41 } +2024-07-25 20:28:00,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1540/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.6777923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:00,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43768 samples/s/p 4:41:00 } +2024-07-25 20:28:03,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1542/ 1625], loss: 1.245, per_step_time: 1470ms, lr: 2.6774005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:03,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43900 samples/s/p 4:40:53 } +2024-07-25 20:28:06,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1544/ 1625], loss: 1.035, per_step_time: 1470ms, lr: 2.6770087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:06,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43849 samples/s/p 4:40:51 } +2024-07-25 20:28:09,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1546/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 2.6766167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:09,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43275 samples/s/p 4:41:06 } +2024-07-25 20:28:12,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1548/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 2.6762244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:12,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43475 samples/s/p 4:40:57 } +2024-07-25 20:28:15,607 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1550/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 2.675832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:15,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43326 samples/s/p 4:40:59 } +2024-07-25 20:28:18,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1552/ 1625], loss: 1.267, per_step_time: 1470ms, lr: 2.6754393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:18,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43862 samples/s/p 4:40:39 } +2024-07-25 20:28:21,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1554/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 2.6750464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:21,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.42862 samples/s/p 4:41:07 } +2024-07-25 20:28:24,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1556/ 1625], loss: 1.202, per_step_time: 1470ms, lr: 2.6746531e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:24,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43930 samples/s/p 4:40:31 } +2024-07-25 20:28:27,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1558/ 1625], loss: 1.379, per_step_time: 1471ms, lr: 2.67426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:27,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43609 samples/s/p 4:40:38 } +2024-07-25 20:28:30,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1560/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 2.6738662e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:28:30,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43786 samples/s/p 4:40:30 } +2024-07-25 20:28:33,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1562/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 2.6734724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:33,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43975 samples/s/p 4:40:21 } +2024-07-25 20:28:36,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1564/ 1625], loss: 1.164, per_step_time: 1470ms, lr: 2.6730788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:36,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43938 samples/s/p 4:40:19 } +2024-07-25 20:28:39,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1566/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 2.6726846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:39,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43508 samples/s/p 4:40:29 } +2024-07-25 20:28:42,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1568/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 2.67229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:42,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43816 samples/s/p 4:40:17 } +2024-07-25 20:28:45,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1570/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 2.6718957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:45,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43386 samples/s/p 
4:40:27 } +2024-07-25 20:28:48,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1572/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.671501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:48,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43180 samples/s/p 4:40:31 } +2024-07-25 20:28:51,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1574/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 2.6711057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:51,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43504 samples/s/p 4:40:18 } +2024-07-25 20:28:53,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1576/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 2.6707106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:53,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.42792 samples/s/p 4:40:37 } +2024-07-25 20:28:56,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1578/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 2.6703154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:56,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43907 samples/s/p 4:39:59 } +2024-07-25 20:28:59,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1580/ 1625], loss: 1.318, per_step_time: 1471ms, lr: 2.6699196e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:59,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43579 samples/s/p 4:40:07 } +2024-07-25 20:29:02,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1582/ 1625], loss: 1.154, 
per_step_time: 1470ms, lr: 2.6695237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:02,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.44103 samples/s/p 4:39:47 } +2024-07-25 20:29:05,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1584/ 1625], loss: 1.021, per_step_time: 1470ms, lr: 2.669128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:05,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.44036 samples/s/p 4:39:47 } +2024-07-25 20:29:08,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1586/ 1625], loss: 1.047, per_step_time: 1471ms, lr: 2.6687318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:08,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43562 samples/s/p 4:39:58 } +2024-07-25 20:29:11,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1588/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 2.6683352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:11,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43378 samples/s/p 4:40:01 } +2024-07-25 20:29:14,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1590/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.6679389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:14,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43808 samples/s/p 4:39:45 } +2024-07-25 20:29:17,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1592/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.667542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:17,563 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 29.8% |██████████████ | 5.43387 samples/s/p 4:39:55 } +2024-07-25 20:29:20,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1594/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 2.667145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:20,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43167 samples/s/p 4:39:59 } +2024-07-25 20:29:23,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1596/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 2.6667478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:23,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43379 samples/s/p 4:39:49 } +2024-07-25 20:29:26,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1598/ 1625], loss: 1.318, per_step_time: 1471ms, lr: 2.6663502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:26,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43544 samples/s/p 4:39:41 } +2024-07-25 20:29:29,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1600/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 2.6659527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:29,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43783 samples/s/p 4:39:31 } +2024-07-25 20:29:32,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1602/ 1625], loss: 1.137, per_step_time: 1473ms, lr: 2.6655547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:32,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43056 samples/s/p 4:39:50 } +2024-07-25 20:29:35,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 
10], step:[ 1604/ 1625], loss: 1.150, per_step_time: 1481ms, lr: 2.6651567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:35,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.40116 samples/s/p 4:41:19 } +2024-07-25 20:29:38,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1606/ 1625], loss: 1.109, per_step_time: 1473ms, lr: 2.6647582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:38,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.42799 samples/s/p 4:39:52 } +2024-07-25 20:29:41,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1608/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.66436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:41,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43282 samples/s/p 4:39:35 } +2024-07-25 20:29:44,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1610/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 2.6639615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:44,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43584 samples/s/p 4:39:22 } +2024-07-25 20:29:47,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1612/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 2.6635624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:47,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43763 samples/s/p 4:39:14 } +2024-07-25 20:29:50,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1614/ 1625], loss: 1.079, per_step_time: 1472ms, lr: 2.6631631e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:50,051 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43207 samples/s/p 4:39:28 } +2024-07-25 20:29:53,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1616/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 2.6627638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:53,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43279 samples/s/p 4:39:23 } +2024-07-25 20:29:55,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1618/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 2.6623644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:55,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.43839 samples/s/p 4:39:03 } +2024-07-25 20:29:58,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1620/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 2.6619646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:58,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.43137 samples/s/p 4:39:21 } +2024-07-25 20:30:01,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1622/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 2.6615648e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:01,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.43344 samples/s/p 4:39:12 } +2024-07-25 20:30:04,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1624/ 1625], loss: 1.268, per_step_time: 1471ms, lr: 2.661165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:04,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.43760 samples/s/p 4:38:56 } +2024-07-25 20:30:07,756 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 2.6607646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:07,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.43463 samples/s/p 4:39:03 } +2024-07-25 20:30:10,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 3/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.660364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:10,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.43720 samples/s/p 4:38:52 } +2024-07-25 20:30:13,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 5/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 2.6599633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:13,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.43761 samples/s/p 4:38:47 } +2024-07-25 20:30:16,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 7/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 2.6595622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:16,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.44083 samples/s/p 4:38:35 } +2024-07-25 20:30:19,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 9/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.6591613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:19,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43520 samples/s/p 4:38:49 } +2024-07-25 20:30:22,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 11/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 2.6587599e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 20:30:22,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43834 samples/s/p 4:38:36 } +2024-07-25 20:30:25,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 13/ 1625], loss: 1.118, per_step_time: 1473ms, lr: 2.6583582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:25,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.42876 samples/s/p 4:39:03 } +2024-07-25 20:30:28,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 15/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 2.6579564e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:28,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43804 samples/s/p 4:38:31 } +2024-07-25 20:30:31,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 17/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 2.6575546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:31,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43417 samples/s/p 4:38:40 } +2024-07-25 20:30:34,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 19/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.6571523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:34,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43336 samples/s/p 4:38:40 } +2024-07-25 20:30:37,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 21/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.6567499e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:37,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43806 samples/s/p 4:38:23 } 
+2024-07-25 20:30:40,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 23/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 2.6563475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:40,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43393 samples/s/p 4:38:32 } +2024-07-25 20:30:43,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 25/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 2.6559446e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:43,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43255 samples/s/p 4:38:34 } +2024-07-25 20:30:46,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 27/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 2.6555417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:46,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43608 samples/s/p 4:38:20 } +2024-07-25 20:30:49,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 29/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 2.6551385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:49,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43467 samples/s/p 4:38:21 } +2024-07-25 20:30:52,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 31/ 1625], loss: 1.000, per_step_time: 1471ms, lr: 2.654735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:52,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43784 samples/s/p 4:38:08 } +2024-07-25 20:30:54,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 33/ 1625], loss: 0.991, per_step_time: 1471ms, lr: 
2.6543314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:54,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43735 samples/s/p 4:38:07 } +2024-07-25 20:30:57,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 35/ 1625], loss: 1.309, per_step_time: 1471ms, lr: 2.6539275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:57,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43531 samples/s/p 4:38:10 } +2024-07-25 20:31:00,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 37/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 2.6535236e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:00,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43603 samples/s/p 4:38:05 } +2024-07-25 20:31:03,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 39/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.6531194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:03,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43452 samples/s/p 4:38:07 } +2024-07-25 20:31:06,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 41/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.652715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:06,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43257 samples/s/p 4:38:10 } +2024-07-25 20:31:09,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 43/ 1625], loss: 1.054, per_step_time: 1473ms, lr: 2.6523103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:09,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 
5.42915 samples/s/p 4:38:18 } +2024-07-25 20:31:12,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 45/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.6519056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:12,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43669 samples/s/p 4:37:51 } +2024-07-25 20:31:15,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 47/ 1625], loss: 1.002, per_step_time: 1472ms, lr: 2.6515005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:15,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43473 samples/s/p 4:37:54 } +2024-07-25 20:31:18,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 49/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 2.6510952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:18,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43274 samples/s/p 4:37:58 } +2024-07-25 20:31:21,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 51/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 2.6506901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:21,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43553 samples/s/p 4:37:46 } +2024-07-25 20:31:24,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 53/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 2.6502841e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:24,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43880 samples/s/p 4:37:33 } +2024-07-25 20:31:27,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 55/ 1625], loss: 1.330, 
per_step_time: 1472ms, lr: 2.6498787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:27,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43226 samples/s/p 4:37:50 } +2024-07-25 20:31:30,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 57/ 1625], loss: 1.054, per_step_time: 1472ms, lr: 2.6494725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:30,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43342 samples/s/p 4:37:44 } +2024-07-25 20:31:33,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 59/ 1625], loss: 1.363, per_step_time: 1472ms, lr: 2.6490663e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:33,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43229 samples/s/p 4:37:44 } +2024-07-25 20:31:36,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 61/ 1625], loss: 1.154, per_step_time: 1470ms, lr: 2.64866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:36,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.44036 samples/s/p 4:37:17 } +2024-07-25 20:31:39,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 63/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.6482532e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:39,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43357 samples/s/p 4:37:34 } +2024-07-25 20:31:42,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 65/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 2.6478463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:42,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
30.4% |███████████████ | 5.43659 samples/s/p 4:37:22 } +2024-07-25 20:31:45,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 67/ 1625], loss: 1.040, per_step_time: 1473ms, lr: 2.6474394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:45,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43105 samples/s/p 4:37:36 } +2024-07-25 20:31:48,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 69/ 1625], loss: 0.995, per_step_time: 1470ms, lr: 2.6470321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:48,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43849 samples/s/p 4:37:11 } +2024-07-25 20:31:51,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 71/ 1625], loss: 1.243, per_step_time: 1469ms, lr: 2.6466245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:51,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.44238 samples/s/p 4:36:56 } +2024-07-25 20:31:53,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 73/ 1625], loss: 0.988, per_step_time: 1470ms, lr: 2.6462169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:53,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43901 samples/s/p 4:37:03 } +2024-07-25 20:31:56,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 75/ 1625], loss: 1.136, per_step_time: 1470ms, lr: 2.645809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:56,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43850 samples/s/p 4:37:02 } +2024-07-25 20:31:59,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 
77/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 2.645401e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:59,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43596 samples/s/p 4:37:07 } +2024-07-25 20:32:02,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 79/ 1625], loss: 1.144, per_step_time: 1472ms, lr: 2.6449929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:02,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43298 samples/s/p 4:37:13 } +2024-07-25 20:32:05,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 81/ 1625], loss: 1.022, per_step_time: 1472ms, lr: 2.6445841e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:05,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43197 samples/s/p 4:37:13 } +2024-07-25 20:32:08,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 83/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.6441756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:08,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43829 samples/s/p 4:36:51 } +2024-07-25 20:32:11,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 85/ 1625], loss: 0.944, per_step_time: 1471ms, lr: 2.6437665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:11,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43510 samples/s/p 4:36:57 } +2024-07-25 20:32:14,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 87/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 2.6433578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:14,636 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43473 samples/s/p 4:36:56 } +2024-07-25 20:32:17,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 89/ 1625], loss: 0.988, per_step_time: 1472ms, lr: 2.6429483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:17,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43379 samples/s/p 4:36:56 } +2024-07-25 20:32:20,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 91/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 2.642539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:20,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43592 samples/s/p 4:36:46 } +2024-07-25 20:32:23,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 93/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 2.6421292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:23,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43352 samples/s/p 4:36:50 } +2024-07-25 20:32:26,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 95/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.6417194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:26,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43760 samples/s/p 4:36:35 } +2024-07-25 20:32:29,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 97/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 2.6413092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:29,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43432 samples/s/p 4:36:42 } +2024-07-25 20:32:32,340 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 99/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 2.640899e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:32,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43817 samples/s/p 4:36:27 } +2024-07-25 20:32:35,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 101/ 1625], loss: 1.247, per_step_time: 1470ms, lr: 2.6404885e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:35,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.44108 samples/s/p 4:36:16 } +2024-07-25 20:32:38,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 103/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.640078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:38,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43321 samples/s/p 4:36:37 } +2024-07-25 20:32:41,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 105/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 2.639667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:41,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43151 samples/s/p 4:36:39 } +2024-07-25 20:32:44,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 107/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 2.639256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:44,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43834 samples/s/p 4:36:15 } +2024-07-25 20:32:47,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 109/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.6388447e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:32:47,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43702 samples/s/p 4:36:16 } +2024-07-25 20:32:50,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 111/ 1625], loss: 1.150, per_step_time: 1469ms, lr: 2.6384332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:50,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.44269 samples/s/p 4:35:56 } +2024-07-25 20:32:52,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 113/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 2.6380214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:52,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43731 samples/s/p 4:36:09 } +2024-07-25 20:32:55,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 115/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.6376096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:55,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43160 samples/s/p 4:36:24 } +2024-07-25 20:32:58,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 117/ 1625], loss: 1.172, per_step_time: 1474ms, lr: 2.6371974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:58,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.42504 samples/s/p 4:36:41 } +2024-07-25 20:33:01,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 119/ 1625], loss: 1.298, per_step_time: 1474ms, lr: 2.6367852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:01,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.42591 samples/s/p 
4:36:35 } +2024-07-25 20:33:04,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 121/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 2.6363727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:04,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43450 samples/s/p 4:36:06 } +2024-07-25 20:33:07,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 123/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 2.63596e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:07,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43743 samples/s/p 4:35:54 } +2024-07-25 20:33:10,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 125/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 2.635547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:10,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43789 samples/s/p 4:35:50 } +2024-07-25 20:33:13,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 127/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 2.635134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:13,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43154 samples/s/p 4:36:06 } +2024-07-25 20:33:16,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 129/ 1625], loss: 1.027, per_step_time: 1470ms, lr: 2.6347207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:16,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.44049 samples/s/p 4:35:36 } +2024-07-25 20:33:19,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 131/ 1625], loss: 1.065, per_step_time: 
1471ms, lr: 2.6343072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:19,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43628 samples/s/p 4:35:46 } +2024-07-25 20:33:22,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 133/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.6338936e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:22,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43746 samples/s/p 4:35:40 } +2024-07-25 20:33:25,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 135/ 1625], loss: 1.212, per_step_time: 1473ms, lr: 2.6334796e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:25,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43008 samples/s/p 4:35:59 } +2024-07-25 20:33:28,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 137/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.6330656e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:28,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43836 samples/s/p 4:35:31 } +2024-07-25 20:33:31,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 139/ 1625], loss: 1.209, per_step_time: 1474ms, lr: 2.632651e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:31,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.42543 samples/s/p 4:36:07 } +2024-07-25 20:33:34,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 141/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 2.6322365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:34,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% 
|███████████████ | 5.43815 samples/s/p 4:35:26 } +2024-07-25 20:33:37,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 143/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 2.6318221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:37,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43743 samples/s/p 4:35:25 } +2024-07-25 20:33:40,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 145/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 2.631407e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:40,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43145 samples/s/p 4:35:40 } +2024-07-25 20:33:43,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 147/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 2.6309921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:43,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43345 samples/s/p 4:35:31 } +2024-07-25 20:33:46,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 149/ 1625], loss: 1.344, per_step_time: 1471ms, lr: 2.6305768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:46,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43635 samples/s/p 4:35:19 } +2024-07-25 20:33:49,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 151/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 2.6301614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:49,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43850 samples/s/p 4:35:10 } +2024-07-25 20:33:52,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 
153/ 1625], loss: 1.080, per_step_time: 1469ms, lr: 2.6297457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:52,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.44324 samples/s/p 4:34:53 } +2024-07-25 20:33:54,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 155/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 2.6293299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:54,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.43945 samples/s/p 4:35:01 } +2024-07-25 20:33:57,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 157/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 2.6289135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:57,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.43836 samples/s/p 4:35:02 } +2024-07-25 20:34:00,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 159/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.6284974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:00,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.43672 samples/s/p 4:35:04 } +2024-07-25 20:34:03,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 161/ 1625], loss: 1.036, per_step_time: 1472ms, lr: 2.6280808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:03,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.43188 samples/s/p 4:35:15 } +2024-07-25 20:34:06,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 163/ 1625], loss: 1.125, per_step_time: 1474ms, lr: 2.6276643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:06,770 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.42454 samples/s/p 4:35:35 } +2024-07-25 20:34:09,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 165/ 1625], loss: 1.003, per_step_time: 1470ms, lr: 2.6272473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:09,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.43992 samples/s/p 4:34:45 } +2024-07-25 20:34:12,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 167/ 1625], loss: 1.246, per_step_time: 1474ms, lr: 2.6268302e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:12,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.42485 samples/s/p 4:35:28 } +2024-07-25 20:34:15,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 169/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 2.6264128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:15,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.42810 samples/s/p 4:35:15 } +2024-07-25 20:34:18,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 171/ 1625], loss: 1.268, per_step_time: 1471ms, lr: 2.6259953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:18,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43589 samples/s/p 4:34:48 } +2024-07-25 20:34:21,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 173/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.6255777e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:21,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43435 samples/s/p 4:34:50 } +2024-07-25 20:34:24,484 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 175/ 1625], loss: 1.049, per_step_time: 1472ms, lr: 2.6251599e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:24,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43197 samples/s/p 4:34:54 } +2024-07-25 20:34:27,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 177/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 2.624742e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:27,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43446 samples/s/p 4:34:44 } +2024-07-25 20:34:30,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 179/ 1625], loss: 1.231, per_step_time: 1473ms, lr: 2.6243237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:30,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43052 samples/s/p 4:34:53 } +2024-07-25 20:34:33,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 181/ 1625], loss: 1.385, per_step_time: 1471ms, lr: 2.6239051e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:33,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43776 samples/s/p 4:34:28 } +2024-07-25 20:34:36,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 183/ 1625], loss: 1.328, per_step_time: 1471ms, lr: 2.6234866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:36,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43807 samples/s/p 4:34:24 } +2024-07-25 20:34:39,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 185/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.6230677e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:34:39,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43193 samples/s/p 4:34:40 } +2024-07-25 20:34:42,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 187/ 1625], loss: 1.128, per_step_time: 1474ms, lr: 2.6226486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:42,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.42466 samples/s/p 4:34:59 } +2024-07-25 20:34:45,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 189/ 1625], loss: 1.125, per_step_time: 1469ms, lr: 2.6222293e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:45,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.44517 samples/s/p 4:33:54 } +2024-07-25 20:34:48,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 191/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 2.6218097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:48,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.43305 samples/s/p 4:34:28 } +2024-07-25 20:34:51,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 193/ 1625], loss: 1.006, per_step_time: 1472ms, lr: 2.6213902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:51,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.43132 samples/s/p 4:34:30 } +2024-07-25 20:34:54,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 195/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 2.6209704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:54,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.43292 samples/s/p 
4:34:22 } +2024-07-25 20:34:56,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 197/ 1625], loss: 1.094, per_step_time: 1473ms, lr: 2.6205502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:56,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.43057 samples/s/p 4:34:26 } +2024-07-25 20:34:59,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 199/ 1625], loss: 1.157, per_step_time: 1474ms, lr: 2.6201298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:59,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.42385 samples/s/p 4:34:44 } +2024-07-25 20:35:02,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 201/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 2.6197094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:02,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.42994 samples/s/p 4:34:22 } +2024-07-25 20:35:05,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 203/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 2.6192887e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:05,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.42949 samples/s/p 4:34:21 } +2024-07-25 20:35:08,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 205/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 2.618868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:08,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43572 samples/s/p 4:33:59 } +2024-07-25 20:35:11,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 207/ 1625], loss: 1.182, per_step_time: 
1471ms, lr: 2.618447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:11,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43575 samples/s/p 4:33:56 } +2024-07-25 20:35:14,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 209/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.6180256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:14,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43802 samples/s/p 4:33:46 } +2024-07-25 20:35:17,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 211/ 1625], loss: 1.353, per_step_time: 1471ms, lr: 2.6176042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:17,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43704 samples/s/p 4:33:46 } +2024-07-25 20:35:20,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 213/ 1625], loss: 1.308, per_step_time: 1470ms, lr: 2.6171825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:20,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43982 samples/s/p 4:33:35 } +2024-07-25 20:35:23,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 215/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 2.6167607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:23,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43544 samples/s/p 4:33:45 } +2024-07-25 20:35:26,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 217/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.6163387e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:26,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% 
|███████████████ | 5.43343 samples/s/p 4:33:48 } +2024-07-25 20:35:29,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 219/ 1625], loss: 1.017, per_step_time: 1471ms, lr: 2.6159165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:29,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43635 samples/s/p 4:33:36 } +2024-07-25 20:35:32,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 221/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 2.615494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:32,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43700 samples/s/p 4:33:31 } +2024-07-25 20:35:35,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 223/ 1625], loss: 0.978, per_step_time: 1471ms, lr: 2.6150716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:35,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43828 samples/s/p 4:33:25 } +2024-07-25 20:35:38,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 225/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 2.6146485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:38,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.42956 samples/s/p 4:33:48 } +2024-07-25 20:35:41,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 227/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 2.6142256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:41,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43864 samples/s/p 4:33:18 } +2024-07-25 20:35:44,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 
229/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 2.6138026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:44,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43707 samples/s/p 4:33:20 } +2024-07-25 20:35:47,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 231/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.613379e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:47,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43747 samples/s/p 4:33:15 } +2024-07-25 20:35:50,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 233/ 1625], loss: 1.043, per_step_time: 1472ms, lr: 2.6129554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:50,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43253 samples/s/p 4:33:27 } +2024-07-25 20:35:53,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 235/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.6125317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:53,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43654 samples/s/p 4:33:12 } +2024-07-25 20:35:55,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 237/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 2.6121077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:55,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43652 samples/s/p 4:33:09 } +2024-07-25 20:35:58,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 239/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.6116835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:58,928 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43606 samples/s/p 4:33:08 } +2024-07-25 20:36:01,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 241/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.611259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:01,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43634 samples/s/p 4:33:04 } +2024-07-25 20:36:04,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 243/ 1625], loss: 1.141, per_step_time: 1473ms, lr: 2.6108346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:04,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.42960 samples/s/p 4:33:21 } +2024-07-25 20:36:07,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 245/ 1625], loss: 1.180, per_step_time: 1470ms, lr: 2.6104097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:07,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43876 samples/s/p 4:32:51 } +2024-07-25 20:36:10,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 247/ 1625], loss: 1.326, per_step_time: 1473ms, lr: 2.6099848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:10,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43101 samples/s/p 4:33:11 } +2024-07-25 20:36:13,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 249/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 2.6095595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:13,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.44103 samples/s/p 4:32:38 } +2024-07-25 20:36:16,633 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 251/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 2.6091344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:16,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43603 samples/s/p 4:32:50 } +2024-07-25 20:36:19,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 253/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 2.6087086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:19,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43778 samples/s/p 4:32:42 } +2024-07-25 20:36:22,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 255/ 1625], loss: 1.192, per_step_time: 1475ms, lr: 2.608283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:22,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.42340 samples/s/p 4:33:22 } +2024-07-25 20:36:25,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 257/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 2.607857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:25,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43794 samples/s/p 4:32:36 } +2024-07-25 20:36:28,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 259/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 2.6074307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:28,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.44193 samples/s/p 4:32:21 } +2024-07-25 20:36:31,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 261/ 1625], loss: 1.327, per_step_time: 1472ms, lr: 2.6070044e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:36:31,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43143 samples/s/p 4:32:49 } +2024-07-25 20:36:34,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 263/ 1625], loss: 1.043, per_step_time: 1473ms, lr: 2.6065778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:34,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.42747 samples/s/p 4:32:58 } +2024-07-25 20:36:37,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 265/ 1625], loss: 1.276, per_step_time: 1470ms, lr: 2.6061514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:37,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43861 samples/s/p 4:32:22 } +2024-07-25 20:36:40,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 267/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 2.6057243e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:40,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43634 samples/s/p 4:32:26 } +2024-07-25 20:36:43,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 269/ 1625], loss: 1.081, per_step_time: 1469ms, lr: 2.6052974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:43,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.44222 samples/s/p 4:32:05 } +2024-07-25 20:36:46,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 271/ 1625], loss: 1.017, per_step_time: 1473ms, lr: 2.6048701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:46,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43095 samples/s/p 
4:32:36 } +2024-07-25 20:36:49,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 273/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.6044425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:49,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43669 samples/s/p 4:32:16 } +2024-07-25 20:36:52,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 275/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 2.6040148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:52,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43678 samples/s/p 4:32:13 } +2024-07-25 20:36:54,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 277/ 1625], loss: 1.050, per_step_time: 1470ms, lr: 2.6035868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:54,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.44149 samples/s/p 4:31:56 } +2024-07-25 20:36:57,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 279/ 1625], loss: 1.148, per_step_time: 1474ms, lr: 2.6031588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:57,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.42666 samples/s/p 4:32:37 } +2024-07-25 20:37:00,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 281/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.6027305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:00,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43449 samples/s/p 4:32:11 } +2024-07-25 20:37:03,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 283/ 1625], loss: 1.271, 
per_step_time: 1472ms, lr: 2.6023019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:03,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43449 samples/s/p 4:32:08 } +2024-07-25 20:37:06,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 285/ 1625], loss: 1.024, per_step_time: 1472ms, lr: 2.6018733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:06,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43335 samples/s/p 4:32:08 } +2024-07-25 20:37:09,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 287/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.6014444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:09,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43188 samples/s/p 4:32:10 } +2024-07-25 20:37:12,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 289/ 1625], loss: 1.329, per_step_time: 1470ms, lr: 2.6010153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:12,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43979 samples/s/p 4:31:43 } +2024-07-25 20:37:15,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 291/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 2.600586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:15,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43078 samples/s/p 4:32:07 } +2024-07-25 20:37:18,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 293/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 2.6001566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:18,610 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 31.8% |███████████████ | 5.43118 samples/s/p 4:32:03 } +2024-07-25 20:37:21,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 295/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 2.599727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:21,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43587 samples/s/p 4:31:46 } +2024-07-25 20:37:24,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 297/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 2.5992971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:24,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43522 samples/s/p 4:31:45 } +2024-07-25 20:37:27,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 299/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.5988671e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:27,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43756 samples/s/p 4:31:35 } +2024-07-25 20:37:30,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 301/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.5984367e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:30,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43474 samples/s/p 4:31:41 } +2024-07-25 20:37:33,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 303/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 2.5980064e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:33,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43205 samples/s/p 4:31:46 } +2024-07-25 20:37:36,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 
10], step:[ 305/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 2.5975756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:36,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43603 samples/s/p 4:31:31 } +2024-07-25 20:37:39,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 307/ 1625], loss: 1.409, per_step_time: 1473ms, lr: 2.5971449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:39,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.42990 samples/s/p 4:31:46 } +2024-07-25 20:37:42,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 309/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.596714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:42,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43669 samples/s/p 4:31:23 } +2024-07-25 20:37:45,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 311/ 1625], loss: 1.245, per_step_time: 1470ms, lr: 2.5962827e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:45,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43961 samples/s/p 4:31:11 } +2024-07-25 20:37:48,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 313/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 2.5958512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:48,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43620 samples/s/p 4:31:19 } +2024-07-25 20:37:51,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 315/ 1625], loss: 1.389, per_step_time: 1471ms, lr: 2.5954198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:51,068 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43503 samples/s/p 4:31:19 } +2024-07-25 20:37:54,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 317/ 1625], loss: 0.957, per_step_time: 1471ms, lr: 2.594988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:54,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.43479 samples/s/p 4:31:17 } +2024-07-25 20:37:56,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 319/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 2.594556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:56,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.43711 samples/s/p 4:31:07 } +2024-07-25 20:37:59,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 321/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 2.594124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:59,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.43173 samples/s/p 4:31:20 } +2024-07-25 20:38:02,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 323/ 1625], loss: 1.226, per_step_time: 1470ms, lr: 2.5936914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:02,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.44055 samples/s/p 4:30:51 } +2024-07-25 20:38:05,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 325/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 2.5932592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:05,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.43711 samples/s/p 4:30:58 } +2024-07-25 20:38:08,767 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 327/ 1625], loss: 1.130, per_step_time: 1470ms, lr: 2.5928262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:08,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.44194 samples/s/p 4:30:41 } +2024-07-25 20:38:11,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 329/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 2.5923935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:11,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.43320 samples/s/p 4:31:04 } +2024-07-25 20:38:14,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 331/ 1625], loss: 1.187, per_step_time: 1470ms, lr: 2.5919602e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:14,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.43921 samples/s/p 4:30:43 } +2024-07-25 20:38:17,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 333/ 1625], loss: 1.221, per_step_time: 1469ms, lr: 2.591527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:17,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.44470 samples/s/p 4:30:24 } +2024-07-25 20:38:20,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 335/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 2.5910935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:20,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43309 samples/s/p 4:30:55 } +2024-07-25 20:38:23,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 337/ 1625], loss: 1.077, per_step_time: 1471ms, lr: 2.5906598e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:23,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43670 samples/s/p 4:30:42 } +2024-07-25 20:38:26,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 339/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 2.5902258e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:26,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43581 samples/s/p 4:30:41 } +2024-07-25 20:38:29,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 341/ 1625], loss: 1.068, per_step_time: 1472ms, lr: 2.5897916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:29,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43160 samples/s/p 4:30:51 } +2024-07-25 20:38:32,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 343/ 1625], loss: 0.974, per_step_time: 1470ms, lr: 2.5893574e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:32,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.44032 samples/s/p 4:30:22 } +2024-07-25 20:38:35,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 345/ 1625], loss: 1.065, per_step_time: 1472ms, lr: 2.5889229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:35,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43446 samples/s/p 4:30:37 } +2024-07-25 20:38:38,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 347/ 1625], loss: 1.033, per_step_time: 1472ms, lr: 2.5884883e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:38,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 
5.43292 samples/s/p 4:30:38 } +2024-07-25 20:38:41,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 349/ 1625], loss: 1.139, per_step_time: 1473ms, lr: 2.5880534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:41,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.42993 samples/s/p 4:30:44 } +2024-07-25 20:38:44,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 351/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.5876187e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:44,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43509 samples/s/p 4:30:26 } +2024-07-25 20:38:47,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 353/ 1625], loss: 1.186, per_step_time: 1475ms, lr: 2.5871832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:47,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.42276 samples/s/p 4:31:00 } +2024-07-25 20:38:50,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 355/ 1625], loss: 1.323, per_step_time: 1472ms, lr: 2.5867479e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:50,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43283 samples/s/p 4:30:27 } +2024-07-25 20:38:53,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 357/ 1625], loss: 1.193, per_step_time: 1470ms, lr: 2.5863124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:53,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.44079 samples/s/p 4:30:00 } +2024-07-25 20:38:55,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 359/ 1625], 
loss: 1.200, per_step_time: 1471ms, lr: 2.5858766e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:55,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43589 samples/s/p 4:30:12 } +2024-07-25 20:38:58,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 361/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 2.5854404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:58,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43584 samples/s/p 4:30:09 } +2024-07-25 20:39:01,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 363/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.5850044e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:01,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43538 samples/s/p 4:30:07 } +2024-07-25 20:39:04,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 365/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 2.5845678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:04,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43726 samples/s/p 4:29:59 } +2024-07-25 20:39:07,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 367/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 2.5841315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:07,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43614 samples/s/p 4:29:59 } +2024-07-25 20:39:10,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 369/ 1625], loss: 1.177, per_step_time: 1469ms, lr: 2.5836945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:10,732 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.44271 samples/s/p 4:29:37 } +2024-07-25 20:39:13,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 371/ 1625], loss: 1.035, per_step_time: 1472ms, lr: 2.5832576e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:13,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43384 samples/s/p 4:30:00 } +2024-07-25 20:39:16,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 373/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.5828205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:16,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43351 samples/s/p 4:29:58 } +2024-07-25 20:39:19,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 375/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.5823832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:19,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43290 samples/s/p 4:29:57 } +2024-07-25 20:39:22,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 377/ 1625], loss: 0.949, per_step_time: 1468ms, lr: 2.5819456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:22,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.44601 samples/s/p 4:29:15 } +2024-07-25 20:39:25,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 379/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 2.581508e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:25,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43056 samples/s/p 4:29:58 } +2024-07-25 20:39:28,436 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 381/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 2.58107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:28,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43620 samples/s/p 4:29:38 } +2024-07-25 20:39:31,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 383/ 1625], loss: 1.367, per_step_time: 1472ms, lr: 2.580632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:31,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43208 samples/s/p 4:29:48 } +2024-07-25 20:39:34,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 385/ 1625], loss: 1.238, per_step_time: 1470ms, lr: 2.5801935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:34,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.44031 samples/s/p 4:29:20 } +2024-07-25 20:39:37,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 387/ 1625], loss: 1.083, per_step_time: 1470ms, lr: 2.5797552e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:37,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.44196 samples/s/p 4:29:13 } +2024-07-25 20:39:40,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 389/ 1625], loss: 1.197, per_step_time: 1475ms, lr: 2.5793164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:40,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.42182 samples/s/p 4:30:10 } +2024-07-25 20:39:43,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 391/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 2.5788773e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:43,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43461 samples/s/p 4:29:28 } +2024-07-25 20:39:46,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 393/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 2.5784384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:46,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43374 samples/s/p 4:29:28 } +2024-07-25 20:39:49,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 395/ 1625], loss: 1.324, per_step_time: 1472ms, lr: 2.5779993e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:49,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43222 samples/s/p 4:29:30 } +2024-07-25 20:39:52,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 397/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 2.5775596e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:52,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43236 samples/s/p 4:29:26 } +2024-07-25 20:39:55,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 399/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 2.5771202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:55,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43567 samples/s/p 4:29:14 } +2024-07-25 20:39:57,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 401/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.5766803e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:57,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 
5.43178 samples/s/p 4:29:22 } +2024-07-25 20:40:00,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 403/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.5762403e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:00,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43256 samples/s/p 4:29:17 } +2024-07-25 20:40:03,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 405/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 2.5758001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:03,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43762 samples/s/p 4:28:59 } +2024-07-25 20:40:06,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 407/ 1625], loss: 1.285, per_step_time: 1473ms, lr: 2.57536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:06,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43010 samples/s/p 4:29:18 } +2024-07-25 20:40:09,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 409/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.5749192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:09,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43714 samples/s/p 4:28:54 } +2024-07-25 20:40:12,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 411/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.5744786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:12,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43757 samples/s/p 4:28:50 } +2024-07-25 20:40:15,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 413/ 1625], 
loss: 1.131, per_step_time: 1473ms, lr: 2.5740377e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:15,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.42825 samples/s/p 4:29:15 } +2024-07-25 20:40:18,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 415/ 1625], loss: 1.131, per_step_time: 1470ms, lr: 2.5735966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:18,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43900 samples/s/p 4:28:40 } +2024-07-25 20:40:21,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 417/ 1625], loss: 1.315, per_step_time: 1471ms, lr: 2.5731553e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:21,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43665 samples/s/p 4:28:44 } +2024-07-25 20:40:24,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 419/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 2.5727139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:24,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43724 samples/s/p 4:28:39 } +2024-07-25 20:40:27,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 421/ 1625], loss: 1.060, per_step_time: 1472ms, lr: 2.572272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:27,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43372 samples/s/p 4:28:47 } +2024-07-25 20:40:30,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 423/ 1625], loss: 1.060, per_step_time: 1473ms, lr: 2.5718302e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:30,416 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43108 samples/s/p 4:28:52 } +2024-07-25 20:40:33,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 425/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.571388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:33,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43488 samples/s/p 4:28:38 } +2024-07-25 20:40:36,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 427/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 2.5709458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:36,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43083 samples/s/p 4:28:47 } +2024-07-25 20:40:39,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 429/ 1625], loss: 1.340, per_step_time: 1471ms, lr: 2.5705032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:39,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43756 samples/s/p 4:28:24 } +2024-07-25 20:40:42,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 431/ 1625], loss: 1.210, per_step_time: 1474ms, lr: 2.5700607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:42,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.42699 samples/s/p 4:28:52 } +2024-07-25 20:40:45,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 433/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.5696178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:45,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43648 samples/s/p 4:28:21 } +2024-07-25 20:40:48,128 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 435/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.5691748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:48,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43244 samples/s/p 4:28:30 } +2024-07-25 20:40:51,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 437/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 2.5687315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:51,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43238 samples/s/p 4:28:27 } +2024-07-25 20:40:54,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 439/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 2.5682884e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:54,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43551 samples/s/p 4:28:15 } +2024-07-25 20:40:56,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 441/ 1625], loss: 1.161, per_step_time: 1470ms, lr: 2.5678448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:56,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43936 samples/s/p 4:28:01 } +2024-07-25 20:40:59,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 443/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 2.5674008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:59,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43870 samples/s/p 4:28:00 } +2024-07-25 20:41:02,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 445/ 1625], loss: 1.059, per_step_time: 1472ms, lr: 2.5669571e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:02,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43271 samples/s/p 4:28:15 } +2024-07-25 20:41:05,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 447/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 2.5665127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:05,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43613 samples/s/p 4:28:02 } +2024-07-25 20:41:08,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 449/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 2.5660685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:08,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43931 samples/s/p 4:27:49 } +2024-07-25 20:41:11,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 451/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 2.565624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:11,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43352 samples/s/p 4:28:03 } +2024-07-25 20:41:14,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 453/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.5651794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:14,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43798 samples/s/p 4:27:47 } +2024-07-25 20:41:17,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 455/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 2.5647345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:17,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 
5.43576 samples/s/p 4:27:51 } +2024-07-25 20:41:20,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 457/ 1625], loss: 1.050, per_step_time: 1472ms, lr: 2.5642892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:20,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43234 samples/s/p 4:27:58 } +2024-07-25 20:41:23,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 459/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.563844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:23,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43745 samples/s/p 4:27:40 } +2024-07-25 20:41:26,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 461/ 1625], loss: 1.362, per_step_time: 1472ms, lr: 2.5633986e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:26,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43357 samples/s/p 4:27:48 } +2024-07-25 20:41:29,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 463/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 2.562953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:29,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43717 samples/s/p 4:27:35 } +2024-07-25 20:41:32,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 465/ 1625], loss: 1.100, per_step_time: 1470ms, lr: 2.5625071e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:32,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43965 samples/s/p 4:27:25 } +2024-07-25 20:41:35,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 467/ 1625], 
loss: 1.282, per_step_time: 1469ms, lr: 2.5620611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:35,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.44330 samples/s/p 4:27:11 } +2024-07-25 20:41:38,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 469/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 2.561615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:38,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43028 samples/s/p 4:27:46 } +2024-07-25 20:41:41,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 471/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 2.5611685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:41,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43715 samples/s/p 4:27:23 } +2024-07-25 20:41:44,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 473/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.5607218e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:44,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43493 samples/s/p 4:27:27 } +2024-07-25 20:41:47,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 475/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 2.560275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:47,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43291 samples/s/p 4:27:30 } +2024-07-25 20:41:50,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 477/ 1625], loss: 0.968, per_step_time: 1471ms, lr: 2.5598283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:50,086 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43808 samples/s/p 4:27:12 } +2024-07-25 20:41:53,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 479/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.559381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:53,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43275 samples/s/p 4:27:24 } +2024-07-25 20:41:55,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 481/ 1625], loss: 1.331, per_step_time: 1472ms, lr: 2.5589337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:55,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43312 samples/s/p 4:27:20 } +2024-07-25 20:41:58,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 483/ 1625], loss: 0.845, per_step_time: 1472ms, lr: 2.5584863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:58,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43440 samples/s/p 4:27:14 } +2024-07-25 20:42:01,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 485/ 1625], loss: 1.327, per_step_time: 1472ms, lr: 2.5580384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:01,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43398 samples/s/p 4:27:12 } +2024-07-25 20:42:04,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 487/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.5575904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:04,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43679 samples/s/p 4:27:01 } +2024-07-25 20:42:07,794 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 489/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.5571424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:07,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43488 samples/s/p 4:27:03 } +2024-07-25 20:42:10,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 491/ 1625], loss: 0.914, per_step_time: 1470ms, lr: 2.5566942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:10,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43900 samples/s/p 4:26:48 } +2024-07-25 20:42:13,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 493/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 2.5562456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:13,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43624 samples/s/p 4:26:54 } +2024-07-25 20:42:16,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 495/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.5557973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:16,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43410 samples/s/p 4:26:57 } +2024-07-25 20:42:19,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 497/ 1625], loss: 1.239, per_step_time: 1470ms, lr: 2.5553481e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:19,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.44116 samples/s/p 4:26:33 } +2024-07-25 20:42:22,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 499/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 2.5548994e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:22,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.43848 samples/s/p 4:26:38 } +2024-07-25 20:42:25,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 501/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 2.5544505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:25,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.43457 samples/s/p 4:26:47 } +2024-07-25 20:42:28,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 503/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.554001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:28,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.44012 samples/s/p 4:26:27 } +2024-07-25 20:42:31,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 505/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 2.5535512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:31,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.43303 samples/s/p 4:26:45 } +2024-07-25 20:42:34,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 507/ 1625], loss: 1.000, per_step_time: 1473ms, lr: 2.5531017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:34,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.42994 samples/s/p 4:26:51 } +2024-07-25 20:42:37,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 509/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 2.5526517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:37,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 
5.43176 samples/s/p 4:26:43 } +2024-07-25 20:42:40,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 511/ 1625], loss: 1.144, per_step_time: 1473ms, lr: 2.5522017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:40,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.43035 samples/s/p 4:26:44 } +2024-07-25 20:42:43,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 513/ 1625], loss: 1.081, per_step_time: 1470ms, lr: 2.5517515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:43,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43960 samples/s/p 4:26:14 } +2024-07-25 20:42:46,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 515/ 1625], loss: 1.039, per_step_time: 1470ms, lr: 2.5513009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:46,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43851 samples/s/p 4:26:14 } +2024-07-25 20:42:49,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 517/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 2.5508501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:49,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43268 samples/s/p 4:26:29 } +2024-07-25 20:42:52,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 519/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.5503994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:52,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43431 samples/s/p 4:26:21 } +2024-07-25 20:42:55,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 521/ 1625], 
loss: 1.062, per_step_time: 1469ms, lr: 2.5499483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:55,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.44236 samples/s/p 4:25:54 } +2024-07-25 20:42:57,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 523/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.5494972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:57,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43425 samples/s/p 4:26:15 } +2024-07-25 20:43:00,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 525/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 2.5490457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:00,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43258 samples/s/p 4:26:17 } +2024-07-25 20:43:03,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 527/ 1625], loss: 1.051, per_step_time: 1473ms, lr: 2.548594e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:03,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43047 samples/s/p 4:26:20 } +2024-07-25 20:43:06,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 529/ 1625], loss: 1.331, per_step_time: 1470ms, lr: 2.5481426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:06,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43886 samples/s/p 4:25:53 } +2024-07-25 20:43:09,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 531/ 1625], loss: 1.348, per_step_time: 1471ms, lr: 2.5476902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:09,783 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43818 samples/s/p 4:25:52 } +2024-07-25 20:43:12,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 533/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.5472384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:12,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43698 samples/s/p 4:25:52 } +2024-07-25 20:43:15,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 535/ 1625], loss: 1.051, per_step_time: 1470ms, lr: 2.5467862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:15,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43958 samples/s/p 4:25:42 } +2024-07-25 20:43:18,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 537/ 1625], loss: 1.013, per_step_time: 1471ms, lr: 2.5463336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:18,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43584 samples/s/p 4:25:50 } +2024-07-25 20:43:21,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 539/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 2.5458809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:21,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43718 samples/s/p 4:25:43 } +2024-07-25 20:43:24,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 541/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.545428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:24,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43405 samples/s/p 4:25:49 } +2024-07-25 20:43:27,482 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 543/ 1625], loss: 1.039, per_step_time: 1470ms, lr: 2.544975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:27,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43903 samples/s/p 4:25:32 } +2024-07-25 20:43:30,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 545/ 1625], loss: 1.357, per_step_time: 1473ms, lr: 2.5445217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:30,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.42964 samples/s/p 4:25:56 } +2024-07-25 20:43:33,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 547/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 2.5440682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:33,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43287 samples/s/p 4:25:44 } +2024-07-25 20:43:36,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 549/ 1625], loss: 1.143, per_step_time: 1473ms, lr: 2.5436146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:36,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43008 samples/s/p 4:25:49 } +2024-07-25 20:43:39,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 551/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 2.543161e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:39,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43623 samples/s/p 4:25:28 } +2024-07-25 20:43:42,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 553/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 2.5427067e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:42,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43150 samples/s/p 4:25:39 } +2024-07-25 20:43:45,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 555/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.5422527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:45,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43758 samples/s/p 4:25:18 } +2024-07-25 20:43:48,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 557/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 2.5417983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:48,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43561 samples/s/p 4:25:21 } +2024-07-25 20:43:51,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 559/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 2.5413437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:51,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43039 samples/s/p 4:25:34 } +2024-07-25 20:43:54,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 561/ 1625], loss: 1.231, per_step_time: 1469ms, lr: 2.540889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:54,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.44321 samples/s/p 4:24:53 } +2024-07-25 20:43:57,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 563/ 1625], loss: 1.052, per_step_time: 1473ms, lr: 2.540434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:57,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 
5.42794 samples/s/p 4:25:35 } +2024-07-25 20:43:59,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 565/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.5399791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:59,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.43297 samples/s/p 4:25:17 } +2024-07-25 20:44:02,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 567/ 1625], loss: 1.009, per_step_time: 1473ms, lr: 2.5395238e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:02,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.43014 samples/s/p 4:25:22 } +2024-07-25 20:44:05,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 569/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.5390684e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:05,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.43480 samples/s/p 4:25:06 } +2024-07-25 20:44:08,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 571/ 1625], loss: 1.050, per_step_time: 1470ms, lr: 2.5386127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:08,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.44044 samples/s/p 4:24:46 } +2024-07-25 20:44:11,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 573/ 1625], loss: 1.245, per_step_time: 1471ms, lr: 2.5381569e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:11,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.43560 samples/s/p 4:24:58 } +2024-07-25 20:44:14,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 575/ 1625], 
loss: 1.235, per_step_time: 1471ms, lr: 2.5377009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:14,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.43480 samples/s/p 4:24:57 } +2024-07-25 20:44:17,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 577/ 1625], loss: 1.130, per_step_time: 1470ms, lr: 2.5372448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:17,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43859 samples/s/p 4:24:43 } +2024-07-25 20:44:20,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 579/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 2.5367885e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:20,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43933 samples/s/p 4:24:38 } +2024-07-25 20:44:23,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 581/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.5363319e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:23,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43578 samples/s/p 4:24:45 } +2024-07-25 20:44:26,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 583/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.5358753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:26,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43393 samples/s/p 4:24:48 } +2024-07-25 20:44:29,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 585/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 2.5354186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:29,459 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43509 samples/s/p 4:24:41 } +2024-07-25 20:44:32,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 587/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 2.5349613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:32,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43356 samples/s/p 4:24:43 } +2024-07-25 20:44:35,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 589/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.5345042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:35,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43212 samples/s/p 4:24:44 } +2024-07-25 20:44:38,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 591/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 2.5340469e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:38,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43147 samples/s/p 4:24:43 } +2024-07-25 20:44:41,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 593/ 1625], loss: 1.069, per_step_time: 1473ms, lr: 2.533589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:41,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.42949 samples/s/p 4:24:46 } +2024-07-25 20:44:44,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 595/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 2.5331314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:44,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43159 samples/s/p 4:24:37 } +2024-07-25 20:44:47,171 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 597/ 1625], loss: 1.238, per_step_time: 1470ms, lr: 2.5326734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:47,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.44000 samples/s/p 4:24:09 } +2024-07-25 20:44:50,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 599/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.5322151e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:50,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43365 samples/s/p 4:24:25 } +2024-07-25 20:44:53,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 601/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 2.5317566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:53,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.44052 samples/s/p 4:24:02 } +2024-07-25 20:44:56,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 603/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.531298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:56,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43969 samples/s/p 4:24:02 } +2024-07-25 20:44:58,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 605/ 1625], loss: 1.079, per_step_time: 1472ms, lr: 2.5308394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:58,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43413 samples/s/p 4:24:15 } +2024-07-25 20:45:01,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 607/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.5303805e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:01,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43773 samples/s/p 4:24:01 } +2024-07-25 20:45:04,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 609/ 1625], loss: 1.196, per_step_time: 1470ms, lr: 2.5299214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:04,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43862 samples/s/p 4:23:56 } +2024-07-25 20:45:07,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 611/ 1625], loss: 1.042, per_step_time: 1471ms, lr: 2.5294623e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:07,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.43528 samples/s/p 4:24:03 } +2024-07-25 20:45:10,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 613/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 2.5290028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:10,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.43260 samples/s/p 4:24:08 } +2024-07-25 20:45:13,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 615/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 2.5285432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:13,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.43825 samples/s/p 4:23:48 } +2024-07-25 20:45:16,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 617/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 2.5280837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:16,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 
5.44049 samples/s/p 4:23:39 } +2024-07-25 20:45:19,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 619/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 2.5276235e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:19,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.43601 samples/s/p 4:23:49 } +2024-07-25 20:45:22,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 621/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 2.527163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:22,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.43924 samples/s/p 4:23:36 } +2024-07-25 20:45:25,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 623/ 1625], loss: 1.220, per_step_time: 1469ms, lr: 2.526703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:25,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.44463 samples/s/p 4:23:18 } +2024-07-25 20:45:28,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 625/ 1625], loss: 1.311, per_step_time: 1469ms, lr: 2.5262425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:28,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.44510 samples/s/p 4:23:14 } +2024-07-25 20:45:31,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 627/ 1625], loss: 1.193, per_step_time: 1471ms, lr: 2.525782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:31,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.43761 samples/s/p 4:23:32 } +2024-07-25 20:45:34,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 629/ 1625], 
loss: 1.081, per_step_time: 1473ms, lr: 2.525321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:34,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.42781 samples/s/p 4:23:58 } +2024-07-25 20:45:37,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 631/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 2.52486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:37,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.43566 samples/s/p 4:23:32 } +2024-07-25 20:45:40,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 633/ 1625], loss: 1.220, per_step_time: 1473ms, lr: 2.5243986e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:40,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.42878 samples/s/p 4:23:49 } +2024-07-25 20:45:43,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 635/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 2.5239373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:43,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.43849 samples/s/p 4:23:18 } +2024-07-25 20:45:46,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 637/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 2.5234756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:46,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.44064 samples/s/p 4:23:09 } +2024-07-25 20:45:49,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 639/ 1625], loss: 1.307, per_step_time: 1470ms, lr: 2.523014e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:49,114 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.44067 samples/s/p 4:23:06 } +2024-07-25 20:45:52,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 641/ 1625], loss: 1.284, per_step_time: 1474ms, lr: 2.522552e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:52,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.42636 samples/s/p 4:23:44 } +2024-07-25 20:45:55,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 643/ 1625], loss: 0.997, per_step_time: 1473ms, lr: 2.5220897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:55,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.42890 samples/s/p 4:23:34 } +2024-07-25 20:45:57,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 645/ 1625], loss: 1.323, per_step_time: 1473ms, lr: 2.5216274e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:57,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.43083 samples/s/p 4:23:26 } +2024-07-25 20:46:00,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 647/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.521165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:00,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.43367 samples/s/p 4:23:14 } +2024-07-25 20:46:03,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 649/ 1625], loss: 1.322, per_step_time: 1472ms, lr: 2.5207022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:03,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.43194 samples/s/p 4:23:16 } +2024-07-25 20:46:06,829 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 651/ 1625], loss: 1.077, per_step_time: 1470ms, lr: 2.5202393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:06,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.44018 samples/s/p 4:22:50 } +2024-07-25 20:46:09,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 653/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.5197764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:09,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.43129 samples/s/p 4:23:12 } +2024-07-25 20:46:12,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 655/ 1625], loss: 1.119, per_step_time: 1470ms, lr: 2.519313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:12,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.44011 samples/s/p 4:22:44 } +2024-07-25 20:46:15,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 657/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 2.5188498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:15,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.44126 samples/s/p 4:22:38 } +2024-07-25 20:46:18,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 659/ 1625], loss: 1.206, per_step_time: 1472ms, lr: 2.5183861e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:18,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43473 samples/s/p 4:22:54 } +2024-07-25 20:46:21,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 661/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.5179223e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:21,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43566 samples/s/p 4:22:48 } +2024-07-25 20:46:24,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 663/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 2.5174584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:24,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43878 samples/s/p 4:22:36 } +2024-07-25 20:46:27,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 665/ 1625], loss: 1.260, per_step_time: 1470ms, lr: 2.5169942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:27,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.44111 samples/s/p 4:22:26 } +2024-07-25 20:46:30,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 667/ 1625], loss: 1.393, per_step_time: 1471ms, lr: 2.51653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:30,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43503 samples/s/p 4:22:41 } +2024-07-25 20:46:33,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 669/ 1625], loss: 1.207, per_step_time: 1473ms, lr: 2.5160656e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:33,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43074 samples/s/p 4:22:50 } +2024-07-25 20:46:36,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 671/ 1625], loss: 1.085, per_step_time: 1473ms, lr: 2.5156009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:36,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 
5.42776 samples/s/p 4:22:56 } +2024-07-25 20:46:39,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 673/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.5151363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:39,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43367 samples/s/p 4:22:36 } +2024-07-25 20:46:42,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 675/ 1625], loss: 1.232, per_step_time: 1470ms, lr: 2.5146714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:42,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43986 samples/s/p 4:22:15 } +2024-07-25 20:46:45,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 677/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 2.514206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:45,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43744 samples/s/p 4:22:19 } +2024-07-25 20:46:48,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 679/ 1625], loss: 1.325, per_step_time: 1473ms, lr: 2.5137408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:48,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.42988 samples/s/p 4:22:38 } +2024-07-25 20:46:51,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 681/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 2.5132751e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:51,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43836 samples/s/p 4:22:11 } +2024-07-25 20:46:54,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 683/ 
1625], loss: 1.275, per_step_time: 1473ms, lr: 2.5128094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:54,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.42782 samples/s/p 4:22:38 } +2024-07-25 20:46:56,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 685/ 1625], loss: 0.983, per_step_time: 1472ms, lr: 2.5123436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:56,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43286 samples/s/p 4:22:21 } +2024-07-25 20:46:59,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 687/ 1625], loss: 1.293, per_step_time: 1472ms, lr: 2.5118774e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:59,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43208 samples/s/p 4:22:20 } +2024-07-25 20:47:02,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 689/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 2.5114114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:02,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43892 samples/s/p 4:21:57 } +2024-07-25 20:47:05,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 691/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 2.510945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:05,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43503 samples/s/p 4:22:06 } +2024-07-25 20:47:08,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 693/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 2.5104782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:08,798 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43411 samples/s/p 4:22:05 } +2024-07-25 20:47:11,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 695/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 2.5100115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:11,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43161 samples/s/p 4:22:10 } +2024-07-25 20:47:14,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 697/ 1625], loss: 1.333, per_step_time: 1471ms, lr: 2.5095445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:14,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43618 samples/s/p 4:21:53 } +2024-07-25 20:47:17,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 699/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 2.5090774e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:17,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43644 samples/s/p 4:21:50 } +2024-07-25 20:47:20,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 701/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 2.50861e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:20,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43533 samples/s/p 4:21:50 } +2024-07-25 20:47:23,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 703/ 1625], loss: 1.254, per_step_time: 1470ms, lr: 2.5081426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:23,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43937 samples/s/p 4:21:35 } +2024-07-25 20:47:26,500 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 705/ 1625], loss: 1.310, per_step_time: 1471ms, lr: 2.5076748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:26,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43581 samples/s/p 4:21:43 } +2024-07-25 20:47:29,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 707/ 1625], loss: 0.862, per_step_time: 1472ms, lr: 2.5072073e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:29,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43430 samples/s/p 4:21:44 } +2024-07-25 20:47:32,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 709/ 1625], loss: 1.267, per_step_time: 1474ms, lr: 2.5067391e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:32,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.42719 samples/s/p 4:22:02 } +2024-07-25 20:47:35,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 711/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 2.506271e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:35,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43913 samples/s/p 4:21:24 } +2024-07-25 20:47:38,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 713/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.5058027e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:38,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.42920 samples/s/p 4:21:50 } +2024-07-25 20:47:41,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 715/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 2.5053341e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:41,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43412 samples/s/p 4:21:33 } +2024-07-25 20:47:44,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 717/ 1625], loss: 1.304, per_step_time: 1471ms, lr: 2.5048654e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:44,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43712 samples/s/p 4:21:21 } +2024-07-25 20:47:47,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 719/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.5043966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:47,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.42974 samples/s/p 4:21:40 } +2024-07-25 20:47:50,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 721/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 2.5039275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:50,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43255 samples/s/p 4:21:29 } +2024-07-25 20:47:53,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 723/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 2.5034584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:53,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43235 samples/s/p 4:21:26 } +2024-07-25 20:47:56,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 725/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.5029889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:56,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ 
| 5.42954 samples/s/p 4:21:31 } +2024-07-25 20:47:56,025 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-25 20:48:31,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 727/ 1625], loss: 1.002, per_step_time: 2123ms, lr: 2.5025192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:31,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 3.76667 samples/s/p 6:16:55 } +2024-07-25 20:48:34,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 729/ 1625], loss: 0.904, per_step_time: 1471ms, lr: 2.5020494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:34,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43479 samples/s/p 4:21:10 } +2024-07-25 20:48:37,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 731/ 1625], loss: 1.289, per_step_time: 1470ms, lr: 2.5015794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:37,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.44085 samples/s/p 4:20:50 } +2024-07-25 20:48:40,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 733/ 1625], loss: 1.201, per_step_time: 1471ms, lr: 2.5011092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:40,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43484 samples/s/p 4:21:04 } +2024-07-25 20:48:42,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 735/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.5006391e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:42,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43614 samples/s/p 4:20:58 } 
+2024-07-25 20:48:45,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 737/ 1625], loss: 1.286, per_step_time: 1471ms, lr: 2.5001686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:45,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43527 samples/s/p 4:20:57 } +2024-07-25 20:48:48,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 739/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 2.4996976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:48,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43584 samples/s/p 4:20:53 } +2024-07-25 20:48:51,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 741/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 2.499227e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:51,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43351 samples/s/p 4:20:56 } +2024-07-25 20:48:54,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 743/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 2.498756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:54,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.44032 samples/s/p 4:20:34 } +2024-07-25 20:48:57,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 745/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 2.4982848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:57,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43182 samples/s/p 4:20:55 } +2024-07-25 20:49:00,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 747/ 1625], loss: 1.195, per_step_time: 
1471ms, lr: 2.4978135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:00,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43829 samples/s/p 4:20:34 } +2024-07-25 20:49:03,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 749/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 2.4973418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:03,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43682 samples/s/p 4:20:35 } +2024-07-25 20:49:06,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 751/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 2.4968702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:06,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43801 samples/s/p 4:20:29 } +2024-07-25 20:49:09,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 753/ 1625], loss: 1.045, per_step_time: 1473ms, lr: 2.4963983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:09,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.42941 samples/s/p 4:20:51 } +2024-07-25 20:49:12,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 755/ 1625], loss: 0.919, per_step_time: 1471ms, lr: 2.4959261e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:12,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43684 samples/s/p 4:20:26 } +2024-07-25 20:49:15,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 757/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 2.495454e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:15,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
34.7% |█████████████████ | 5.42783 samples/s/p 4:20:49 } +2024-07-25 20:49:18,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 759/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 2.4949815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:18,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.43753 samples/s/p 4:20:18 } +2024-07-25 20:49:21,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 761/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 2.4945093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:21,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.44078 samples/s/p 4:20:06 } +2024-07-25 20:49:24,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 763/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 2.4940364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:25,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.43715 samples/s/p 4:20:14 } +2024-07-25 20:49:28,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 765/ 1625], loss: 1.161, per_step_time: 1468ms, lr: 2.4935633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:28,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.44599 samples/s/p 4:19:45 } +2024-07-25 20:49:30,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 767/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 2.4930905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:30,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.43603 samples/s/p 4:20:11 } +2024-07-25 20:49:33,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 4/ 10], step:[ 769/ 1625], loss: 1.214, per_step_time: 1470ms, lr: 2.4926172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:33,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.43993 samples/s/p 4:19:57 } +2024-07-25 20:49:36,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 771/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 2.4921437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:36,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.43485 samples/s/p 4:20:08 } +2024-07-25 20:49:39,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 773/ 1625], loss: 1.381, per_step_time: 1471ms, lr: 2.49167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:39,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43576 samples/s/p 4:20:03 } +2024-07-25 20:49:42,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 775/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.4911962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:42,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43369 samples/s/p 4:20:06 } +2024-07-25 20:49:45,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 777/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.4907225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:45,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43751 samples/s/p 4:19:52 } +2024-07-25 20:49:48,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 779/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 2.4902482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:48,681 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43341 samples/s/p 4:20:01 } +2024-07-25 20:49:51,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 781/ 1625], loss: 1.067, per_step_time: 1471ms, lr: 2.4897738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:51,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43631 samples/s/p 4:19:49 } +2024-07-25 20:49:54,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 783/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 2.4892994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:54,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43635 samples/s/p 4:19:46 } +2024-07-25 20:49:57,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 785/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 2.4888246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:57,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43951 samples/s/p 4:19:34 } +2024-07-25 20:50:00,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 787/ 1625], loss: 1.217, per_step_time: 1473ms, lr: 2.4883499e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:00,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43032 samples/s/p 4:19:58 } +2024-07-25 20:50:03,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 789/ 1625], loss: 1.126, per_step_time: 1470ms, lr: 2.4878751e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:03,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.44106 samples/s/p 4:19:24 } +2024-07-25 20:50:06,380 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 791/ 1625], loss: 1.425, per_step_time: 1471ms, lr: 2.4873994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:06,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.43715 samples/s/p 4:19:32 } +2024-07-25 20:50:09,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 793/ 1625], loss: 1.053, per_step_time: 1473ms, lr: 2.4869241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:09,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.42867 samples/s/p 4:19:54 } +2024-07-25 20:50:12,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 795/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.486449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:12,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.43828 samples/s/p 4:19:23 } +2024-07-25 20:50:16,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 797/ 1625], loss: 1.012, per_step_time: 1863ms, lr: 2.4859732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:16,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 4.29208 samples/s/p 5:28:36 } +2024-07-25 20:50:18,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 799/ 1625], loss: 1.219, per_step_time: 1469ms, lr: 2.4854971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:18,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.44237 samples/s/p 4:19:06 } +2024-07-25 20:50:21,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 801/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.4850215e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:21,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.43443 samples/s/p 4:19:25 } +2024-07-25 20:50:24,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 803/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.484545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:24,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.43363 samples/s/p 4:19:25 } +2024-07-25 20:50:27,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 805/ 1625], loss: 1.381, per_step_time: 1471ms, lr: 2.4840687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:27,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.43668 samples/s/p 4:19:13 } +2024-07-25 20:50:30,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 807/ 1625], loss: 1.324, per_step_time: 1474ms, lr: 2.4835923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:30,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.42505 samples/s/p 4:19:44 } +2024-07-25 20:50:33,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 809/ 1625], loss: 1.281, per_step_time: 1473ms, lr: 2.4831155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:33,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.42957 samples/s/p 4:19:28 } +2024-07-25 20:50:36,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 811/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.4826384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:36,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 
5.42920 samples/s/p 4:19:26 } +2024-07-25 20:50:39,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 813/ 1625], loss: 1.053, per_step_time: 1473ms, lr: 2.4821613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:39,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.42771 samples/s/p 4:19:27 } +2024-07-25 20:50:42,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 815/ 1625], loss: 1.077, per_step_time: 1471ms, lr: 2.4816842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:42,589 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.43542 samples/s/p 4:19:02 } +2024-07-25 20:50:45,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 817/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 2.4812067e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:45,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.42944 samples/s/p 4:19:16 } +2024-07-25 20:50:48,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 819/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 2.480729e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:48,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.43349 samples/s/p 4:19:02 } +2024-07-25 20:50:51,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 821/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 2.4802514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:51,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43758 samples/s/p 4:18:47 } +2024-07-25 20:50:54,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 823/ 
1625], loss: 1.107, per_step_time: 1470ms, lr: 2.4797733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:54,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43866 samples/s/p 4:18:41 } +2024-07-25 20:50:57,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 825/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 2.4792951e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:57,347 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43087 samples/s/p 4:19:00 } +2024-07-25 20:51:00,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 827/ 1625], loss: 1.134, per_step_time: 1470ms, lr: 2.478817e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:00,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43933 samples/s/p 4:18:33 } +2024-07-25 20:51:03,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 829/ 1625], loss: 1.320, per_step_time: 1473ms, lr: 2.4783385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:03,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.42921 samples/s/p 4:18:59 } +2024-07-25 20:51:06,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 831/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 2.4778597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:06,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43309 samples/s/p 4:18:45 } +2024-07-25 20:51:09,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 833/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.477381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:09,154 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43145 samples/s/p 4:18:47 } +2024-07-25 20:51:12,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 835/ 1625], loss: 1.034, per_step_time: 1472ms, lr: 2.476902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:12,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43131 samples/s/p 4:18:44 } +2024-07-25 20:51:15,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 837/ 1625], loss: 1.244, per_step_time: 1474ms, lr: 2.476423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:15,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.42606 samples/s/p 4:18:56 } +2024-07-25 20:51:18,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 839/ 1625], loss: 1.308, per_step_time: 1471ms, lr: 2.4759434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:18,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.43689 samples/s/p 4:18:22 } +2024-07-25 20:51:20,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 841/ 1625], loss: 1.088, per_step_time: 1471ms, lr: 2.4754641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:20,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.43551 samples/s/p 4:18:23 } +2024-07-25 20:51:23,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 843/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 2.4749845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:23,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.43564 samples/s/p 4:18:20 } +2024-07-25 20:51:26,869 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 845/ 1625], loss: 1.298, per_step_time: 1474ms, lr: 2.474505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:26,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.42618 samples/s/p 4:18:44 } +2024-07-25 20:51:29,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 847/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 2.4740246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:29,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.43505 samples/s/p 4:18:16 } +2024-07-25 20:51:32,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 849/ 1625], loss: 1.202, per_step_time: 1470ms, lr: 2.4735444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:32,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.44119 samples/s/p 4:17:56 } +2024-07-25 20:51:35,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 851/ 1625], loss: 1.151, per_step_time: 1473ms, lr: 2.4730645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:35,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.42810 samples/s/p 4:18:30 } +2024-07-25 20:51:38,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 853/ 1625], loss: 1.191, per_step_time: 1473ms, lr: 2.472584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:38,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.42977 samples/s/p 4:18:22 } +2024-07-25 20:51:41,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 855/ 1625], loss: 0.942, per_step_time: 1471ms, lr: 2.472103e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:41,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43848 samples/s/p 4:17:54 } +2024-07-25 20:51:44,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 857/ 1625], loss: 1.369, per_step_time: 1470ms, lr: 2.4716222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:44,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43986 samples/s/p 4:17:48 } +2024-07-25 20:51:47,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 859/ 1625], loss: 1.313, per_step_time: 1470ms, lr: 2.4711413e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:47,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.44013 samples/s/p 4:17:44 } +2024-07-25 20:51:50,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 861/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 2.47066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:50,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43588 samples/s/p 4:17:53 } +2024-07-25 20:51:53,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 863/ 1625], loss: 1.164, per_step_time: 1472ms, lr: 2.4701789e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:53,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43457 samples/s/p 4:17:54 } +2024-07-25 20:51:56,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 865/ 1625], loss: 1.142, per_step_time: 1477ms, lr: 2.4696972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:56,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 
5.41597 samples/s/p 4:18:44 } +2024-07-25 20:51:59,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 867/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 2.4692155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:59,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43700 samples/s/p 4:17:41 } +2024-07-25 20:52:02,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 869/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 2.4687335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:02,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43529 samples/s/p 4:17:43 } +2024-07-25 20:52:05,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 871/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 2.4682515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:05,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43265 samples/s/p 4:17:47 } +2024-07-25 20:52:08,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 873/ 1625], loss: 1.160, per_step_time: 1473ms, lr: 2.4677693e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:08,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43090 samples/s/p 4:17:50 } +2024-07-25 20:52:11,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 875/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 2.467287e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:11,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43262 samples/s/p 4:17:42 } +2024-07-25 20:52:14,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 877/ 
1625], loss: 1.386, per_step_time: 1473ms, lr: 2.4668043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:14,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43040 samples/s/p 4:17:45 } +2024-07-25 20:52:17,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 879/ 1625], loss: 1.280, per_step_time: 1473ms, lr: 2.4663217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:17,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.42922 samples/s/p 4:17:45 } +2024-07-25 20:52:19,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 881/ 1625], loss: 1.165, per_step_time: 1470ms, lr: 2.4658388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:20,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.44040 samples/s/p 4:17:11 } +2024-07-25 20:52:22,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 883/ 1625], loss: 1.088, per_step_time: 1474ms, lr: 2.4653558e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:22,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.42543 samples/s/p 4:17:50 } +2024-07-25 20:52:25,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 885/ 1625], loss: 1.289, per_step_time: 1471ms, lr: 2.4648729e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:25,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43595 samples/s/p 4:17:17 } +2024-07-25 20:52:28,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 887/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 2.4643892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:28,859 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43125 samples/s/p 4:17:28 } +2024-07-25 20:52:31,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 889/ 1625], loss: 1.345, per_step_time: 1473ms, lr: 2.463906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:31,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.42893 samples/s/p 4:17:32 } +2024-07-25 20:52:34,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 891/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 2.4634222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:34,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43643 samples/s/p 4:17:07 } +2024-07-25 20:52:37,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 893/ 1625], loss: 1.260, per_step_time: 1470ms, lr: 2.4629384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:37,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43869 samples/s/p 4:16:58 } +2024-07-25 20:52:40,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 895/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 2.4624542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:40,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43730 samples/s/p 4:16:59 } +2024-07-25 20:52:43,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 897/ 1625], loss: 1.246, per_step_time: 1473ms, lr: 2.46197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:43,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.42914 samples/s/p 4:17:19 } +2024-07-25 20:52:46,568 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 899/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 2.4614856e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:46,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43318 samples/s/p 4:17:05 } +2024-07-25 20:52:49,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 901/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 2.461001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:49,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43490 samples/s/p 4:16:57 } +2024-07-25 20:52:52,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 903/ 1625], loss: 1.062, per_step_time: 1473ms, lr: 2.4605162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:52,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.42989 samples/s/p 4:17:08 } +2024-07-25 20:52:55,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 905/ 1625], loss: 1.334, per_step_time: 1472ms, lr: 2.4600313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:55,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43346 samples/s/p 4:16:55 } +2024-07-25 20:52:58,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 907/ 1625], loss: 1.172, per_step_time: 1483ms, lr: 2.4595463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:58,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.39232 samples/s/p 4:18:50 } +2024-07-25 20:53:01,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 909/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.4590609e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:01,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43574 samples/s/p 4:16:43 } +2024-07-25 20:53:04,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 911/ 1625], loss: 1.374, per_step_time: 1473ms, lr: 2.4585755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:04,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43049 samples/s/p 4:16:55 } +2024-07-25 20:53:07,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 913/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 2.45809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:07,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43483 samples/s/p 4:16:39 } +2024-07-25 20:53:10,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 915/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.4576042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:10,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43575 samples/s/p 4:16:34 } +2024-07-25 20:53:13,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 917/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 2.4571184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:13,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43254 samples/s/p 4:16:40 } +2024-07-25 20:53:16,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 919/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 2.4566321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:16,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 
5.43076 samples/s/p 4:16:42 } +2024-07-25 20:53:19,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 921/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 2.456146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:19,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43377 samples/s/p 4:16:31 } +2024-07-25 20:53:22,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 923/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 2.4556595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:22,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43553 samples/s/p 4:16:23 } +2024-07-25 20:53:24,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 925/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.4551731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:24,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43557 samples/s/p 4:16:20 } +2024-07-25 20:53:27,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 927/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 2.4546864e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:27,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43741 samples/s/p 4:16:12 } +2024-07-25 20:53:30,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 929/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 2.4541992e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:30,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43889 samples/s/p 4:16:04 } +2024-07-25 20:53:33,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 931/ 
1625], loss: 1.181, per_step_time: 1470ms, lr: 2.4537121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:33,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.44218 samples/s/p 4:15:52 } +2024-07-25 20:53:36,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 933/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 2.453225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:36,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43783 samples/s/p 4:16:02 } +2024-07-25 20:53:39,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 935/ 1625], loss: 1.415, per_step_time: 1471ms, lr: 2.4527375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:39,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43551 samples/s/p 4:16:05 } +2024-07-25 20:53:42,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 937/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 2.45225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:42,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43143 samples/s/p 4:16:14 } +2024-07-25 20:53:45,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 939/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.4517623e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:45,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43384 samples/s/p 4:16:04 } +2024-07-25 20:53:48,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 941/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 2.4512745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:48,564 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43648 samples/s/p 4:15:54 } +2024-07-25 20:53:51,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 943/ 1625], loss: 1.144, per_step_time: 1470ms, lr: 2.450786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:51,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43967 samples/s/p 4:15:42 } +2024-07-25 20:53:54,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 945/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 2.4502982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:54,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43410 samples/s/p 4:15:54 } +2024-07-25 20:53:57,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 947/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 2.4498098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:57,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43776 samples/s/p 4:15:41 } +2024-07-25 20:54:00,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 949/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.449321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:00,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43365 samples/s/p 4:15:50 } +2024-07-25 20:54:03,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 951/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 2.4488325e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:03,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43189 samples/s/p 4:15:52 } +2024-07-25 20:54:06,269 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 953/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.4483435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:06,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43500 samples/s/p 4:15:40 } +2024-07-25 20:54:09,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 955/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 2.4478544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:09,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43296 samples/s/p 4:15:43 } +2024-07-25 20:54:12,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 957/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.4473653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:12,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43785 samples/s/p 4:15:26 } +2024-07-25 20:54:15,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 959/ 1625], loss: 1.230, per_step_time: 1470ms, lr: 2.4468758e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:15,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43856 samples/s/p 4:15:21 } +2024-07-25 20:54:18,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 961/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.4463863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:18,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43289 samples/s/p 4:15:34 } +2024-07-25 20:54:21,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 963/ 1625], loss: 1.204, per_step_time: 1473ms, lr: 
2.4458963e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:21,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43080 samples/s/p 4:15:37 } +2024-07-25 20:54:23,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 965/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 2.4454064e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:23,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43016 samples/s/p 4:15:36 } +2024-07-25 20:54:26,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 967/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 2.4449166e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:26,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.42806 samples/s/p 4:15:39 } +2024-07-25 20:54:29,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 969/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 2.444426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:29,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.43244 samples/s/p 4:15:24 } +2024-07-25 20:54:32,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 971/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 2.443936e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:32,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.43469 samples/s/p 4:15:14 } +2024-07-25 20:54:35,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 973/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 2.4434456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:35,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% 
|█████████████████ | 5.42810 samples/s/p 4:15:30 } +2024-07-25 20:54:38,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 975/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.4429548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:38,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.43753 samples/s/p 4:15:01 } +2024-07-25 20:54:41,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 977/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 2.4424635e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:41,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.44188 samples/s/p 4:14:45 } +2024-07-25 20:54:44,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 979/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 2.4419727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:44,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.43071 samples/s/p 4:15:14 } +2024-07-25 20:54:47,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 981/ 1625], loss: 1.095, per_step_time: 1469ms, lr: 2.4414816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:47,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.44351 samples/s/p 4:14:35 } +2024-07-25 20:54:50,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 983/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 2.4409901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:50,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.43962 samples/s/p 4:14:43 } +2024-07-25 20:54:53,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 4/ 10], step:[ 985/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 2.4404984e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:53,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43603 samples/s/p 4:14:50 } +2024-07-25 20:54:56,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 987/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 2.440007e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:56,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43434 samples/s/p 4:14:52 } +2024-07-25 20:54:59,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 989/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.4395149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:59,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43449 samples/s/p 4:14:49 } +2024-07-25 20:55:02,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 991/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.4390229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:02,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43681 samples/s/p 4:14:39 } +2024-07-25 20:55:05,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 993/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.4385306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:05,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43652 samples/s/p 4:14:37 } +2024-07-25 20:55:08,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 995/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 2.4380382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
20:55:08,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43202 samples/s/p 4:14:47 } +2024-07-25 20:55:11,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 997/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 2.4375458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:11,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43403 samples/s/p 4:14:38 } +2024-07-25 20:55:14,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 999/ 1625], loss: 1.207, per_step_time: 1474ms, lr: 2.437053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:14,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.42670 samples/s/p 4:14:56 } +2024-07-25 20:55:17,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1001/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 2.4365601e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:17,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43462 samples/s/p 4:14:30 } +2024-07-25 20:55:20,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1003/ 1625], loss: 0.955, per_step_time: 1471ms, lr: 2.4360672e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:20,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43524 samples/s/p 4:14:26 } +2024-07-25 20:55:23,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1005/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.4355739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:23,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43295 samples/s/p 4:14:29 } 
+2024-07-25 20:55:25,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1007/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 2.4350806e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:25,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43500 samples/s/p 4:14:21 } +2024-07-25 20:55:28,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1009/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.434587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:28,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43224 samples/s/p 4:14:25 } +2024-07-25 20:55:31,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1011/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.4340932e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:31,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43708 samples/s/p 4:14:09 } +2024-07-25 20:55:34,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1013/ 1625], loss: 1.297, per_step_time: 1473ms, lr: 2.4335995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:34,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.42807 samples/s/p 4:14:31 } +2024-07-25 20:55:37,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1015/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 2.4331055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:37,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43496 samples/s/p 4:14:09 } +2024-07-25 20:55:40,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1017/ 1625], loss: 1.134, 
per_step_time: 1471ms, lr: 2.4326111e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:40,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43570 samples/s/p 4:14:04 } +2024-07-25 20:55:43,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1019/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 2.432117e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:43,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43219 samples/s/p 4:14:11 } +2024-07-25 20:55:46,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1021/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 2.4316225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:46,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43188 samples/s/p 4:14:09 } +2024-07-25 20:55:49,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1023/ 1625], loss: 1.379, per_step_time: 1470ms, lr: 2.431128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:49,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43894 samples/s/p 4:13:46 } +2024-07-25 20:55:52,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1025/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 2.4306331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:52,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43575 samples/s/p 4:13:52 } +2024-07-25 20:55:55,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1027/ 1625], loss: 1.276, per_step_time: 1472ms, lr: 2.430138e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:55,471 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43165 samples/s/p 4:14:01 } +2024-07-25 20:55:58,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1029/ 1625], loss: 1.533, per_step_time: 1472ms, lr: 2.4296429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:58,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43441 samples/s/p 4:13:50 } +2024-07-25 20:56:01,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1031/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 2.4291478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:01,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43579 samples/s/p 4:13:43 } +2024-07-25 20:56:04,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1033/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 2.428652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:04,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.43559 samples/s/p 4:13:41 } +2024-07-25 20:56:07,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1035/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 2.4281568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:07,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.43788 samples/s/p 4:13:31 } +2024-07-25 20:56:10,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1037/ 1625], loss: 1.027, per_step_time: 1471ms, lr: 2.427661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:10,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.43620 samples/s/p 4:13:33 } +2024-07-25 20:56:13,177 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1039/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 2.4271649e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:13,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.42805 samples/s/p 4:13:53 } +2024-07-25 20:56:16,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1041/ 1625], loss: 1.168, per_step_time: 1473ms, lr: 2.4266688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:16,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.42884 samples/s/p 4:13:48 } +2024-07-25 20:56:19,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1043/ 1625], loss: 1.024, per_step_time: 1471ms, lr: 2.4261724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:19,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.43506 samples/s/p 4:13:27 } +2024-07-25 20:56:22,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1045/ 1625], loss: 1.225, per_step_time: 1470ms, lr: 2.425676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:22,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.44023 samples/s/p 4:13:10 } +2024-07-25 20:56:24,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1047/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 2.4251794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:24,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.42795 samples/s/p 4:13:41 } +2024-07-25 20:56:27,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1049/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 
2.4246825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:27,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.44105 samples/s/p 4:13:02 } +2024-07-25 20:56:30,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1051/ 1625], loss: 0.981, per_step_time: 1472ms, lr: 2.4241855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:30,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43210 samples/s/p 4:13:24 } +2024-07-25 20:56:33,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1053/ 1625], loss: 1.028, per_step_time: 1471ms, lr: 2.4236884e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:33,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43508 samples/s/p 4:13:13 } +2024-07-25 20:56:36,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1055/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.4231913e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:36,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43690 samples/s/p 4:13:05 } +2024-07-25 20:56:39,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1057/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 2.422694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:39,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43669 samples/s/p 4:13:02 } +2024-07-25 20:56:42,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1059/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.4221965e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:42,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
36.5% |██████████████████ | 5.43485 samples/s/p 4:13:04 } +2024-07-25 20:56:45,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1061/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 2.421699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:45,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43655 samples/s/p 4:12:57 } +2024-07-25 20:56:48,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1063/ 1625], loss: 1.396, per_step_time: 1471ms, lr: 2.421201e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:48,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43742 samples/s/p 4:12:51 } +2024-07-25 20:56:51,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1065/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 2.4207025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:51,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43242 samples/s/p 4:13:02 } +2024-07-25 20:56:54,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1067/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 2.4202047e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:54,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43413 samples/s/p 4:12:55 } +2024-07-25 20:56:57,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1069/ 1625], loss: 1.090, per_step_time: 1470ms, lr: 2.4197063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:57,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43864 samples/s/p 4:12:39 } +2024-07-25 20:57:00,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 4/ 10], step:[ 1071/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 2.4192077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:00,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43711 samples/s/p 4:12:40 } +2024-07-25 20:57:03,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1073/ 1625], loss: 1.272, per_step_time: 1470ms, lr: 2.418709e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:03,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43943 samples/s/p 4:12:31 } +2024-07-25 20:57:06,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1075/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.4182102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:06,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43203 samples/s/p 4:12:49 } +2024-07-25 20:57:09,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1077/ 1625], loss: 1.091, per_step_time: 1482ms, lr: 2.4177112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:09,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.39475 samples/s/p 4:14:31 } +2024-07-25 20:57:12,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1079/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.417212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:12,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43466 samples/s/p 4:12:36 } +2024-07-25 20:57:15,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1081/ 1625], loss: 1.162, per_step_time: 1470ms, lr: 2.4167124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
20:57:15,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.44135 samples/s/p 4:12:14 } +2024-07-25 20:57:18,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1083/ 1625], loss: 1.202, per_step_time: 1470ms, lr: 2.4162131e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:18,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43883 samples/s/p 4:12:18 } +2024-07-25 20:57:21,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1085/ 1625], loss: 1.123, per_step_time: 1470ms, lr: 2.4157134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:21,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.44217 samples/s/p 4:12:06 } +2024-07-25 20:57:24,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1087/ 1625], loss: 1.035, per_step_time: 1471ms, lr: 2.4152136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:24,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43642 samples/s/p 4:12:19 } +2024-07-25 20:57:26,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1089/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 2.4147135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:26,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43255 samples/s/p 4:12:27 } +2024-07-25 20:57:29,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1091/ 1625], loss: 0.914, per_step_time: 1473ms, lr: 2.4142133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:29,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43096 samples/s/p 4:12:28 } 
+2024-07-25 20:57:32,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1093/ 1625], loss: 1.103, per_step_time: 1471ms, lr: 2.413713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:32,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43510 samples/s/p 4:12:14 } +2024-07-25 20:57:35,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1095/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 2.4132125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:35,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43752 samples/s/p 4:12:04 } +2024-07-25 20:57:38,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1097/ 1625], loss: 1.011, per_step_time: 1471ms, lr: 2.412712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:38,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43575 samples/s/p 4:12:06 } +2024-07-25 20:57:41,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1099/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.4122113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:41,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43295 samples/s/p 4:12:11 } +2024-07-25 20:57:44,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1101/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 2.4117102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:44,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43992 samples/s/p 4:11:49 } +2024-07-25 20:57:47,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1103/ 1625], loss: 0.950, 
per_step_time: 1471ms, lr: 2.4112092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:47,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43821 samples/s/p 4:11:50 } +2024-07-25 20:57:50,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1105/ 1625], loss: 1.175, per_step_time: 1473ms, lr: 2.410708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:50,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43015 samples/s/p 4:12:10 } +2024-07-25 20:57:53,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1107/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 2.4102066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:53,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.44088 samples/s/p 4:11:37 } +2024-07-25 20:57:56,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1109/ 1625], loss: 1.166, per_step_time: 1475ms, lr: 2.409705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:56,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.42245 samples/s/p 4:12:25 } +2024-07-25 20:57:59,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1111/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.4092036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:59,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43329 samples/s/p 4:11:52 } +2024-07-25 20:58:02,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1113/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 2.4087014e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:02,377 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43750 samples/s/p 4:11:38 } +2024-07-25 20:58:05,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1115/ 1625], loss: 1.393, per_step_time: 1471ms, lr: 2.4081994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:05,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.43537 samples/s/p 4:11:41 } +2024-07-25 20:58:08,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1117/ 1625], loss: 1.232, per_step_time: 1483ms, lr: 2.4076973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:08,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.39195 samples/s/p 4:13:39 } +2024-07-25 20:58:11,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1119/ 1625], loss: 1.217, per_step_time: 1473ms, lr: 2.407195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:11,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.43020 samples/s/p 4:11:49 } +2024-07-25 20:58:14,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1121/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.4066921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:14,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.43320 samples/s/p 4:11:38 } +2024-07-25 20:58:17,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1123/ 1625], loss: 1.187, per_step_time: 1473ms, lr: 2.40619e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:17,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.43005 samples/s/p 4:11:44 } +2024-07-25 20:58:20,115 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1125/ 1625], loss: 1.255, per_step_time: 1473ms, lr: 2.4056868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:20,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.42903 samples/s/p 4:11:43 } +2024-07-25 20:58:23,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1127/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 2.4051838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:23,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.43576 samples/s/p 4:11:22 } +2024-07-25 20:58:26,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1129/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 2.4046809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:26,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.44145 samples/s/p 4:11:03 } +2024-07-25 20:58:28,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1131/ 1625], loss: 1.193, per_step_time: 1471ms, lr: 2.4041776e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:28,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43646 samples/s/p 4:11:14 } +2024-07-25 20:58:31,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1133/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 2.4036739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:31,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43559 samples/s/p 4:11:13 } +2024-07-25 20:58:34,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1135/ 1625], loss: 1.205, per_step_time: 1469ms, lr: 
2.4031702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:34,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.44255 samples/s/p 4:10:51 } +2024-07-25 20:58:37,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1137/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 2.4026664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:37,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43927 samples/s/p 4:10:57 } +2024-07-25 20:58:40,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1139/ 1625], loss: 1.038, per_step_time: 1470ms, lr: 2.4021625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:40,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43980 samples/s/p 4:10:53 } +2024-07-25 20:58:43,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1141/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 2.4016585e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:43,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43782 samples/s/p 4:10:56 } +2024-07-25 20:58:46,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1143/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.4011542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:46,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43294 samples/s/p 4:11:06 } +2024-07-25 20:58:49,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1145/ 1625], loss: 1.056, per_step_time: 1471ms, lr: 2.40065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:49,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
37.0% |██████████████████ | 5.43826 samples/s/p 4:10:48 } +2024-07-25 20:58:52,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1147/ 1625], loss: 1.273, per_step_time: 1472ms, lr: 2.4001452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:52,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43177 samples/s/p 4:11:03 } +2024-07-25 20:58:55,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1149/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.3996405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:55,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43665 samples/s/p 4:10:47 } +2024-07-25 20:58:58,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1151/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.3991359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:58,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43125 samples/s/p 4:10:59 } +2024-07-25 20:59:01,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1153/ 1625], loss: 1.233, per_step_time: 1470ms, lr: 2.3986307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:01,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.44023 samples/s/p 4:10:31 } +2024-07-25 20:59:04,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1155/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.3981253e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:04,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43383 samples/s/p 4:10:46 } +2024-07-25 20:59:07,316 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 4/ 10], step:[ 1157/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 2.3976201e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:07,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43169 samples/s/p 4:10:49 } +2024-07-25 20:59:10,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1159/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 2.3971146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:10,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43874 samples/s/p 4:10:27 } +2024-07-25 20:59:13,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1161/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.3966091e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:13,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43184 samples/s/p 4:10:43 } +2024-07-25 20:59:16,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1163/ 1625], loss: 0.920, per_step_time: 1473ms, lr: 2.396103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:16,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.42858 samples/s/p 4:10:49 } +2024-07-25 20:59:19,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1165/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 2.3955972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:19,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43435 samples/s/p 4:10:30 } +2024-07-25 20:59:22,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1167/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 2.3950912e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 20:59:22,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43876 samples/s/p 4:10:15 } +2024-07-25 20:59:25,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1169/ 1625], loss: 0.966, per_step_time: 1470ms, lr: 2.3945848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:25,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.44098 samples/s/p 4:10:06 } +2024-07-25 20:59:27,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1171/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 2.3940784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:27,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.44066 samples/s/p 4:10:04 } +2024-07-25 20:59:30,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1173/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 2.3935718e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:30,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43778 samples/s/p 4:10:09 } +2024-07-25 20:59:33,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1175/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.393065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:33,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43309 samples/s/p 4:10:19 } +2024-07-25 20:59:36,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1177/ 1625], loss: 1.247, per_step_time: 1470ms, lr: 2.3925579e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43925 samples/s/p 
4:09:59 } +2024-07-25 20:59:39,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1179/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.392051e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:39,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43287 samples/s/p 4:10:13 } +2024-07-25 20:59:42,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1181/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.3915436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:42,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43485 samples/s/p 4:10:05 } +2024-07-25 20:59:45,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1183/ 1625], loss: 1.230, per_step_time: 1473ms, lr: 2.3910365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:45,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43065 samples/s/p 4:10:14 } +2024-07-25 20:59:48,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1185/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 2.3905288e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:48,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43804 samples/s/p 4:09:50 } +2024-07-25 20:59:51,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1187/ 1625], loss: 1.158, per_step_time: 1470ms, lr: 2.3900211e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:51,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43860 samples/s/p 4:09:46 } +2024-07-25 20:59:54,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1189/ 1625], loss: 
1.161, per_step_time: 1470ms, lr: 2.3895132e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:54,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43980 samples/s/p 4:09:39 } +2024-07-25 20:59:57,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1191/ 1625], loss: 1.297, per_step_time: 1473ms, lr: 2.3890052e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:57,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.42972 samples/s/p 4:10:04 } +2024-07-25 21:00:00,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1193/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 2.3884972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:00,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43638 samples/s/p 4:09:43 } +2024-07-25 21:00:03,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1195/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 2.3879888e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:03,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43840 samples/s/p 4:09:34 } +2024-07-25 21:00:06,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1197/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 2.3874802e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:06,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43585 samples/s/p 4:09:39 } +2024-07-25 21:00:09,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1199/ 1625], loss: 1.037, per_step_time: 1471ms, lr: 2.3869716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:09,278 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43567 samples/s/p 4:09:36 } +2024-07-25 21:00:12,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1201/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 2.3864632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:12,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43225 samples/s/p 4:09:43 } +2024-07-25 21:00:15,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1203/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.3859538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:15,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43654 samples/s/p 4:09:28 } +2024-07-25 21:00:18,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1205/ 1625], loss: 1.304, per_step_time: 1471ms, lr: 2.3854449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:18,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43563 samples/s/p 4:09:27 } +2024-07-25 21:00:21,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1207/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.3849358e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:21,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43318 samples/s/p 4:09:31 } +2024-07-25 21:00:24,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1209/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 2.3844266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:24,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43614 samples/s/p 4:09:20 } +2024-07-25 
21:00:26,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1211/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 2.3839166e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:26,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43754 samples/s/p 4:09:13 } +2024-07-25 21:00:29,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1213/ 1625], loss: 1.367, per_step_time: 1472ms, lr: 2.3834073e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:29,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43154 samples/s/p 4:09:27 } +2024-07-25 21:00:32,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1215/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.3828976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:32,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43507 samples/s/p 4:09:14 } +2024-07-25 21:00:35,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1217/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 2.3823872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:35,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43401 samples/s/p 4:09:14 } +2024-07-25 21:00:38,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1219/ 1625], loss: 1.324, per_step_time: 1470ms, lr: 2.3818773e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:38,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.44067 samples/s/p 4:08:53 } +2024-07-25 21:00:41,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1221/ 1625], loss: 1.435, per_step_time: 
1473ms, lr: 2.3813669e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:41,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43073 samples/s/p 4:09:17 } +2024-07-25 21:00:44,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1223/ 1625], loss: 1.302, per_step_time: 1470ms, lr: 2.3808565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:44,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43943 samples/s/p 4:08:50 } +2024-07-25 21:00:47,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1225/ 1625], loss: 1.394, per_step_time: 1472ms, lr: 2.3803459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:47,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43326 samples/s/p 4:09:04 } +2024-07-25 21:00:50,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1227/ 1625], loss: 1.141, per_step_time: 1470ms, lr: 2.3798351e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:50,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.44177 samples/s/p 4:08:38 } +2024-07-25 21:00:53,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1229/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 2.379324e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:53,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43298 samples/s/p 4:08:59 } +2024-07-25 21:00:56,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1231/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.378813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:56,489 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 37.6% |██████████████████ | 5.43535 samples/s/p 4:08:50 } +2024-07-25 21:00:59,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1233/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 2.3783017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:59,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43912 samples/s/p 4:08:37 } +2024-07-25 21:01:02,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1235/ 1625], loss: 1.003, per_step_time: 1470ms, lr: 2.3777904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:02,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43923 samples/s/p 4:08:33 } +2024-07-25 21:01:05,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1237/ 1625], loss: 1.076, per_step_time: 1470ms, lr: 2.3772787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:05,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.44041 samples/s/p 4:08:27 } +2024-07-25 21:01:08,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1239/ 1625], loss: 1.181, per_step_time: 1469ms, lr: 2.3767674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:08,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.44251 samples/s/p 4:08:19 } +2024-07-25 21:01:11,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1241/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.3762554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:11,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43740 samples/s/p 4:08:30 } +2024-07-25 21:01:14,182 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1243/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.3757435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:14,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43369 samples/s/p 4:08:37 } +2024-07-25 21:01:17,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1245/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.3752315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:17,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.42968 samples/s/p 4:08:45 } +2024-07-25 21:01:20,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1247/ 1625], loss: 1.100, per_step_time: 1473ms, lr: 2.374719e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:20,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.42758 samples/s/p 4:08:48 } +2024-07-25 21:01:23,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1249/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.3742066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:23,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.43211 samples/s/p 4:08:32 } +2024-07-25 21:01:25,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1251/ 1625], loss: 1.154, per_step_time: 1469ms, lr: 2.373694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:25,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.44282 samples/s/p 4:08:00 } +2024-07-25 21:01:28,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1253/ 1625], loss: 1.289, per_step_time: 1472ms, lr: 
2.3731813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:28,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.43392 samples/s/p 4:08:21 } +2024-07-25 21:01:31,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1255/ 1625], loss: 1.197, per_step_time: 1469ms, lr: 2.3726683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:31,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.44399 samples/s/p 4:07:51 } +2024-07-25 21:01:34,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1257/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 2.3721554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:34,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.43675 samples/s/p 4:08:08 } +2024-07-25 21:01:37,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1259/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.371642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:37,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.43540 samples/s/p 4:08:09 } +2024-07-25 21:01:40,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1261/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 2.3711285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:40,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.44032 samples/s/p 4:07:52 } +2024-07-25 21:01:43,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1263/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 2.3706152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:43,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
37.8% |██████████████████ | 5.43192 samples/s/p 4:08:12 } +2024-07-25 21:01:46,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1265/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 2.3701015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:46,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.43349 samples/s/p 4:08:05 } +2024-07-25 21:01:49,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1267/ 1625], loss: 1.050, per_step_time: 1474ms, lr: 2.3695877e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:49,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.42496 samples/s/p 4:08:25 } +2024-07-25 21:01:52,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1269/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.3690738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:52,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.43371 samples/s/p 4:07:58 } +2024-07-25 21:01:55,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1271/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.3685594e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:55,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.43382 samples/s/p 4:07:55 } +2024-07-25 21:01:58,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1273/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 2.3680452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:58,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.43147 samples/s/p 4:07:59 } +2024-07-25 21:02:01,402 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 4/ 10], step:[ 1275/ 1625], loss: 0.887, per_step_time: 1470ms, lr: 2.3675308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:01,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.44175 samples/s/p 4:07:28 } +2024-07-25 21:02:04,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1277/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 2.3670162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:04,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43054 samples/s/p 4:07:55 } +2024-07-25 21:02:07,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1279/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.3665016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:07,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43847 samples/s/p 4:07:31 } +2024-07-25 21:02:10,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1281/ 1625], loss: 1.345, per_step_time: 1471ms, lr: 2.3659866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:10,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43706 samples/s/p 4:07:32 } +2024-07-25 21:02:13,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1283/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 2.3654715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:13,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43284 samples/s/p 4:07:40 } +2024-07-25 21:02:16,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1285/ 1625], loss: 1.160, per_step_time: 1470ms, lr: 2.3649563e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:02:16,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43856 samples/s/p 4:07:22 } +2024-07-25 21:02:19,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1287/ 1625], loss: 1.379, per_step_time: 1472ms, lr: 2.364441e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:19,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43307 samples/s/p 4:07:34 } +2024-07-25 21:02:22,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1289/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 2.3639259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:22,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43600 samples/s/p 4:07:23 } +2024-07-25 21:02:25,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1291/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 2.36341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:25,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43771 samples/s/p 4:07:15 } +2024-07-25 21:02:27,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1293/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 2.3628942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:27,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.43961 samples/s/p 4:07:07 } +2024-07-25 21:02:30,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1295/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.3623785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:30,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.43638 samples/s/p 4:07:13 
} +2024-07-25 21:02:33,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1297/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 2.3618622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:33,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.43396 samples/s/p 4:07:17 } +2024-07-25 21:02:36,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1299/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 2.3613458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:36,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.43407 samples/s/p 4:07:13 } +2024-07-25 21:02:39,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1301/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.3608296e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:39,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.43192 samples/s/p 4:07:16 } +2024-07-25 21:02:42,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1303/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 2.3603132e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:42,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.43348 samples/s/p 4:07:09 } +2024-07-25 21:02:45,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1305/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 2.3597966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:45,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.43255 samples/s/p 4:07:09 } +2024-07-25 21:02:48,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1307/ 1625], loss: 
1.249, per_step_time: 1473ms, lr: 2.3592798e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:48,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.42792 samples/s/p 4:07:18 } +2024-07-25 21:02:51,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1309/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 2.3587627e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:51,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43319 samples/s/p 4:07:01 } +2024-07-25 21:02:54,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1311/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 2.3582457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:54,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43222 samples/s/p 4:07:01 } +2024-07-25 21:02:57,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1313/ 1625], loss: 1.143, per_step_time: 1473ms, lr: 2.3577282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:57,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43027 samples/s/p 4:07:03 } +2024-07-25 21:03:00,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1315/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.3572107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:00,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43657 samples/s/p 4:06:43 } +2024-07-25 21:03:03,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1317/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.3566932e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:03,379 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43382 samples/s/p 4:06:48 } +2024-07-25 21:03:06,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1319/ 1625], loss: 1.265, per_step_time: 1473ms, lr: 2.3561757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:06,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43087 samples/s/p 4:06:53 } +2024-07-25 21:03:09,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1321/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 2.3556577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:09,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43718 samples/s/p 4:06:32 } +2024-07-25 21:03:12,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1323/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 2.35514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:12,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43401 samples/s/p 4:06:38 } +2024-07-25 21:03:15,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1325/ 1625], loss: 0.985, per_step_time: 1472ms, lr: 2.3546214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:15,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43362 samples/s/p 4:06:36 } +2024-07-25 21:03:18,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1327/ 1625], loss: 1.278, per_step_time: 1474ms, lr: 2.3541032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:18,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.42551 samples/s/p 4:06:55 } +2024-07-25 
21:03:21,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1329/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.353585e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:21,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43298 samples/s/p 4:06:32 } +2024-07-25 21:03:24,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1331/ 1625], loss: 1.386, per_step_time: 1470ms, lr: 2.3530665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:24,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43875 samples/s/p 4:06:13 } +2024-07-25 21:03:26,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1333/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 2.3525474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:26,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43843 samples/s/p 4:06:11 } +2024-07-25 21:03:29,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1335/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 2.3520286e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:29,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43520 samples/s/p 4:06:17 } +2024-07-25 21:03:32,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1337/ 1625], loss: 1.373, per_step_time: 1471ms, lr: 2.3515096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:32,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43582 samples/s/p 4:06:13 } +2024-07-25 21:03:35,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1339/ 1625], loss: 1.259, 
per_step_time: 1472ms, lr: 2.3509905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:35,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43338 samples/s/p 4:06:16 } +2024-07-25 21:03:38,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1341/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 2.350471e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:38,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43689 samples/s/p 4:06:04 } +2024-07-25 21:03:41,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1343/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.3499517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:41,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43458 samples/s/p 4:06:07 } +2024-07-25 21:03:44,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1345/ 1625], loss: 1.059, per_step_time: 1474ms, lr: 2.3494318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:44,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.42379 samples/s/p 4:06:34 } +2024-07-25 21:03:47,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1347/ 1625], loss: 1.173, per_step_time: 1470ms, lr: 2.3489121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:47,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43942 samples/s/p 4:05:48 } +2024-07-25 21:03:50,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1349/ 1625], loss: 0.962, per_step_time: 1472ms, lr: 2.348392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:50,605 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43206 samples/s/p 4:06:05 } +2024-07-25 21:03:53,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1351/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 2.347872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:53,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43331 samples/s/p 4:05:59 } +2024-07-25 21:03:56,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1353/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 2.3473518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:56,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.44050 samples/s/p 4:05:36 } +2024-07-25 21:03:59,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1355/ 1625], loss: 1.011, per_step_time: 1472ms, lr: 2.3468312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:59,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43112 samples/s/p 4:05:59 } +2024-07-25 21:04:02,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1357/ 1625], loss: 1.483, per_step_time: 1471ms, lr: 2.346311e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:02,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43542 samples/s/p 4:05:44 } +2024-07-25 21:04:05,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1359/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.3457902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:05,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43273 samples/s/p 4:05:49 } +2024-07-25 
21:04:08,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1361/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.3452694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:08,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43619 samples/s/p 4:05:36 } +2024-07-25 21:04:11,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1363/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.3447485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:11,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43550 samples/s/p 4:05:35 } +2024-07-25 21:04:14,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1365/ 1625], loss: 1.111, per_step_time: 1471ms, lr: 2.3442273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:14,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43555 samples/s/p 4:05:32 } +2024-07-25 21:04:17,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1367/ 1625], loss: 1.107, per_step_time: 1473ms, lr: 2.343706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:17,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43092 samples/s/p 4:05:42 } +2024-07-25 21:04:20,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1369/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 2.3431845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:20,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.42834 samples/s/p 4:05:46 } +2024-07-25 21:04:23,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1371/ 1625], loss: 1.124, 
per_step_time: 1472ms, lr: 2.342663e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:23,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43271 samples/s/p 4:05:31 } +2024-07-25 21:04:26,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1373/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.3421413e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:26,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43205 samples/s/p 4:05:30 } +2024-07-25 21:04:28,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1375/ 1625], loss: 1.104, per_step_time: 1474ms, lr: 2.3416194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:28,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.42610 samples/s/p 4:05:43 } +2024-07-25 21:04:31,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1377/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 2.3410974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:31,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.44029 samples/s/p 4:05:02 } +2024-07-25 21:04:34,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1379/ 1625], loss: 1.295, per_step_time: 1474ms, lr: 2.3405755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:34,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.42627 samples/s/p 4:05:37 } +2024-07-25 21:04:37,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1381/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 2.340053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:37,832 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.43905 samples/s/p 4:04:59 } +2024-07-25 21:04:40,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1383/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 2.3395305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:40,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.43441 samples/s/p 4:05:09 } +2024-07-25 21:04:43,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1385/ 1625], loss: 1.235, per_step_time: 1470ms, lr: 2.3390083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:43,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.44089 samples/s/p 4:04:48 } +2024-07-25 21:04:46,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1387/ 1625], loss: 1.106, per_step_time: 1470ms, lr: 2.3384853e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:46,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.43997 samples/s/p 4:04:48 } +2024-07-25 21:04:49,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1389/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 2.3379625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:49,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.43027 samples/s/p 4:05:11 } +2024-07-25 21:04:52,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1391/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 2.3374394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:52,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43657 samples/s/p 4:04:51 } +2024-07-25 
21:04:55,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1393/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.3369164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:55,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43721 samples/s/p 4:04:46 } +2024-07-25 21:04:58,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1395/ 1625], loss: 1.203, per_step_time: 1473ms, lr: 2.336393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:58,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.42980 samples/s/p 4:05:04 } +2024-07-25 21:05:01,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1397/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 2.3358696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:01,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43322 samples/s/p 4:04:51 } +2024-07-25 21:05:04,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1399/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 2.3353461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:04,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43598 samples/s/p 4:04:41 } +2024-07-25 21:05:07,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1401/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.334822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:07,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43065 samples/s/p 4:04:52 } +2024-07-25 21:05:10,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1403/ 1625], loss: 1.254, 
per_step_time: 1474ms, lr: 2.3342984e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:10,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.42714 samples/s/p 4:04:59 } +2024-07-25 21:05:13,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1405/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 2.3337743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:13,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43041 samples/s/p 4:04:47 } +2024-07-25 21:05:16,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1407/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.3332504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:16,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43255 samples/s/p 4:04:38 } +2024-07-25 21:05:19,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1409/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.3327257e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:19,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43142 samples/s/p 4:04:39 } +2024-07-25 21:05:22,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1411/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 2.3322013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:22,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43741 samples/s/p 4:04:19 } +2024-07-25 21:05:25,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1413/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 2.3316768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:25,059 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43257 samples/s/p 4:04:30 } +2024-07-25 21:05:28,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1415/ 1625], loss: 1.025, per_step_time: 1470ms, lr: 2.3311522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:28,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.44155 samples/s/p 4:04:02 } +2024-07-25 21:05:30,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1417/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.3306273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:30,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43271 samples/s/p 4:04:23 } +2024-07-25 21:05:33,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1419/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 2.3301021e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:33,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43937 samples/s/p 4:04:02 } +2024-07-25 21:05:36,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1421/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 2.329577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:36,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43194 samples/s/p 4:04:19 } +2024-07-25 21:05:39,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1423/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 2.3290517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:39,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43751 samples/s/p 4:04:01 } +2024-07-25 
21:05:42,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1425/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 2.3285264e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:42,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43783 samples/s/p 4:03:58 } +2024-07-25 21:05:45,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1427/ 1625], loss: 1.306, per_step_time: 1473ms, lr: 2.3280007e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:45,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43079 samples/s/p 4:04:14 } +2024-07-25 21:05:48,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1429/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 2.3274748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:48,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43384 samples/s/p 4:04:03 } +2024-07-25 21:05:51,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1431/ 1625], loss: 1.180, per_step_time: 1474ms, lr: 2.326949e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:51,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.42487 samples/s/p 4:04:24 } +2024-07-25 21:05:54,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1433/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 2.3264229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:54,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43451 samples/s/p 4:03:55 } +2024-07-25 21:05:57,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1435/ 1625], loss: 1.253, 
per_step_time: 1471ms, lr: 2.3258966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:57,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43575 samples/s/p 4:03:49 } +2024-07-25 21:06:00,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1437/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.3253704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:00,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43161 samples/s/p 4:03:57 } +2024-07-25 21:06:03,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1439/ 1625], loss: 1.168, per_step_time: 1473ms, lr: 2.324844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:03,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43013 samples/s/p 4:03:58 } +2024-07-25 21:06:06,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1441/ 1625], loss: 1.043, per_step_time: 1471ms, lr: 2.324317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:06,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43546 samples/s/p 4:03:41 } +2024-07-25 21:06:09,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1443/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.3237904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:09,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43348 samples/s/p 4:03:43 } +2024-07-25 21:06:12,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1445/ 1625], loss: 1.178, per_step_time: 1474ms, lr: 2.3232637e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:12,286 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.42583 samples/s/p 4:04:01 } +2024-07-25 21:06:15,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1447/ 1625], loss: 1.206, per_step_time: 1472ms, lr: 2.3227365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:15,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43422 samples/s/p 4:03:35 } +2024-07-25 21:06:18,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1449/ 1625], loss: 1.026, per_step_time: 1472ms, lr: 2.3222094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:18,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43125 samples/s/p 4:03:40 } +2024-07-25 21:06:21,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1451/ 1625], loss: 1.352, per_step_time: 1472ms, lr: 2.321682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:21,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43178 samples/s/p 4:03:36 } +2024-07-25 21:06:24,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1453/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 2.3211544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:24,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43356 samples/s/p 4:03:28 } +2024-07-25 21:06:27,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1455/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.3206267e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:27,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43244 samples/s/p 4:03:28 } +2024-07-25 
21:06:29,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1457/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 2.3200992e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:29,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43497 samples/s/p 4:03:18 } +2024-07-25 21:06:32,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1459/ 1625], loss: 1.048, per_step_time: 1473ms, lr: 2.3195713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:32,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43062 samples/s/p 4:03:27 } +2024-07-25 21:06:35,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1461/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.319043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:35,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43603 samples/s/p 4:03:10 } +2024-07-25 21:06:38,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1463/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 2.3185148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:38,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43677 samples/s/p 4:03:05 } +2024-07-25 21:06:41,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1465/ 1625], loss: 1.114, per_step_time: 1469ms, lr: 2.3179866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:41,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.44384 samples/s/p 4:02:43 } +2024-07-25 21:06:44,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1467/ 1625], loss: 1.149, 
per_step_time: 1472ms, lr: 2.317458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:44,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43363 samples/s/p 4:03:07 } +2024-07-25 21:06:47,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1469/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 2.3169294e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:47,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43384 samples/s/p 4:03:04 } +2024-07-25 21:06:50,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1471/ 1625], loss: 1.056, per_step_time: 1471ms, lr: 2.3164008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:50,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43524 samples/s/p 4:02:57 } +2024-07-25 21:06:53,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1473/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.3158722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:53,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43731 samples/s/p 4:02:48 } +2024-07-25 21:06:56,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1475/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.3153427e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:56,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43156 samples/s/p 4:03:01 } +2024-07-25 21:06:59,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1477/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.3148137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:59,506 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43545 samples/s/p 4:02:48 } +2024-07-25 21:07:02,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1479/ 1625], loss: 1.247, per_step_time: 1473ms, lr: 2.3142846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:02,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.42775 samples/s/p 4:03:05 } +2024-07-25 21:07:05,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1481/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 2.313755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:05,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43820 samples/s/p 4:02:34 } +2024-07-25 21:07:08,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1483/ 1625], loss: 0.946, per_step_time: 1470ms, lr: 2.3132252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:08,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43982 samples/s/p 4:02:27 } +2024-07-25 21:07:11,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1485/ 1625], loss: 1.296, per_step_time: 1471ms, lr: 2.3126957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:11,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43830 samples/s/p 4:02:28 } +2024-07-25 21:07:14,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1487/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 2.3121658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:14,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.42901 samples/s/p 4:02:50 } +2024-07-25 
21:07:17,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1489/ 1625], loss: 0.995, per_step_time: 1472ms, lr: 2.3116358e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:17,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43367 samples/s/p 4:02:35 } +2024-07-25 21:07:20,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1491/ 1625], loss: 1.212, per_step_time: 1472ms, lr: 2.3111055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:20,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43323 samples/s/p 4:02:33 } +2024-07-25 21:07:23,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1493/ 1625], loss: 0.977, per_step_time: 1472ms, lr: 2.3105753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:23,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43140 samples/s/p 4:02:35 } +2024-07-25 21:07:26,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1495/ 1625], loss: 1.279, per_step_time: 1471ms, lr: 2.310045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:26,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43838 samples/s/p 4:02:13 } +2024-07-25 21:07:29,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1497/ 1625], loss: 0.863, per_step_time: 1473ms, lr: 2.3095143e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:29,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.42837 samples/s/p 4:02:37 } +2024-07-25 21:07:31,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1499/ 1625], loss: 1.197, 
per_step_time: 1471ms, lr: 2.3089835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:31,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43582 samples/s/p 4:02:14 } +2024-07-25 21:07:34,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1501/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.3084529e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:34,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43557 samples/s/p 4:02:12 } +2024-07-25 21:07:37,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1503/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.307922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:37,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43598 samples/s/p 4:02:08 } +2024-07-25 21:07:40,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1505/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 2.3073904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:40,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43435 samples/s/p 4:02:09 } +2024-07-25 21:07:43,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1507/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 2.3068595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:43,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43713 samples/s/p 4:01:59 } +2024-07-25 21:07:46,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1509/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 2.306328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:46,729 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43137 samples/s/p 4:02:11 } +2024-07-25 21:07:49,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1511/ 1625], loss: 1.307, per_step_time: 1471ms, lr: 2.3057966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:49,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43750 samples/s/p 4:01:52 } +2024-07-25 21:07:52,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1513/ 1625], loss: 1.062, per_step_time: 1473ms, lr: 2.3052648e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:52,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.42997 samples/s/p 4:02:09 } +2024-07-25 21:07:55,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1515/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 2.3047329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:55,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43228 samples/s/p 4:02:00 } +2024-07-25 21:07:58,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1517/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.3042008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:58,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43297 samples/s/p 4:01:55 } +2024-07-25 21:08:01,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1519/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.3036688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:01,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43198 samples/s/p 4:01:55 } +2024-07-25 
21:08:04,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1521/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.3031364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:04,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43768 samples/s/p 4:01:37 } +2024-07-25 21:08:07,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1523/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 2.302604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:07,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43669 samples/s/p 4:01:37 } +2024-07-25 21:08:10,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1525/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.3020715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:10,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43781 samples/s/p 4:01:31 } +2024-07-25 21:08:13,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1527/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 2.301539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:13,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43666 samples/s/p 4:01:31 } +2024-07-25 21:08:16,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1529/ 1625], loss: 1.072, per_step_time: 1473ms, lr: 2.301006e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:16,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43030 samples/s/p 4:01:45 } +2024-07-25 21:08:19,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1531/ 1625], loss: 1.217, 
per_step_time: 1471ms, lr: 2.300473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:19,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43484 samples/s/p 4:01:30 } +2024-07-25 21:08:22,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1533/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 2.29994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:22,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43142 samples/s/p 4:01:36 } +2024-07-25 21:08:25,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1535/ 1625], loss: 1.288, per_step_time: 1471ms, lr: 2.2994067e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:25,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43605 samples/s/p 4:01:21 } +2024-07-25 21:08:28,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1537/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 2.2988734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:28,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43839 samples/s/p 4:01:11 } +2024-07-25 21:08:30,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1539/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 2.2983397e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:30,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43548 samples/s/p 4:01:16 } +2024-07-25 21:08:33,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1541/ 1625], loss: 1.210, per_step_time: 1474ms, lr: 2.2978062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:33,952 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.42659 samples/s/p 4:01:37 } +2024-07-25 21:08:36,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1543/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 2.2972723e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:36,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43200 samples/s/p 4:01:20 } +2024-07-25 21:08:39,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1545/ 1625], loss: 1.297, per_step_time: 1472ms, lr: 2.2967384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:39,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43320 samples/s/p 4:01:13 } +2024-07-25 21:08:42,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1547/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 2.2962042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:42,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43739 samples/s/p 4:00:59 } +2024-07-25 21:08:45,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1549/ 1625], loss: 1.301, per_step_time: 1471ms, lr: 2.2956701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:45,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43697 samples/s/p 4:00:58 } +2024-07-25 21:08:48,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1551/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 2.2951357e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:48,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43748 samples/s/p 4:00:53 } +2024-07-25 
21:08:51,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1553/ 1625], loss: 1.106, per_step_time: 1474ms, lr: 2.2946011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:51,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.42611 samples/s/p 4:01:21 } +2024-07-25 21:08:54,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1555/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.2940667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:54,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43416 samples/s/p 4:00:56 } +2024-07-25 21:08:57,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1557/ 1625], loss: 1.210, per_step_time: 1471ms, lr: 2.2935319e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:57,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43669 samples/s/p 4:00:47 } +2024-07-25 21:09:00,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1559/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 2.2929971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:00,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43575 samples/s/p 4:00:46 } +2024-07-25 21:09:03,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1561/ 1625], loss: 1.404, per_step_time: 1473ms, lr: 2.292462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:03,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.42900 samples/s/p 4:01:01 } +2024-07-25 21:09:06,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1563/ 1625], loss: 1.004, 
per_step_time: 1472ms, lr: 2.2919272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:06,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43400 samples/s/p 4:00:45 } +2024-07-25 21:09:09,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1565/ 1625], loss: 1.079, per_step_time: 1471ms, lr: 2.2913915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:09,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43492 samples/s/p 4:00:39 } +2024-07-25 21:09:12,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1567/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 2.2908564e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:12,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43453 samples/s/p 4:00:38 } +2024-07-25 21:09:15,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1569/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 2.2903208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:15,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43248 samples/s/p 4:00:40 } +2024-07-25 21:09:18,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1571/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 2.2897852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:18,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43222 samples/s/p 4:00:38 } +2024-07-25 21:09:21,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1573/ 1625], loss: 1.202, per_step_time: 1472ms, lr: 2.2892493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:21,179 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43216 samples/s/p 4:00:35 } +2024-07-25 21:09:24,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1575/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 2.288713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:24,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43731 samples/s/p 4:00:18 } +2024-07-25 21:09:27,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1577/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.2881772e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:27,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43643 samples/s/p 4:00:18 } +2024-07-25 21:09:30,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1579/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 2.2876407e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:30,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43200 samples/s/p 4:00:27 } +2024-07-25 21:09:32,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1581/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 2.2871045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:32,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43069 samples/s/p 4:00:27 } +2024-07-25 21:09:35,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1583/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 2.286568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:35,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43415 samples/s/p 4:00:15 } +2024-07-25 
21:09:38,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1585/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.2860315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:38,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43568 samples/s/p 4:00:08 } +2024-07-25 21:09:41,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1587/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 2.2854943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:41,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43620 samples/s/p 4:00:04 } +2024-07-25 21:09:44,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1589/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.2849577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:44,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43011 samples/s/p 4:00:17 } +2024-07-25 21:09:47,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1591/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.2844208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:47,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43711 samples/s/p 3:59:55 } +2024-07-25 21:09:50,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1593/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.2838836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:50,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43626 samples/s/p 3:59:55 } +2024-07-25 21:09:53,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1595/ 1625], loss: 1.215, 
per_step_time: 1470ms, lr: 2.283346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:53,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43886 samples/s/p 3:59:45 } +2024-07-25 21:09:56,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1597/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 2.2828086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:56,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43436 samples/s/p 3:59:54 } +2024-07-25 21:09:59,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1599/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 2.282271e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:59,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.44011 samples/s/p 3:59:36 } +2024-07-25 21:10:02,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1601/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 2.2817332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:02,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43734 samples/s/p 3:59:40 } +2024-07-25 21:10:05,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1603/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.2811953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:05,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43652 samples/s/p 3:59:39 } +2024-07-25 21:10:08,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1605/ 1625], loss: 1.096, per_step_time: 1470ms, lr: 2.2806575e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:08,387 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43889 samples/s/p 3:59:30 } +2024-07-25 21:10:11,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1607/ 1625], loss: 1.006, per_step_time: 1472ms, lr: 2.2801192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:11,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43270 samples/s/p 3:59:44 } +2024-07-25 21:10:14,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1609/ 1625], loss: 1.211, per_step_time: 1470ms, lr: 2.279581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:14,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.44155 samples/s/p 3:59:17 } +2024-07-25 21:10:17,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1611/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 2.2790426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:17,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43251 samples/s/p 3:59:38 } +2024-07-25 21:10:20,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1613/ 1625], loss: 1.236, per_step_time: 1476ms, lr: 2.278504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:20,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.41918 samples/s/p 4:00:11 } +2024-07-25 21:10:23,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1615/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.2779652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:23,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43703 samples/s/p 3:59:20 } +2024-07-25 
21:10:26,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1617/ 1625], loss: 0.985, per_step_time: 1471ms, lr: 2.2774264e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:26,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.43484 samples/s/p 3:59:23 } +2024-07-25 21:10:29,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1619/ 1625], loss: 1.268, per_step_time: 1471ms, lr: 2.2768874e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:29,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.43740 samples/s/p 3:59:13 } +2024-07-25 21:10:32,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1621/ 1625], loss: 1.014, per_step_time: 1471ms, lr: 2.2763483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:32,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.43478 samples/s/p 3:59:17 } +2024-07-25 21:10:34,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1623/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 2.2758091e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:34,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.43472 samples/s/p 3:59:15 } +2024-07-25 21:10:37,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1625/ 1625], loss: 1.401, per_step_time: 1471ms, lr: 2.2752696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:37,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.43812 samples/s/p 3:59:03 } +2024-07-25 21:10:40,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 2/ 1625], loss: 1.101, 
per_step_time: 1471ms, lr: 2.2747303e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:40,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.43574 samples/s/p 3:59:06 } +2024-07-25 21:10:43,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 4/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 2.2741906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:43,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.43448 samples/s/p 3:59:06 } +2024-07-25 21:10:46,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 6/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 2.2736509e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:46,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.42866 samples/s/p 3:59:19 } +2024-07-25 21:10:49,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 8/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 2.2731108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:49,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.43476 samples/s/p 3:59:00 } +2024-07-25 21:10:52,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 10/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.2725708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:52,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.43833 samples/s/p 3:58:47 } +2024-07-25 21:10:55,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 12/ 1625], loss: 1.227, per_step_time: 1477ms, lr: 2.2720307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:55,621 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.41289 samples/s/p 3:59:52 } +2024-07-25 21:10:58,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 14/ 1625], loss: 1.080, per_step_time: 1472ms, lr: 2.2714903e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:58,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.43470 samples/s/p 3:58:51 } +2024-07-25 21:11:01,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 16/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 2.27095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:01,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.42884 samples/s/p 3:59:04 } +2024-07-25 21:11:04,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 18/ 1625], loss: 1.031, per_step_time: 1472ms, lr: 2.2704093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:04,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.43467 samples/s/p 3:58:45 } +2024-07-25 21:11:07,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 20/ 1625], loss: 1.209, per_step_time: 1473ms, lr: 2.2698687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:07,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.42887 samples/s/p 3:58:58 } +2024-07-25 21:11:10,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 22/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 2.2693279e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:10,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.43986 samples/s/p 3:58:26 } +2024-07-25 
21:11:13,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 24/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 2.268787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:13,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.43242 samples/s/p 3:58:42 } +2024-07-25 21:11:16,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 26/ 1625], loss: 1.157, per_step_time: 1469ms, lr: 2.2682461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:16,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.44237 samples/s/p 3:58:13 } +2024-07-25 21:11:19,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 28/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 2.2677044e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:19,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43517 samples/s/p 3:58:29 } +2024-07-25 21:11:22,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 30/ 1625], loss: 1.344, per_step_time: 1474ms, lr: 2.2671631e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:22,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.42673 samples/s/p 3:58:49 } +2024-07-25 21:11:25,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 32/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.2666221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:25,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43340 samples/s/p 3:58:28 } +2024-07-25 21:11:28,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 34/ 1625], loss: 1.310, per_step_time: 
1472ms, lr: 2.2660804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:28,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43144 samples/s/p 3:58:30 } +2024-07-25 21:11:31,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 36/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.2655384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:31,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43561 samples/s/p 3:58:16 } +2024-07-25 21:11:33,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 38/ 1625], loss: 1.247, per_step_time: 1473ms, lr: 2.2649967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:33,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.42986 samples/s/p 3:58:29 } +2024-07-25 21:11:36,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 40/ 1625], loss: 1.410, per_step_time: 1471ms, lr: 2.2644546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:36,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43815 samples/s/p 3:58:04 } +2024-07-25 21:11:39,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 42/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.2639124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:39,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43630 samples/s/p 3:58:06 } +2024-07-25 21:11:42,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 44/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 2.2633702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:42,842 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43866 samples/s/p 3:57:57 } +2024-07-25 21:11:45,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 46/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 2.2628277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:45,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43901 samples/s/p 3:57:53 } +2024-07-25 21:11:48,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 48/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 2.2622855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:48,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43632 samples/s/p 3:57:57 } +2024-07-25 21:11:51,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 50/ 1625], loss: 1.264, per_step_time: 1474ms, lr: 2.2617425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:51,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.42732 samples/s/p 3:58:18 } +2024-07-25 21:11:54,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 52/ 1625], loss: 1.160, per_step_time: 1474ms, lr: 2.2611997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:54,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.42716 samples/s/p 3:58:15 } +2024-07-25 21:11:57,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 54/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.2606571e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:57,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43713 samples/s/p 3:57:46 } +2024-07-25 
21:12:00,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 56/ 1625], loss: 1.319, per_step_time: 1472ms, lr: 2.260114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:00,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43248 samples/s/p 3:57:55 } +2024-07-25 21:12:03,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 58/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 2.2595706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:03,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43636 samples/s/p 3:57:42 } +2024-07-25 21:12:06,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 60/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.2590275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:06,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43273 samples/s/p 3:57:49 } +2024-07-25 21:12:09,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 62/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.258484e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:09,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43434 samples/s/p 3:57:41 } +2024-07-25 21:12:12,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 64/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 2.2579403e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:12,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43726 samples/s/p 3:57:31 } +2024-07-25 21:12:15,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 66/ 1625], loss: 1.032, per_step_time: 
1471ms, lr: 2.2573966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:15,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43678 samples/s/p 3:57:29 } +2024-07-25 21:12:18,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 68/ 1625], loss: 1.121, per_step_time: 1477ms, lr: 2.2568527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:18,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.41602 samples/s/p 3:58:21 } +2024-07-25 21:12:21,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 70/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.2563088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:21,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43486 samples/s/p 3:57:28 } +2024-07-25 21:12:24,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 72/ 1625], loss: 1.486, per_step_time: 1472ms, lr: 2.2557646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:24,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43330 samples/s/p 3:57:29 } +2024-07-25 21:12:27,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 74/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 2.2552204e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:27,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43112 samples/s/p 3:57:32 } +2024-07-25 21:12:30,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 76/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 2.254676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:30,073 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43770 samples/s/p 3:57:12 } +2024-07-25 21:12:33,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 78/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.2541315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:33,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43704 samples/s/p 3:57:11 } +2024-07-25 21:12:35,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 80/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.2535869e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:35,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43122 samples/s/p 3:57:23 } +2024-07-25 21:12:38,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 82/ 1625], loss: 1.286, per_step_time: 1471ms, lr: 2.2530421e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:38,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43531 samples/s/p 3:57:09 } +2024-07-25 21:12:41,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 84/ 1625], loss: 0.951, per_step_time: 1472ms, lr: 2.2524971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:41,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43329 samples/s/p 3:57:12 } +2024-07-25 21:12:44,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 86/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 2.2519522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:44,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43369 samples/s/p 3:57:08 } +2024-07-25 
21:12:47,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 88/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 2.251407e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:47,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.42746 samples/s/p 3:57:21 } +2024-07-25 21:12:50,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 90/ 1625], loss: 1.149, per_step_time: 1474ms, lr: 2.2508617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:50,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.42477 samples/s/p 3:57:25 } +2024-07-25 21:12:53,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 92/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 2.2503164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:53,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43920 samples/s/p 3:56:45 } +2024-07-25 21:12:56,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 94/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 2.2497707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:56,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43423 samples/s/p 3:56:55 } +2024-07-25 21:12:59,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 96/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.2492251e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:59,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43561 samples/s/p 3:56:48 } +2024-07-25 21:13:02,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 98/ 1625], loss: 1.096, per_step_time: 
1471ms, lr: 2.2486793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:02,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43653 samples/s/p 3:56:43 } +2024-07-25 21:13:05,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 100/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 2.2481334e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:05,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43642 samples/s/p 3:56:40 } +2024-07-25 21:13:08,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 102/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.2475871e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:08,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43607 samples/s/p 3:56:38 } +2024-07-25 21:13:11,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 104/ 1625], loss: 1.066, per_step_time: 1469ms, lr: 2.247041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:11,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.44222 samples/s/p 3:56:19 } +2024-07-25 21:13:14,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 106/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.2464947e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:14,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43813 samples/s/p 3:56:27 } +2024-07-25 21:13:17,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 108/ 1625], loss: 1.106, per_step_time: 1470ms, lr: 2.245948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:17,287 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.44198 samples/s/p 3:56:14 } +2024-07-25 21:13:20,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 110/ 1625], loss: 1.275, per_step_time: 1473ms, lr: 2.2454016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:20,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43052 samples/s/p 3:56:41 } +2024-07-25 21:13:23,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 112/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.2448548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:23,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43782 samples/s/p 3:56:19 } +2024-07-25 21:13:26,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 114/ 1625], loss: 0.954, per_step_time: 1470ms, lr: 2.244308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:26,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43890 samples/s/p 3:56:13 } +2024-07-25 21:13:29,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 116/ 1625], loss: 1.193, per_step_time: 1473ms, lr: 2.2437613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:29,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.42980 samples/s/p 3:56:34 } +2024-07-25 21:13:32,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 118/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 2.243214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:32,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43039 samples/s/p 3:56:29 } +2024-07-25 
21:13:34,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 120/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 2.242667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:34,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43203 samples/s/p 3:56:22 } +2024-07-25 21:13:37,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 122/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 2.2421198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:37,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43332 samples/s/p 3:56:16 } +2024-07-25 21:13:40,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 124/ 1625], loss: 1.312, per_step_time: 1471ms, lr: 2.2415721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:40,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43749 samples/s/p 3:56:02 } +2024-07-25 21:13:43,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 126/ 1625], loss: 1.092, per_step_time: 1473ms, lr: 2.2410246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:43,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.42930 samples/s/p 3:56:20 } +2024-07-25 21:13:46,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 128/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.2404767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:46,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43317 samples/s/p 3:56:07 } +2024-07-25 21:13:49,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 130/ 1625], loss: 1.086, 
per_step_time: 1473ms, lr: 2.239929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:49,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.42824 samples/s/p 3:56:17 } +2024-07-25 21:13:52,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 132/ 1625], loss: 1.271, per_step_time: 1470ms, lr: 2.2393811e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:52,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43888 samples/s/p 3:55:47 } +2024-07-25 21:13:55,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 134/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.2388327e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:55,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43653 samples/s/p 3:55:50 } +2024-07-25 21:13:58,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 136/ 1625], loss: 1.397, per_step_time: 1472ms, lr: 2.2382847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:58,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43246 samples/s/p 3:55:57 } +2024-07-25 21:14:01,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 138/ 1625], loss: 1.244, per_step_time: 1471ms, lr: 2.2377366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:01,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43743 samples/s/p 3:55:41 } +2024-07-25 21:14:04,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 140/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 2.2371878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:04,509 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.44052 samples/s/p 3:55:30 } +2024-07-25 21:14:07,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 142/ 1625], loss: 1.356, per_step_time: 1473ms, lr: 2.2366394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:07,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43109 samples/s/p 3:55:52 } +2024-07-25 21:14:10,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 144/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.2360906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:10,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43315 samples/s/p 3:55:44 } +2024-07-25 21:14:13,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 146/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 2.2355418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:13,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43494 samples/s/p 3:55:36 } +2024-07-25 21:14:16,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 148/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 2.2349928e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:16,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43562 samples/s/p 3:55:31 } +2024-07-25 21:14:19,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 150/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.2344437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:19,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43700 samples/s/p 3:55:25 } +2024-07-25 
21:14:22,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 152/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.2338943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:22,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43241 samples/s/p 3:55:34 } +2024-07-25 21:14:25,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 154/ 1625], loss: 1.081, per_step_time: 1470ms, lr: 2.233345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:25,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43878 samples/s/p 3:55:14 } +2024-07-25 21:14:28,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 156/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.2327955e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:28,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43307 samples/s/p 3:55:26 } +2024-07-25 21:14:31,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 158/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 2.232246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:31,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.42888 samples/s/p 3:55:34 } +2024-07-25 21:14:34,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 160/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 2.2316963e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:34,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43565 samples/s/p 3:55:14 } +2024-07-25 21:14:36,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 162/ 1625], loss: 1.231, 
per_step_time: 1472ms, lr: 2.2311464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:36,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43316 samples/s/p 3:55:17 } +2024-07-25 21:14:39,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 164/ 1625], loss: 1.055, per_step_time: 1469ms, lr: 2.2305963e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:39,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.44415 samples/s/p 3:54:46 } +2024-07-25 21:14:42,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 166/ 1625], loss: 1.024, per_step_time: 1472ms, lr: 2.230046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:42,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43284 samples/s/p 3:55:12 } +2024-07-25 21:14:45,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 168/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 2.229496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:45,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43000 samples/s/p 3:55:17 } +2024-07-25 21:14:48,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 170/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.2289454e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:48,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43677 samples/s/p 3:54:56 } +2024-07-25 21:14:51,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 172/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 2.2283948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:51,731 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.43012 samples/s/p 3:55:10 } +2024-07-25 21:14:54,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 174/ 1625], loss: 1.076, per_step_time: 1470ms, lr: 2.2278444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:54,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.44023 samples/s/p 3:54:41 } +2024-07-25 21:14:57,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 176/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 2.2272936e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:57,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.43421 samples/s/p 3:54:54 } +2024-07-25 21:15:00,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 178/ 1625], loss: 1.280, per_step_time: 1471ms, lr: 2.2267428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:00,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.43560 samples/s/p 3:54:47 } +2024-07-25 21:15:03,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 180/ 1625], loss: 1.200, per_step_time: 1469ms, lr: 2.2261916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:03,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.44296 samples/s/p 3:54:25 } +2024-07-25 21:15:06,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 182/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.2256405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:06,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.43741 samples/s/p 3:54:37 } +2024-07-25 
21:15:09,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 184/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 2.2250892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:09,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.43308 samples/s/p 3:54:45 } +2024-07-25 21:15:12,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 186/ 1625], loss: 1.024, per_step_time: 1469ms, lr: 2.2245378e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:12,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.44317 samples/s/p 3:54:16 } +2024-07-25 21:15:15,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 188/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 2.2239865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:15,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43723 samples/s/p 3:54:28 } +2024-07-25 21:15:18,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 190/ 1625], loss: 1.009, per_step_time: 1469ms, lr: 2.2234346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:18,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.44326 samples/s/p 3:54:10 } +2024-07-25 21:15:21,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 192/ 1625], loss: 1.009, per_step_time: 1471ms, lr: 2.2228829e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:21,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43514 samples/s/p 3:54:28 } +2024-07-25 21:15:24,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 194/ 1625], loss: 1.187, 
per_step_time: 1472ms, lr: 2.222331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:24,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43225 samples/s/p 3:54:32 } +2024-07-25 21:15:27,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 196/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.2217791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:27,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43307 samples/s/p 3:54:27 } +2024-07-25 21:15:30,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 198/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 2.2212269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:30,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43726 samples/s/p 3:54:14 } +2024-07-25 21:15:33,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 200/ 1625], loss: 1.292, per_step_time: 1471ms, lr: 2.2206747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:33,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43482 samples/s/p 3:54:17 } +2024-07-25 21:15:35,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 202/ 1625], loss: 1.181, per_step_time: 1473ms, lr: 2.2201222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:35,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43038 samples/s/p 3:54:26 } +2024-07-25 21:15:38,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 204/ 1625], loss: 1.290, per_step_time: 1473ms, lr: 2.21957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:38,936 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43035 samples/s/p 3:54:23 } +2024-07-25 21:15:41,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 206/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 2.2190172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:41,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.44206 samples/s/p 3:53:49 } +2024-07-25 21:15:44,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 208/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 2.2184644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:44,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43269 samples/s/p 3:54:11 } +2024-07-25 21:15:47,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 210/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 2.2179118e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:47,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43274 samples/s/p 3:54:08 } +2024-07-25 21:15:50,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 212/ 1625], loss: 1.039, per_step_time: 1471ms, lr: 2.2173588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:50,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43626 samples/s/p 3:53:56 } +2024-07-25 21:15:53,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 214/ 1625], loss: 1.273, per_step_time: 1473ms, lr: 2.2168053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:53,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.42952 samples/s/p 3:54:10 } +2024-07-25 
21:15:56,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 216/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.2162525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:56,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43508 samples/s/p 3:53:53 } +2024-07-25 21:15:59,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 218/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 2.2156992e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:59,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43581 samples/s/p 3:53:48 } +2024-07-25 21:16:02,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 220/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 2.2151457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:02,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43782 samples/s/p 3:53:40 } +2024-07-25 21:16:05,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 222/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.214592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:05,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43602 samples/s/p 3:53:42 } +2024-07-25 21:16:08,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 224/ 1625], loss: 0.893, per_step_time: 1471ms, lr: 2.2140382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:08,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43751 samples/s/p 3:53:35 } +2024-07-25 21:16:11,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 226/ 1625], loss: 1.085, 
per_step_time: 1470ms, lr: 2.2134847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:11,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43861 samples/s/p 3:53:29 } +2024-07-25 21:16:14,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 228/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.2129307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:14,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43400 samples/s/p 3:53:38 } +2024-07-25 21:16:17,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 230/ 1625], loss: 0.865, per_step_time: 1471ms, lr: 2.2123762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:17,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43481 samples/s/p 3:53:33 } +2024-07-25 21:16:20,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 232/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 2.2118224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:20,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43265 samples/s/p 3:53:35 } +2024-07-25 21:16:23,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 234/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 2.211268e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:23,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43297 samples/s/p 3:53:32 } +2024-07-25 21:16:26,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 236/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 2.2107135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:26,149 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43316 samples/s/p 3:53:28 } +2024-07-25 21:16:29,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 238/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.210159e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:29,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43675 samples/s/p 3:53:16 } +2024-07-25 21:16:32,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 240/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 2.2096043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:32,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43638 samples/s/p 3:53:14 } +2024-07-25 21:16:34,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 242/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 2.2090495e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:35,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43628 samples/s/p 3:53:11 } +2024-07-25 21:16:37,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 244/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.2084943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:37,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43766 samples/s/p 3:53:05 } +2024-07-25 21:16:40,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 246/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.2079394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:40,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43497 samples/s/p 3:53:09 } +2024-07-25 
21:16:43,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 248/ 1625], loss: 1.072, per_step_time: 1472ms, lr: 2.2073842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:43,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43186 samples/s/p 3:53:14 } +2024-07-25 21:16:46,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 250/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 2.2068289e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:46,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43519 samples/s/p 3:53:02 } +2024-07-25 21:16:49,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 252/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 2.2062733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:49,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43851 samples/s/p 3:52:51 } +2024-07-25 21:16:52,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 254/ 1625], loss: 1.130, per_step_time: 1473ms, lr: 2.2057178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:52,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.42948 samples/s/p 3:53:11 } +2024-07-25 21:16:55,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 256/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 2.2051621e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:55,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43380 samples/s/p 3:52:57 } +2024-07-25 21:16:58,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 258/ 1625], loss: 1.149, 
per_step_time: 1473ms, lr: 2.2046064e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:58,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.42874 samples/s/p 3:53:07 } +2024-07-25 21:17:01,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 260/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.2040504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:01,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43630 samples/s/p 3:52:45 } +2024-07-25 21:17:04,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 262/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 2.2034943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:04,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43362 samples/s/p 3:52:49 } +2024-07-25 21:17:07,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 264/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 2.2029382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:07,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43022 samples/s/p 3:52:55 } +2024-07-25 21:17:10,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 266/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 2.2023818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:10,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43298 samples/s/p 3:52:45 } +2024-07-25 21:17:13,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 268/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 2.2018256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:13,369 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43987 samples/s/p 3:52:24 } +2024-07-25 21:17:16,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 270/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 2.201269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:16,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43257 samples/s/p 3:52:40 } +2024-07-25 21:17:19,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 272/ 1625], loss: 1.076, per_step_time: 1470ms, lr: 2.2007122e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:19,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43969 samples/s/p 3:52:19 } +2024-07-25 21:17:22,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 274/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 2.2001554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:22,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43829 samples/s/p 3:52:19 } +2024-07-25 21:17:25,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 276/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 2.1995987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:25,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.44114 samples/s/p 3:52:09 } +2024-07-25 21:17:28,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 278/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 2.1990416e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:28,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43682 samples/s/p 3:52:17 } +2024-07-25 
21:17:31,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 280/ 1625], loss: 1.223, per_step_time: 1470ms, lr: 2.1984844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:31,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.44133 samples/s/p 3:52:03 } +2024-07-25 21:17:34,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 282/ 1625], loss: 1.264, per_step_time: 1472ms, lr: 2.1979271e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:34,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43160 samples/s/p 3:52:25 } +2024-07-25 21:17:36,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 284/ 1625], loss: 1.397, per_step_time: 1470ms, lr: 2.19737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:36,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43897 samples/s/p 3:52:03 } +2024-07-25 21:17:39,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 286/ 1625], loss: 1.279, per_step_time: 1475ms, lr: 2.1968124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:39,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.42159 samples/s/p 3:52:44 } +2024-07-25 21:17:42,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 288/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 2.1962549e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:42,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43241 samples/s/p 3:52:14 } +2024-07-25 21:17:45,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 290/ 1625], loss: 1.272, 
per_step_time: 1471ms, lr: 2.195697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:45,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43753 samples/s/p 3:51:58 } +2024-07-25 21:17:48,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 292/ 1625], loss: 1.162, per_step_time: 1470ms, lr: 2.1951395e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:48,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43863 samples/s/p 3:51:52 } +2024-07-25 21:17:51,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 294/ 1625], loss: 1.277, per_step_time: 1472ms, lr: 2.1945816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:51,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43255 samples/s/p 3:52:04 } +2024-07-25 21:17:54,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 296/ 1625], loss: 1.111, per_step_time: 1473ms, lr: 2.1940232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:54,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.42828 samples/s/p 3:52:12 } +2024-07-25 21:17:57,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 298/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 2.1934653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:57,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43679 samples/s/p 3:51:48 } +2024-07-25 21:18:00,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 300/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 2.192907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:00,583 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43529 samples/s/p 3:51:49 } +2024-07-25 21:18:03,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 302/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 2.1923484e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:03,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.43468 samples/s/p 3:51:47 } +2024-07-25 21:18:06,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 304/ 1625], loss: 1.182, per_step_time: 1473ms, lr: 2.1917898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:06,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.42860 samples/s/p 3:52:00 } +2024-07-25 21:18:09,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 306/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 2.1912314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:09,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.43233 samples/s/p 3:51:47 } +2024-07-25 21:18:12,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 308/ 1625], loss: 1.331, per_step_time: 1473ms, lr: 2.1906724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:12,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.42850 samples/s/p 3:51:54 } +2024-07-25 21:18:15,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 310/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 2.1901134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:15,347 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.43400 samples/s/p 3:51:37 } +2024-07-25 
21:18:18,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 312/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 2.1895545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:18,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.42787 samples/s/p 3:51:50 } +2024-07-25 21:18:21,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 314/ 1625], loss: 1.071, per_step_time: 1477ms, lr: 2.1889953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:21,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.41463 samples/s/p 3:52:21 } +2024-07-25 21:18:24,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 316/ 1625], loss: 1.104, per_step_time: 1470ms, lr: 2.1884363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:24,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.44108 samples/s/p 3:51:10 } +2024-07-25 21:18:27,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 318/ 1625], loss: 1.022, per_step_time: 1472ms, lr: 2.1878766e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:27,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.43371 samples/s/p 3:51:26 } +2024-07-25 21:18:30,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 320/ 1625], loss: 1.065, per_step_time: 1473ms, lr: 2.1873175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:30,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.43030 samples/s/p 3:51:32 } +2024-07-25 21:18:33,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 322/ 1625], loss: 1.218, 
per_step_time: 1473ms, lr: 2.186758e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:33,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.43036 samples/s/p 3:51:29 } +2024-07-25 21:18:36,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 324/ 1625], loss: 0.832, per_step_time: 1471ms, lr: 2.1861983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:36,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.43494 samples/s/p 3:51:14 } +2024-07-25 21:18:38,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 326/ 1625], loss: 1.284, per_step_time: 1470ms, lr: 2.1856382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:38,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.43976 samples/s/p 3:50:59 } +2024-07-25 21:18:41,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 328/ 1625], loss: 1.301, per_step_time: 1471ms, lr: 2.1850783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:41,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.43741 samples/s/p 3:51:02 } +2024-07-25 21:18:44,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 330/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.1845182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:44,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.43339 samples/s/p 3:51:09 } +2024-07-25 21:18:47,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 332/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 2.183958e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:47,821 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.43529 samples/s/p 3:51:01 } +2024-07-25 21:18:50,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 334/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.1833976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:50,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43591 samples/s/p 3:50:57 } +2024-07-25 21:18:53,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 336/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 2.1828373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:53,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43997 samples/s/p 3:50:44 } +2024-07-25 21:18:56,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 338/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 2.1822767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:56,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43822 samples/s/p 3:50:45 } +2024-07-25 21:18:59,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 340/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.1817159e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:59,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43492 samples/s/p 3:50:51 } +2024-07-25 21:19:02,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 342/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 2.1811553e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:02,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43856 samples/s/p 3:50:38 } 
+2024-07-25 21:19:05,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 344/ 1625], loss: 1.367, per_step_time: 1471ms, lr: 2.1805943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:05,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43787 samples/s/p 3:50:37 } +2024-07-25 21:19:08,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 346/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 2.1800332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:08,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43537 samples/s/p 3:50:41 } +2024-07-25 21:19:11,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 348/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 2.1794722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:11,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43854 samples/s/p 3:50:30 } +2024-07-25 21:19:14,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 350/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 2.1789108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:14,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43917 samples/s/p 3:50:25 } +2024-07-25 21:19:17,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 352/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 2.1783495e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:17,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43511 samples/s/p 3:50:33 } +2024-07-25 21:19:20,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 354/ 1625], loss: 
1.221, per_step_time: 1471ms, lr: 2.177788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:20,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43608 samples/s/p 3:50:27 } +2024-07-25 21:19:23,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 356/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 2.1772265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:23,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.44152 samples/s/p 3:50:10 } +2024-07-25 21:19:26,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 358/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 2.1766646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:26,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43429 samples/s/p 3:50:26 } +2024-07-25 21:19:29,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 360/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.1761029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:29,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43472 samples/s/p 3:50:22 } +2024-07-25 21:19:32,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 362/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 2.1755408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:32,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43075 samples/s/p 3:50:29 } +2024-07-25 21:19:35,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 364/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 2.1749787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:35,020 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.44014 samples/s/p 3:50:02 } +2024-07-25 21:19:37,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 366/ 1625], loss: 1.285, per_step_time: 1471ms, lr: 2.1744167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:37,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43552 samples/s/p 3:50:11 } +2024-07-25 21:19:40,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 368/ 1625], loss: 1.078, per_step_time: 1470ms, lr: 2.1738544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:40,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.44133 samples/s/p 3:49:53 } +2024-07-25 21:19:43,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 370/ 1625], loss: 1.036, per_step_time: 1471ms, lr: 2.173292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:43,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43559 samples/s/p 3:50:05 } +2024-07-25 21:19:46,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 372/ 1625], loss: 0.984, per_step_time: 1469ms, lr: 2.1727295e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:46,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.44452 samples/s/p 3:49:39 } +2024-07-25 21:19:49,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 374/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.1721668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:49,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43491 samples/s/p 3:50:01 } 
+2024-07-25 21:19:52,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 376/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 2.1716038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:52,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43291 samples/s/p 3:50:03 } +2024-07-25 21:19:55,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 378/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.171041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:55,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43414 samples/s/p 3:49:57 } +2024-07-25 21:19:58,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 380/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.170478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:58,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43747 samples/s/p 3:49:45 } +2024-07-25 21:20:01,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 382/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 2.1699154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:01,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43178 samples/s/p 3:49:57 } +2024-07-25 21:20:04,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 384/ 1625], loss: 1.186, per_step_time: 1469ms, lr: 2.169352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:04,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.44422 samples/s/p 3:49:22 } +2024-07-25 21:20:07,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 386/ 1625], loss: 
1.215, per_step_time: 1474ms, lr: 2.1687883e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:07,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.42451 samples/s/p 3:50:09 } +2024-07-25 21:20:10,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 388/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.1682252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:10,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43562 samples/s/p 3:49:38 } +2024-07-25 21:20:13,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 390/ 1625], loss: 1.114, per_step_time: 1473ms, lr: 2.1676618e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:13,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.42906 samples/s/p 3:49:52 } +2024-07-25 21:20:16,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 392/ 1625], loss: 1.020, per_step_time: 1473ms, lr: 2.1670981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:16,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.42935 samples/s/p 3:49:48 } +2024-07-25 21:20:19,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 394/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 2.1665343e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:19,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43119 samples/s/p 3:49:41 } +2024-07-25 21:20:22,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 396/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 2.1659704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:22,235 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43806 samples/s/p 3:49:20 } +2024-07-25 21:20:25,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 398/ 1625], loss: 1.132, per_step_time: 1473ms, lr: 2.1654067e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:25,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43009 samples/s/p 3:49:38 } +2024-07-25 21:20:28,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 400/ 1625], loss: 1.293, per_step_time: 1472ms, lr: 2.1648422e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:28,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.43135 samples/s/p 3:49:31 } +2024-07-25 21:20:31,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 402/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 2.164278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:31,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.43421 samples/s/p 3:49:21 } +2024-07-25 21:20:34,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 404/ 1625], loss: 1.232, per_step_time: 1474ms, lr: 2.1637139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:34,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.42570 samples/s/p 3:49:40 } +2024-07-25 21:20:36,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 406/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 2.1631497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:36,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.44090 samples/s/p 3:48:58 } 
+2024-07-25 21:20:39,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 408/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 2.1625845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:39,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.43184 samples/s/p 3:49:18 } +2024-07-25 21:20:42,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 410/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.1620202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:42,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.43538 samples/s/p 3:49:06 } +2024-07-25 21:20:45,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 412/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 2.1614554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:45,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.44006 samples/s/p 3:48:52 } +2024-07-25 21:20:48,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 414/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.1608905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:48,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.42914 samples/s/p 3:49:16 } +2024-07-25 21:20:51,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 416/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 2.1603255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:51,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43854 samples/s/p 3:48:50 } +2024-07-25 21:20:54,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 418/ 1625], loss: 
1.063, per_step_time: 1470ms, lr: 2.1597603e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:54,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43982 samples/s/p 3:48:43 } +2024-07-25 21:20:57,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 420/ 1625], loss: 1.136, per_step_time: 1473ms, lr: 2.159195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:57,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.42763 samples/s/p 3:49:11 } +2024-07-25 21:21:00,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 422/ 1625], loss: 1.040, per_step_time: 1471ms, lr: 2.1586296e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:00,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43600 samples/s/p 3:48:47 } +2024-07-25 21:21:03,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 424/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.1580643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:03,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43816 samples/s/p 3:48:39 } +2024-07-25 21:21:06,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 426/ 1625], loss: 1.124, per_step_time: 1470ms, lr: 2.1574986e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:06,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.44159 samples/s/p 3:48:27 } +2024-07-25 21:21:09,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 428/ 1625], loss: 1.040, per_step_time: 1470ms, lr: 2.1569329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:09,451 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43910 samples/s/p 3:48:31 } +2024-07-25 21:21:12,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 430/ 1625], loss: 1.228, per_step_time: 1470ms, lr: 2.1563672e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:12,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.44090 samples/s/p 3:48:23 } +2024-07-25 21:21:15,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 432/ 1625], loss: 1.040, per_step_time: 1470ms, lr: 2.1558013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:15,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.44033 samples/s/p 3:48:22 } +2024-07-25 21:21:18,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 434/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.1552352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:18,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.43576 samples/s/p 3:48:30 } +2024-07-25 21:21:21,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 436/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 2.1546688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:21,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.43666 samples/s/p 3:48:25 } +2024-07-25 21:21:24,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 438/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 2.1541025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:24,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.42843 samples/s/p 3:48:43 } 
+2024-07-25 21:21:27,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 440/ 1625], loss: 1.314, per_step_time: 1472ms, lr: 2.1535363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:27,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.43441 samples/s/p 3:48:25 } +2024-07-25 21:21:30,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 442/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.1529699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:30,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.43436 samples/s/p 3:48:22 } +2024-07-25 21:21:33,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 444/ 1625], loss: 1.197, per_step_time: 1473ms, lr: 2.1524032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:33,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.42919 samples/s/p 3:48:32 } +2024-07-25 21:21:36,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 446/ 1625], loss: 1.057, per_step_time: 1469ms, lr: 2.1518365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:36,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.44246 samples/s/p 3:47:56 } +2024-07-25 21:21:38,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 448/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 2.1512697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:38,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43494 samples/s/p 3:48:12 } +2024-07-25 21:21:41,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 450/ 1625], loss: 
1.106, per_step_time: 1472ms, lr: 2.1507029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:41,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43148 samples/s/p 3:48:17 } +2024-07-25 21:21:44,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 452/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 2.1501357e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:44,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43278 samples/s/p 3:48:11 } +2024-07-25 21:21:47,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 454/ 1625], loss: 1.194, per_step_time: 1474ms, lr: 2.1495687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:47,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.42470 samples/s/p 3:48:29 } +2024-07-25 21:21:50,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 456/ 1625], loss: 1.305, per_step_time: 1471ms, lr: 2.1490014e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:50,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43535 samples/s/p 3:47:59 } +2024-07-25 21:21:53,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 458/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.148434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:53,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43207 samples/s/p 3:48:04 } +2024-07-25 21:21:56,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 460/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 2.1478665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:56,670 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43787 samples/s/p 3:47:47 } +2024-07-25 21:21:59,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 462/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.147299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:59,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43695 samples/s/p 3:47:46 } +2024-07-25 21:22:02,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 464/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.1467313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:02,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43444 samples/s/p 3:47:49 } +2024-07-25 21:22:05,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 466/ 1625], loss: 0.995, per_step_time: 1473ms, lr: 2.1461634e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:05,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.42962 samples/s/p 3:47:59 } +2024-07-25 21:22:08,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 468/ 1625], loss: 1.279, per_step_time: 1471ms, lr: 2.1455955e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:08,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43488 samples/s/p 3:47:42 } +2024-07-25 21:22:11,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 470/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 2.1450276e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:11,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43607 samples/s/p 3:47:36 } 
+2024-07-25 21:22:14,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 472/ 1625], loss: 0.970, per_step_time: 1472ms, lr: 2.1444595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:14,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43345 samples/s/p 3:47:40 } +2024-07-25 21:22:17,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 474/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 2.143891e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:17,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.44170 samples/s/p 3:47:16 } +2024-07-25 21:22:20,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 476/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 2.1433229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:20,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43514 samples/s/p 3:47:30 } +2024-07-25 21:22:23,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 478/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 2.1427542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:23,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43123 samples/s/p 3:47:37 } +2024-07-25 21:22:26,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 480/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.1421858e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:26,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43649 samples/s/p 3:47:21 } +2024-07-25 21:22:29,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 482/ 1625], loss: 
1.258, per_step_time: 1470ms, lr: 2.141617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:29,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43848 samples/s/p 3:47:13 } +2024-07-25 21:22:32,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 484/ 1625], loss: 1.018, per_step_time: 1469ms, lr: 2.1410482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:32,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.44300 samples/s/p 3:46:58 } +2024-07-25 21:22:35,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 486/ 1625], loss: 1.282, per_step_time: 1468ms, lr: 2.1404794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:35,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.44697 samples/s/p 3:46:46 } +2024-07-25 21:22:37,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 488/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 2.1399102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:37,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43524 samples/s/p 3:47:12 } +2024-07-25 21:22:40,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 490/ 1625], loss: 1.232, per_step_time: 1470ms, lr: 2.139341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:40,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.44156 samples/s/p 3:46:53 } +2024-07-25 21:22:43,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 492/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.1387721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:43,868 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43415 samples/s/p 3:47:09 } +2024-07-25 21:22:46,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 494/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 2.1382028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:46,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43292 samples/s/p 3:47:09 } +2024-07-25 21:22:49,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 496/ 1625], loss: 1.150, per_step_time: 1470ms, lr: 2.137633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:49,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43948 samples/s/p 3:46:50 } +2024-07-25 21:22:52,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 498/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.1370637e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:52,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43400 samples/s/p 3:47:00 } +2024-07-25 21:22:55,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 500/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.136494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:55,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43749 samples/s/p 3:46:49 } +2024-07-25 21:22:55,671 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 21:23:31,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 502/ 1625], loss: 1.250, per_step_time: 1572ms, lr: 2.1359243e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:31,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.08706 samples/s/p 4:02:23 } +2024-07-25 21:23:34,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 504/ 1625], loss: 1.230, per_step_time: 1475ms, lr: 2.1353544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:34,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.42273 samples/s/p 3:47:20 } +2024-07-25 21:23:37,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 506/ 1625], loss: 1.050, per_step_time: 1472ms, lr: 2.1347843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:37,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43425 samples/s/p 3:46:48 } +2024-07-25 21:23:40,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 508/ 1625], loss: 1.331, per_step_time: 1473ms, lr: 2.1342143e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:40,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43038 samples/s/p 3:46:55 } +2024-07-25 21:23:43,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 510/ 1625], loss: 1.052, per_step_time: 1471ms, lr: 2.133644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:43,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43510 samples/s/p 3:46:40 } +2024-07-25 21:23:46,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 512/ 1625], loss: 
1.202, per_step_time: 1473ms, lr: 2.1330738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:46,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43064 samples/s/p 3:46:48 } +2024-07-25 21:23:49,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 514/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 2.1325033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:49,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43855 samples/s/p 3:46:25 } +2024-07-25 21:23:52,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 516/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 2.1319329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:52,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43109 samples/s/p 3:46:41 } +2024-07-25 21:23:54,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 518/ 1625], loss: 1.164, per_step_time: 1472ms, lr: 2.1313623e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:54,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43159 samples/s/p 3:46:37 } +2024-07-25 21:23:57,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 520/ 1625], loss: 1.310, per_step_time: 1473ms, lr: 2.1307915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:57,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43084 samples/s/p 3:46:36 } +2024-07-25 21:24:00,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 522/ 1625], loss: 1.320, per_step_time: 1471ms, lr: 2.1302207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:00,889 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43769 samples/s/p 3:46:16 } +2024-07-25 21:24:03,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 524/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 2.1296497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:03,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43663 samples/s/p 3:46:16 } +2024-07-25 21:24:06,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 526/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 2.1290785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:06,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43385 samples/s/p 3:46:20 } +2024-07-25 21:24:09,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 528/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.1285074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:09,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43796 samples/s/p 3:46:06 } +2024-07-25 21:24:12,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 530/ 1625], loss: 1.178, per_step_time: 1469ms, lr: 2.1279362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:12,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.44375 samples/s/p 3:45:49 } +2024-07-25 21:24:15,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 532/ 1625], loss: 1.005, per_step_time: 1470ms, lr: 2.1273649e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:15,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43911 samples/s/p 3:45:58 } 
+2024-07-25 21:24:18,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 534/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 2.1267933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:18,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43564 samples/s/p 3:46:03 } +2024-07-25 21:24:21,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 536/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 2.1262214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:21,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43463 samples/s/p 3:46:03 } +2024-07-25 21:24:24,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 538/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 2.1256501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:24,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43558 samples/s/p 3:45:58 } +2024-07-25 21:24:27,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 540/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 2.125078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:27,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43541 samples/s/p 3:45:55 } +2024-07-25 21:24:30,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 542/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 2.1245063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:30,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43612 samples/s/p 3:45:50 } +2024-07-25 21:24:33,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 544/ 1625], loss: 
1.255, per_step_time: 1472ms, lr: 2.1239342e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:33,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43334 samples/s/p 3:45:54 } +2024-07-25 21:24:36,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 546/ 1625], loss: 1.232, per_step_time: 1470ms, lr: 2.1233622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:36,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.44038 samples/s/p 3:45:34 } +2024-07-25 21:24:39,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 548/ 1625], loss: 1.336, per_step_time: 1472ms, lr: 2.12279e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:39,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43350 samples/s/p 3:45:48 } +2024-07-25 21:24:42,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 550/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 2.1222175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:42,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43881 samples/s/p 3:45:32 } +2024-07-25 21:24:45,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 552/ 1625], loss: 0.972, per_step_time: 1471ms, lr: 2.121645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:45,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43740 samples/s/p 3:45:32 } +2024-07-25 21:24:48,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 554/ 1625], loss: 0.905, per_step_time: 1470ms, lr: 2.1210728e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:48,085 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43879 samples/s/p 3:45:26 } +2024-07-25 21:24:51,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 556/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 2.1204998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:51,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43259 samples/s/p 3:45:39 } +2024-07-25 21:24:53,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 558/ 1625], loss: 1.230, per_step_time: 1470ms, lr: 2.119927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:53,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.44003 samples/s/p 3:45:17 } +2024-07-25 21:24:56,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 560/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.1193544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:56,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43392 samples/s/p 3:45:29 } +2024-07-25 21:24:59,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 562/ 1625], loss: 1.079, per_step_time: 1471ms, lr: 2.1187814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:59,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43828 samples/s/p 3:45:16 } +2024-07-25 21:25:02,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 564/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 2.118208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:02,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43865 samples/s/p 3:45:12 } +2024-07-25 
21:25:05,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 566/ 1625], loss: 1.114, per_step_time: 1469ms, lr: 2.1176353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:05,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.44357 samples/s/p 3:44:57 } +2024-07-25 21:25:08,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 568/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 2.117062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:08,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43303 samples/s/p 3:45:20 } +2024-07-25 21:25:11,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 570/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 2.1164886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:11,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43001 samples/s/p 3:45:24 } +2024-07-25 21:25:14,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 572/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 2.1159149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:14,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43245 samples/s/p 3:45:15 } +2024-07-25 21:25:17,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 574/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.1153413e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:17,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43523 samples/s/p 3:45:05 } +2024-07-25 21:25:20,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 576/ 1625], loss: 1.275, 
per_step_time: 1472ms, lr: 2.1147678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:20,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43239 samples/s/p 3:45:10 } +2024-07-25 21:25:23,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 578/ 1625], loss: 0.930, per_step_time: 1469ms, lr: 2.1141937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:23,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.44444 samples/s/p 3:44:37 } +2024-07-25 21:25:26,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 580/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 2.1136198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:26,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.43266 samples/s/p 3:45:03 } +2024-07-25 21:25:29,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 582/ 1625], loss: 1.226, per_step_time: 1474ms, lr: 2.113046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:29,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.42453 samples/s/p 3:45:20 } +2024-07-25 21:25:32,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 584/ 1625], loss: 1.101, per_step_time: 1473ms, lr: 2.1124719e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:32,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.42893 samples/s/p 3:45:06 } +2024-07-25 21:25:35,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 586/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.1118974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:35,305 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.43362 samples/s/p 3:44:52 } +2024-07-25 21:25:38,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 588/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.1113232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:38,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.43841 samples/s/p 3:44:37 } +2024-07-25 21:25:41,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 590/ 1625], loss: 1.181, per_step_time: 1473ms, lr: 2.110749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:41,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.42999 samples/s/p 3:44:55 } +2024-07-25 21:25:44,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 592/ 1625], loss: 1.174, per_step_time: 1473ms, lr: 2.1101741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:44,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.42824 samples/s/p 3:44:56 } +2024-07-25 21:25:47,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 594/ 1625], loss: 0.993, per_step_time: 1472ms, lr: 2.1095995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:47,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.43478 samples/s/p 3:44:37 } +2024-07-25 21:25:50,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 596/ 1625], loss: 1.296, per_step_time: 1471ms, lr: 2.1090249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:50,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.43582 samples/s/p 3:44:32 } 
+2024-07-25 21:25:53,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 598/ 1625], loss: 1.360, per_step_time: 1470ms, lr: 2.1084501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:53,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.44026 samples/s/p 3:44:18 } +2024-07-25 21:25:55,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 600/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 2.107875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:55,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.44040 samples/s/p 3:44:14 } +2024-07-25 21:25:58,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 602/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.1073e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:58,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.43722 samples/s/p 3:44:19 } +2024-07-25 21:26:01,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 604/ 1625], loss: 1.125, per_step_time: 1473ms, lr: 2.106725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:01,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.42991 samples/s/p 3:44:34 } +2024-07-25 21:26:04,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 606/ 1625], loss: 1.317, per_step_time: 1473ms, lr: 2.1061498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:04,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.43078 samples/s/p 3:44:29 } +2024-07-25 21:26:07,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 608/ 1625], loss: 
1.133, per_step_time: 1474ms, lr: 2.1055741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:07,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.42741 samples/s/p 3:44:35 } +2024-07-25 21:26:10,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 610/ 1625], loss: 1.201, per_step_time: 1470ms, lr: 2.104999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:10,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.44190 samples/s/p 3:43:56 } +2024-07-25 21:26:13,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 612/ 1625], loss: 1.081, per_step_time: 1469ms, lr: 2.1044234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:13,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.44407 samples/s/p 3:43:48 } +2024-07-25 21:26:16,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 614/ 1625], loss: 1.191, per_step_time: 1470ms, lr: 2.1038477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:16,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43955 samples/s/p 3:43:56 } +2024-07-25 21:26:19,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 616/ 1625], loss: 1.025, per_step_time: 1472ms, lr: 2.1032718e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:19,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43472 samples/s/p 3:44:05 } +2024-07-25 21:26:22,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 618/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.1026959e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:22,517 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43393 samples/s/p 3:44:04 } +2024-07-25 21:26:25,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 620/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.1021202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:25,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43407 samples/s/p 3:44:01 } +2024-07-25 21:26:28,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 622/ 1625], loss: 1.302, per_step_time: 1471ms, lr: 2.101544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:28,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43495 samples/s/p 3:43:55 } +2024-07-25 21:26:31,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 624/ 1625], loss: 1.141, per_step_time: 1475ms, lr: 2.1009677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:31,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.42259 samples/s/p 3:44:23 } +2024-07-25 21:26:34,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 626/ 1625], loss: 1.191, per_step_time: 1474ms, lr: 2.1003914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:34,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.42543 samples/s/p 3:44:13 } +2024-07-25 21:26:37,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 628/ 1625], loss: 1.325, per_step_time: 1484ms, lr: 2.0998152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:37,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.38987 samples/s/p 3:45:39 } 
+2024-07-25 21:26:40,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 630/ 1625], loss: 0.967, per_step_time: 1470ms, lr: 2.0992386e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:40,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.44217 samples/s/p 3:43:26 } +2024-07-25 21:26:43,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 632/ 1625], loss: 1.023, per_step_time: 1470ms, lr: 2.0986621e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:43,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.44024 samples/s/p 3:43:28 } +2024-07-25 21:26:46,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 634/ 1625], loss: 1.285, per_step_time: 1477ms, lr: 2.0980855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:46,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.41450 samples/s/p 3:44:29 } +2024-07-25 21:26:49,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 636/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.0975087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:49,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.43687 samples/s/p 3:43:30 } +2024-07-25 21:26:52,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 638/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 2.0969317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:52,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.43566 samples/s/p 3:43:30 } +2024-07-25 21:26:55,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 640/ 1625], loss: 
1.043, per_step_time: 1471ms, lr: 2.0963547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:55,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.43608 samples/s/p 3:43:26 } +2024-07-25 21:26:57,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 642/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 2.0957777e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:57,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.43463 samples/s/p 3:43:27 } +2024-07-25 21:27:00,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 644/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.0952004e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:00,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.43148 samples/s/p 3:43:32 } +2024-07-25 21:27:03,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 646/ 1625], loss: 0.978, per_step_time: 1472ms, lr: 2.094623e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:03,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.43219 samples/s/p 3:43:27 } +2024-07-25 21:27:06,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 648/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.0940459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:06,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.43756 samples/s/p 3:43:11 } +2024-07-25 21:27:09,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 650/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 2.0934684e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:09,778 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.42930 samples/s/p 3:43:28 } +2024-07-25 21:27:12,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 652/ 1625], loss: 0.972, per_step_time: 1473ms, lr: 2.0928905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:12,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.43068 samples/s/p 3:43:22 } +2024-07-25 21:27:15,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 654/ 1625], loss: 1.386, per_step_time: 1470ms, lr: 2.0923131e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:15,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.43977 samples/s/p 3:42:57 } +2024-07-25 21:27:18,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 656/ 1625], loss: 0.980, per_step_time: 1473ms, lr: 2.0917352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:18,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.42915 samples/s/p 3:43:20 } +2024-07-25 21:27:21,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 658/ 1625], loss: 1.278, per_step_time: 1473ms, lr: 2.0911573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:21,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.42751 samples/s/p 3:43:21 } +2024-07-25 21:27:24,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 660/ 1625], loss: 1.027, per_step_time: 1482ms, lr: 2.0905793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:24,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.39662 samples/s/p 3:44:35 } 
+2024-07-25 21:27:27,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 662/ 1625], loss: 1.356, per_step_time: 1473ms, lr: 2.0900014e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:27,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.42854 samples/s/p 3:43:12 } +2024-07-25 21:27:30,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 664/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 2.0894231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:30,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43886 samples/s/p 3:42:44 } +2024-07-25 21:27:33,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 666/ 1625], loss: 1.173, per_step_time: 1470ms, lr: 2.0888447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:33,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43869 samples/s/p 3:42:42 } +2024-07-25 21:27:36,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 668/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.0882664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:36,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43499 samples/s/p 3:42:48 } +2024-07-25 21:27:39,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 670/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 2.087688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:39,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43414 samples/s/p 3:42:47 } +2024-07-25 21:27:42,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 672/ 1625], 
loss: 1.095, per_step_time: 1470ms, lr: 2.0871095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:42,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43906 samples/s/p 3:42:32 } +2024-07-25 21:27:45,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 674/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 2.0865305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:45,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43091 samples/s/p 3:42:49 } +2024-07-25 21:27:48,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 676/ 1625], loss: 0.871, per_step_time: 1471ms, lr: 2.085952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:48,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43586 samples/s/p 3:42:34 } +2024-07-25 21:27:51,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 678/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 2.085373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:51,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43659 samples/s/p 3:42:29 } +2024-07-25 21:27:54,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 680/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 2.0847941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:54,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43367 samples/s/p 3:42:33 } +2024-07-25 21:27:57,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 682/ 1625], loss: 1.056, per_step_time: 1473ms, lr: 2.084215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:57,024 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.42856 samples/s/p 3:42:43 } +2024-07-25 21:27:59,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 684/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 2.0836358e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:59,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43610 samples/s/p 3:42:21 } +2024-07-25 21:28:02,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 686/ 1625], loss: 1.146, per_step_time: 1469ms, lr: 2.0830565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:02,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.44301 samples/s/p 3:42:02 } +2024-07-25 21:28:05,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 688/ 1625], loss: 1.201, per_step_time: 1471ms, lr: 2.0824771e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:05,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43596 samples/s/p 3:42:16 } +2024-07-25 21:28:08,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 690/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 2.0818976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:08,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43645 samples/s/p 3:42:12 } +2024-07-25 21:28:11,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 692/ 1625], loss: 1.278, per_step_time: 1470ms, lr: 2.081318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:11,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.44062 samples/s/p 3:41:59 } 
+2024-07-25 21:28:14,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 694/ 1625], loss: 1.112, per_step_time: 1470ms, lr: 2.0807383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:14,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.44076 samples/s/p 3:41:55 } +2024-07-25 21:28:17,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 696/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 2.0801584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:17,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43738 samples/s/p 3:42:01 } +2024-07-25 21:28:20,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 698/ 1625], loss: 1.093, per_step_time: 1474ms, lr: 2.0795787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:20,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.42650 samples/s/p 3:42:24 } +2024-07-25 21:28:23,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 700/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 2.0789988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:23,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43370 samples/s/p 3:42:04 } +2024-07-25 21:28:26,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 702/ 1625], loss: 0.915, per_step_time: 1472ms, lr: 2.0784188e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:26,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43463 samples/s/p 3:41:59 } +2024-07-25 21:28:29,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 704/ 1625], 
loss: 1.225, per_step_time: 1472ms, lr: 2.0778387e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:29,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43200 samples/s/p 3:42:02 } +2024-07-25 21:28:32,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 706/ 1625], loss: 1.000, per_step_time: 1471ms, lr: 2.0772584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:32,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43765 samples/s/p 3:41:45 } +2024-07-25 21:28:35,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 708/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 2.076678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:35,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43780 samples/s/p 3:41:42 } +2024-07-25 21:28:38,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 710/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.0760977e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:38,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43291 samples/s/p 3:41:51 } +2024-07-25 21:28:41,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 712/ 1625], loss: 1.262, per_step_time: 1473ms, lr: 2.075517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:41,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43039 samples/s/p 3:41:54 } +2024-07-25 21:28:44,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 714/ 1625], loss: 1.122, per_step_time: 1473ms, lr: 2.0749363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:44,237 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.42918 samples/s/p 3:41:54 } +2024-07-25 21:28:47,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 716/ 1625], loss: 1.010, per_step_time: 1472ms, lr: 2.0743557e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:47,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43193 samples/s/p 3:41:45 } +2024-07-25 21:28:50,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 718/ 1625], loss: 1.174, per_step_time: 1474ms, lr: 2.0737749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:50,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.42403 samples/s/p 3:42:01 } +2024-07-25 21:28:53,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 720/ 1625], loss: 1.335, per_step_time: 1472ms, lr: 2.0731939e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:53,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43267 samples/s/p 3:41:37 } +2024-07-25 21:28:56,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 722/ 1625], loss: 0.934, per_step_time: 1471ms, lr: 2.0726127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:56,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43614 samples/s/p 3:41:25 } +2024-07-25 21:28:58,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 724/ 1625], loss: 1.010, per_step_time: 1471ms, lr: 2.0720316e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:58,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43690 samples/s/p 3:41:21 } 
+2024-07-25 21:29:01,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 726/ 1625], loss: 1.059, per_step_time: 1471ms, lr: 2.0714504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:01,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43712 samples/s/p 3:41:17 } +2024-07-25 21:29:04,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 728/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 2.070869e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:04,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43128 samples/s/p 3:41:28 } +2024-07-25 21:29:07,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 730/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.0702877e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:07,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43174 samples/s/p 3:41:24 } +2024-07-25 21:29:10,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 732/ 1625], loss: 1.021, per_step_time: 1471ms, lr: 2.0697064e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:10,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43584 samples/s/p 3:41:11 } +2024-07-25 21:29:13,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 734/ 1625], loss: 1.251, per_step_time: 1470ms, lr: 2.0691246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:13,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43887 samples/s/p 3:41:01 } +2024-07-25 21:29:16,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 736/ 1625], 
loss: 1.297, per_step_time: 1472ms, lr: 2.0685427e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:16,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43128 samples/s/p 3:41:17 } +2024-07-25 21:29:19,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 738/ 1625], loss: 1.010, per_step_time: 1471ms, lr: 2.067961e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:19,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43665 samples/s/p 3:41:01 } +2024-07-25 21:29:22,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 740/ 1625], loss: 0.985, per_step_time: 1471ms, lr: 2.0673793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:22,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43718 samples/s/p 3:40:56 } +2024-07-25 21:29:25,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 742/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 2.066797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:25,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43178 samples/s/p 3:41:07 } +2024-07-25 21:29:28,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 744/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.0662152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:28,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43167 samples/s/p 3:41:04 } +2024-07-25 21:29:31,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 746/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.0656329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:31,461 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43763 samples/s/p 3:40:46 } +2024-07-25 21:29:34,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 748/ 1625], loss: 1.234, per_step_time: 1473ms, lr: 2.0650506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:34,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43072 samples/s/p 3:41:00 } +2024-07-25 21:29:37,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 750/ 1625], loss: 1.084, per_step_time: 1470ms, lr: 2.0644682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:37,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43954 samples/s/p 3:40:36 } +2024-07-25 21:29:40,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 752/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.0638858e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:40,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43292 samples/s/p 3:40:49 } +2024-07-25 21:29:43,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 754/ 1625], loss: 1.248, per_step_time: 1473ms, lr: 2.0633033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:43,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.42996 samples/s/p 3:40:53 } +2024-07-25 21:29:46,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 756/ 1625], loss: 1.096, per_step_time: 1470ms, lr: 2.0627205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:46,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43925 samples/s/p 3:40:28 } 
+2024-07-25 21:29:49,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 758/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 2.0621379e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:49,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43625 samples/s/p 3:40:32 } +2024-07-25 21:29:52,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 760/ 1625], loss: 1.150, per_step_time: 1469ms, lr: 2.061555e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:52,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.44226 samples/s/p 3:40:15 } +2024-07-25 21:29:55,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 762/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 2.0609721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:55,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43854 samples/s/p 3:40:21 } +2024-07-25 21:29:58,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 764/ 1625], loss: 1.228, per_step_time: 1470ms, lr: 2.060389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:58,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43949 samples/s/p 3:40:15 } +2024-07-25 21:30:00,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 766/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 2.0598058e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:00,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43509 samples/s/p 3:40:23 } +2024-07-25 21:30:03,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 768/ 1625], 
loss: 1.248, per_step_time: 1470ms, lr: 2.0592226e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:03,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.44053 samples/s/p 3:40:07 } +2024-07-25 21:30:06,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 770/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 2.0586393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:06,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.44118 samples/s/p 3:40:03 } +2024-07-25 21:30:09,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 772/ 1625], loss: 1.294, per_step_time: 1473ms, lr: 2.0580559e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:09,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43064 samples/s/p 3:40:25 } +2024-07-25 21:30:12,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 774/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 2.0574724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:12,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43151 samples/s/p 3:40:20 } +2024-07-25 21:30:15,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 776/ 1625], loss: 1.111, per_step_time: 1473ms, lr: 2.056889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:15,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43102 samples/s/p 3:40:18 } +2024-07-25 21:30:18,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 778/ 1625], loss: 1.016, per_step_time: 1471ms, lr: 2.0563051e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:18,668 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43596 samples/s/p 3:40:03 } +2024-07-25 21:30:21,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 780/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.0557212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:21,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43825 samples/s/p 3:39:55 } +2024-07-25 21:30:24,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 782/ 1625], loss: 1.120, per_step_time: 1470ms, lr: 2.0551375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:24,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.44167 samples/s/p 3:39:44 } +2024-07-25 21:30:27,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 784/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.0545536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:27,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43341 samples/s/p 3:40:01 } +2024-07-25 21:30:30,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 786/ 1625], loss: 0.979, per_step_time: 1470ms, lr: 2.0539694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:30,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.44018 samples/s/p 3:39:41 } +2024-07-25 21:30:33,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 788/ 1625], loss: 1.204, per_step_time: 1470ms, lr: 2.0533853e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:33,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.44038 samples/s/p 3:39:38 } 
+2024-07-25 21:30:36,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 790/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 2.052801e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:36,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43805 samples/s/p 3:39:41 } +2024-07-25 21:30:39,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 792/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 2.0522168e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:39,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43751 samples/s/p 3:39:39 } +2024-07-25 21:30:42,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 794/ 1625], loss: 1.101, per_step_time: 1473ms, lr: 2.0516321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:42,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.42937 samples/s/p 3:39:56 } +2024-07-25 21:30:45,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 796/ 1625], loss: 1.198, per_step_time: 1470ms, lr: 2.0510477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:45,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43939 samples/s/p 3:39:29 } +2024-07-25 21:30:48,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 798/ 1625], loss: 1.084, per_step_time: 1472ms, lr: 2.0504633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:48,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43293 samples/s/p 3:39:41 } +2024-07-25 21:30:51,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 800/ 1625], 
loss: 1.069, per_step_time: 1470ms, lr: 2.0498783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:51,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43857 samples/s/p 3:39:25 } +2024-07-25 21:30:54,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 802/ 1625], loss: 1.080, per_step_time: 1472ms, lr: 2.0492935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:54,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43200 samples/s/p 3:39:38 } +2024-07-25 21:30:57,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 804/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 2.0487088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:57,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43182 samples/s/p 3:39:35 } +2024-07-25 21:30:59,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 806/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 2.0481237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:59,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43816 samples/s/p 3:39:17 } +2024-07-25 21:31:02,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 808/ 1625], loss: 1.045, per_step_time: 1471ms, lr: 2.0475385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:02,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43488 samples/s/p 3:39:22 } +2024-07-25 21:31:05,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 810/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 2.0469535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:05,875 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.42952 samples/s/p 3:39:32 } +2024-07-25 21:31:08,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 812/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.0463682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:08,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43228 samples/s/p 3:39:22 } +2024-07-25 21:31:11,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 814/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.0457828e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:11,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43565 samples/s/p 3:39:11 } +2024-07-25 21:31:14,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 816/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 2.0451973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:14,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43381 samples/s/p 3:39:13 } +2024-07-25 21:31:17,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 818/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 2.044612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:17,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43264 samples/s/p 3:39:13 } +2024-07-25 21:31:20,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 820/ 1625], loss: 1.078, per_step_time: 1470ms, lr: 2.0440262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:20,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43863 samples/s/p 3:38:55 } 
+2024-07-25 21:31:23,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 822/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.0434405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:23,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43265 samples/s/p 3:39:07 } +2024-07-25 21:31:26,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 824/ 1625], loss: 1.036, per_step_time: 1476ms, lr: 2.0428546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:26,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.41968 samples/s/p 3:39:35 } +2024-07-25 21:31:29,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 826/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.0422689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:29,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43287 samples/s/p 3:39:00 } +2024-07-25 21:31:32,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 828/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.0416826e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:32,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43260 samples/s/p 3:38:58 } +2024-07-25 21:31:35,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 830/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 2.0410966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:35,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43743 samples/s/p 3:38:43 } +2024-07-25 21:31:38,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 832/ 1625], 
loss: 1.395, per_step_time: 1473ms, lr: 2.0405107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:38,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.42996 samples/s/p 3:38:58 } +2024-07-25 21:31:41,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 834/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 2.0399242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:41,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.44014 samples/s/p 3:38:31 } +2024-07-25 21:31:44,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 836/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 2.039338e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:44,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43684 samples/s/p 3:38:36 } +2024-07-25 21:31:47,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 838/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 2.0387515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:47,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.42839 samples/s/p 3:38:53 } +2024-07-25 21:31:50,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 840/ 1625], loss: 0.995, per_step_time: 1473ms, lr: 2.0381647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:50,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.43061 samples/s/p 3:38:45 } +2024-07-25 21:31:53,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 842/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 2.037578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:53,105 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.44069 samples/s/p 3:38:18 } +2024-07-25 21:31:56,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 844/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 2.0369915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:56,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.43392 samples/s/p 3:38:31 } +2024-07-25 21:31:59,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 846/ 1625], loss: 1.166, per_step_time: 1470ms, lr: 2.0364047e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:59,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.44161 samples/s/p 3:38:10 } +2024-07-25 21:32:01,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 848/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 2.035818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:01,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.43198 samples/s/p 3:38:30 } +2024-07-25 21:32:04,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 850/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.0352309e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:04,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.43521 samples/s/p 3:38:19 } +2024-07-25 21:32:07,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 852/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.0346435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:07,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.43413 samples/s/p 3:38:19 } 
+2024-07-25 21:32:10,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 854/ 1625], loss: 0.939, per_step_time: 1472ms, lr: 2.0340565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:10,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43421 samples/s/p 3:38:16 } +2024-07-25 21:32:13,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 856/ 1625], loss: 1.208, per_step_time: 1470ms, lr: 2.0334694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:13,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43919 samples/s/p 3:38:01 } +2024-07-25 21:32:16,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 858/ 1625], loss: 1.230, per_step_time: 1470ms, lr: 2.032882e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:16,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43862 samples/s/p 3:37:59 } +2024-07-25 21:32:19,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 860/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 2.0322945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:19,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43231 samples/s/p 3:38:12 } +2024-07-25 21:32:22,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 862/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 2.031707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:22,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43367 samples/s/p 3:38:05 } +2024-07-25 21:32:25,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 864/ 1625], 
loss: 1.254, per_step_time: 1471ms, lr: 2.0311192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:25,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43729 samples/s/p 3:37:54 } +2024-07-25 21:32:28,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 866/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 2.0305315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:28,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43241 samples/s/p 3:38:02 } +2024-07-25 21:32:31,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 868/ 1625], loss: 1.173, per_step_time: 1473ms, lr: 2.0299438e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:31,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43090 samples/s/p 3:38:03 } +2024-07-25 21:32:34,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 870/ 1625], loss: 1.496, per_step_time: 1473ms, lr: 2.0293563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:34,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43108 samples/s/p 3:38:00 } +2024-07-25 21:32:37,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 872/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 2.0287682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:37,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43790 samples/s/p 3:37:40 } +2024-07-25 21:32:40,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 874/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.0281801e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:40,322 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.42886 samples/s/p 3:37:59 } +2024-07-25 21:32:43,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 876/ 1625], loss: 1.132, per_step_time: 1469ms, lr: 2.0275918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:43,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.44451 samples/s/p 3:37:19 } +2024-07-25 21:32:46,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 878/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 2.0270036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:46,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43487 samples/s/p 3:37:39 } +2024-07-25 21:32:49,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 880/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 2.0264153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:49,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43752 samples/s/p 3:37:30 } +2024-07-25 21:32:52,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 882/ 1625], loss: 1.227, per_step_time: 1470ms, lr: 2.0258269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:52,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.44193 samples/s/p 3:37:16 } +2024-07-25 21:32:55,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 884/ 1625], loss: 1.025, per_step_time: 1470ms, lr: 2.0252384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:55,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43931 samples/s/p 3:37:19 } 
+2024-07-25 21:32:58,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 886/ 1625], loss: 1.130, per_step_time: 1474ms, lr: 2.0246498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:58,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.42634 samples/s/p 3:37:48 } +2024-07-25 21:33:00,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 888/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 2.0240614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:00,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43384 samples/s/p 3:37:27 } +2024-07-25 21:33:03,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 890/ 1625], loss: 1.203, per_step_time: 1473ms, lr: 2.0234722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:03,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43093 samples/s/p 3:37:31 } +2024-07-25 21:33:06,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 892/ 1625], loss: 1.001, per_step_time: 1471ms, lr: 2.0228836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:06,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43635 samples/s/p 3:37:15 } +2024-07-25 21:33:09,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 894/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.0222948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:09,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43726 samples/s/p 3:37:10 } +2024-07-25 21:33:12,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 896/ 1625], 
loss: 1.188, per_step_time: 1471ms, lr: 2.0217056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:12,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43527 samples/s/p 3:37:11 } +2024-07-25 21:33:15,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 898/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 2.0211166e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:15,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43830 samples/s/p 3:37:01 } +2024-07-25 21:33:18,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 900/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 2.0205272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:18,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43733 samples/s/p 3:37:01 } +2024-07-25 21:33:21,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 902/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 2.019938e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:21,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43435 samples/s/p 3:37:05 } +2024-07-25 21:33:24,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 904/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 2.0193487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:24,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43541 samples/s/p 3:36:59 } +2024-07-25 21:33:27,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 906/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.0187592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:27,527 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43491 samples/s/p 3:36:58 } +2024-07-25 21:33:30,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 908/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 2.0181697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:30,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.42752 samples/s/p 3:37:12 } +2024-07-25 21:33:33,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 910/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 2.0175801e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:33,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43666 samples/s/p 3:36:47 } +2024-07-25 21:33:36,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 912/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 2.0169902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:36,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43564 samples/s/p 3:36:47 } +2024-07-25 21:33:39,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 914/ 1625], loss: 1.225, per_step_time: 1470ms, lr: 2.0164005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:39,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43879 samples/s/p 3:36:37 } +2024-07-25 21:33:42,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 916/ 1625], loss: 1.342, per_step_time: 1471ms, lr: 2.0158106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:42,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43540 samples/s/p 3:36:42 } 
+2024-07-25 21:33:45,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 918/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.0152207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:45,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43406 samples/s/p 3:36:42 } +2024-07-25 21:33:48,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 920/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 2.0146306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:48,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43831 samples/s/p 3:36:29 } +2024-07-25 21:33:51,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 922/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.0140405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:51,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43439 samples/s/p 3:36:35 } +2024-07-25 21:33:54,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 924/ 1625], loss: 1.096, per_step_time: 1473ms, lr: 2.0134501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:54,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.42994 samples/s/p 3:36:43 } +2024-07-25 21:33:57,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 926/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.0128598e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:57,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43174 samples/s/p 3:36:36 } +2024-07-25 21:33:59,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 928/ 1625], 
loss: 1.233, per_step_time: 1472ms, lr: 2.0122696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:59,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43286 samples/s/p 3:36:30 } +2024-07-25 21:34:02,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 930/ 1625], loss: 1.146, per_step_time: 1474ms, lr: 2.011679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:02,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.42539 samples/s/p 3:36:45 } +2024-07-25 21:34:05,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 932/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 2.0110887e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:05,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43715 samples/s/p 3:36:14 } +2024-07-25 21:34:08,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 934/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.0104979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:08,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43382 samples/s/p 3:36:19 } +2024-07-25 21:34:11,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 936/ 1625], loss: 1.020, per_step_time: 1472ms, lr: 2.009907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:11,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43461 samples/s/p 3:36:14 } +2024-07-25 21:34:14,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 938/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.0093163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:14,752 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43511 samples/s/p 3:36:10 } +2024-07-25 21:34:17,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 940/ 1625], loss: 1.311, per_step_time: 1471ms, lr: 2.0087255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:17,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43752 samples/s/p 3:36:01 } +2024-07-25 21:34:20,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 942/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 2.0081343e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:20,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43348 samples/s/p 3:36:08 } +2024-07-25 21:34:23,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 944/ 1625], loss: 1.009, per_step_time: 1471ms, lr: 2.0075433e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:23,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43539 samples/s/p 3:36:00 } +2024-07-25 21:34:26,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 946/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 2.0069521e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:26,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43518 samples/s/p 3:35:58 } +2024-07-25 21:34:29,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 948/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 2.0063608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:29,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43395 samples/s/p 3:35:58 } 
+2024-07-25 21:34:32,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 950/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.0057694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:32,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43166 samples/s/p 3:36:01 } +2024-07-25 21:34:35,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 952/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.005178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:35,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43301 samples/s/p 3:35:54 } +2024-07-25 21:34:38,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 954/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 2.0045867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:38,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43502 samples/s/p 3:35:47 } +2024-07-25 21:34:41,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 956/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 2.003995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:41,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.42943 samples/s/p 3:35:57 } +2024-07-25 21:34:44,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 958/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 2.0034033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:44,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43511 samples/s/p 3:35:41 } +2024-07-25 21:34:47,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 960/ 1625], 
loss: 1.185, per_step_time: 1469ms, lr: 2.0028117e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:47,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.44337 samples/s/p 3:35:18 } +2024-07-25 21:34:50,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 962/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 2.0022198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:50,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43783 samples/s/p 3:35:28 } +2024-07-25 21:34:53,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 964/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 2.0016278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:53,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43514 samples/s/p 3:35:32 } +2024-07-25 21:34:56,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 966/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.0010359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:56,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43211 samples/s/p 3:35:36 } +2024-07-25 21:34:59,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 968/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.0004436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:59,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.43693 samples/s/p 3:35:21 } +2024-07-25 21:35:01,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 970/ 1625], loss: 1.516, per_step_time: 1472ms, lr: 1.9998517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:01,968 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.43111 samples/s/p 3:35:32 } +2024-07-25 21:35:04,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 972/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 1.9992593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:04,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.43123 samples/s/p 3:35:29 } +2024-07-25 21:35:07,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 974/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 1.998667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:07,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.43240 samples/s/p 3:35:23 } +2024-07-25 21:35:10,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 976/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 1.9980747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:10,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.43699 samples/s/p 3:35:10 } +2024-07-25 21:35:13,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 978/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 1.997482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:13,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.43508 samples/s/p 3:35:11 } +2024-07-25 21:35:16,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 980/ 1625], loss: 1.328, per_step_time: 1473ms, lr: 1.9968895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:16,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.42985 samples/s/p 3:35:21 } 
+2024-07-25 21:35:19,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 982/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 1.9962969e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:19,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.43628 samples/s/p 3:35:02 } +2024-07-25 21:35:22,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 984/ 1625], loss: 1.296, per_step_time: 1472ms, lr: 1.9957042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:22,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43282 samples/s/p 3:35:08 } +2024-07-25 21:35:25,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 986/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 1.995111e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:25,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.42846 samples/s/p 3:35:15 } +2024-07-25 21:35:28,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 988/ 1625], loss: 1.168, per_step_time: 1475ms, lr: 1.9945184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:28,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.42240 samples/s/p 3:35:27 } +2024-07-25 21:35:31,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 990/ 1625], loss: 1.241, per_step_time: 1474ms, lr: 1.9939254e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:31,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.42731 samples/s/p 3:35:12 } +2024-07-25 21:35:34,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 992/ 
1625], loss: 1.309, per_step_time: 1472ms, lr: 1.9933323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:34,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43304 samples/s/p 3:34:55 } +2024-07-25 21:35:37,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 994/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.992739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:37,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43155 samples/s/p 3:34:56 } +2024-07-25 21:35:40,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 996/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 1.992146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:40,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.44045 samples/s/p 3:34:32 } +2024-07-25 21:35:43,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 998/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.9915527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:43,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43696 samples/s/p 3:34:37 } +2024-07-25 21:35:46,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1000/ 1625], loss: 1.265, per_step_time: 1470ms, lr: 1.9909592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:46,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.44197 samples/s/p 3:34:22 } +2024-07-25 21:35:49,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1002/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 1.9903657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:49,196 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.44003 samples/s/p 3:34:24 } +2024-07-25 21:35:52,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1004/ 1625], loss: 1.021, per_step_time: 1471ms, lr: 1.9897721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:52,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43571 samples/s/p 3:34:31 } +2024-07-25 21:35:55,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1006/ 1625], loss: 1.312, per_step_time: 1470ms, lr: 1.9891784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:55,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43984 samples/s/p 3:34:19 } +2024-07-25 21:35:58,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1008/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.9885845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:58,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43413 samples/s/p 3:34:29 } +2024-07-25 21:36:00,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1010/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 1.987991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:00,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43834 samples/s/p 3:34:16 } +2024-07-25 21:36:03,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1012/ 1625], loss: 1.063, per_step_time: 1472ms, lr: 1.987397e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:03,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43290 samples/s/p 
3:34:26 } +2024-07-25 21:36:06,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1014/ 1625], loss: 1.076, per_step_time: 1472ms, lr: 1.9868032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:06,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43342 samples/s/p 3:34:22 } +2024-07-25 21:36:09,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1016/ 1625], loss: 1.047, per_step_time: 1474ms, lr: 1.986209e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:09,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.42677 samples/s/p 3:34:35 } +2024-07-25 21:36:12,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1018/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 1.9856148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:12,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43342 samples/s/p 3:34:16 } +2024-07-25 21:36:15,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1020/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 1.9850208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:15,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43227 samples/s/p 3:34:16 } +2024-07-25 21:36:18,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1022/ 1625], loss: 1.033, per_step_time: 1473ms, lr: 1.9844263e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:18,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.42951 samples/s/p 3:34:20 } +2024-07-25 21:36:21,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], 
step:[ 1024/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 1.9838319e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:21,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43292 samples/s/p 3:34:09 } +2024-07-25 21:36:24,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1026/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 1.9832376e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:24,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43631 samples/s/p 3:33:58 } +2024-07-25 21:36:27,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1028/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.982643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:27,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43160 samples/s/p 3:34:06 } +2024-07-25 21:36:30,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1030/ 1625], loss: 1.205, per_step_time: 1473ms, lr: 1.9820483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:30,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43066 samples/s/p 3:34:05 } +2024-07-25 21:36:33,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1032/ 1625], loss: 1.327, per_step_time: 1472ms, lr: 1.9814537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:33,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43361 samples/s/p 3:33:55 } +2024-07-25 21:36:36,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1034/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.980859e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:36:36,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43716 samples/s/p 3:33:44 } +2024-07-25 21:36:39,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1036/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 1.9802641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:39,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43332 samples/s/p 3:33:50 } +2024-07-25 21:36:42,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1038/ 1625], loss: 1.288, per_step_time: 1470ms, lr: 1.9796691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:42,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43957 samples/s/p 3:33:32 } +2024-07-25 21:36:45,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1040/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 1.9790741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:45,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43144 samples/s/p 3:33:49 } +2024-07-25 21:36:48,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1042/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 1.978479e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:48,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43752 samples/s/p 3:33:31 } +2024-07-25 21:36:51,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1044/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 1.977884e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:51,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ 
| 5.43958 samples/s/p 3:33:23 } +2024-07-25 21:36:54,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1046/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 1.9772886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:54,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43329 samples/s/p 3:33:35 } +2024-07-25 21:36:57,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1048/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 1.9766934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:57,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43860 samples/s/p 3:33:20 } +2024-07-25 21:37:00,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1050/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 1.9760979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:00,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43634 samples/s/p 3:33:22 } +2024-07-25 21:37:02,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1052/ 1625], loss: 1.098, per_step_time: 1473ms, lr: 1.9755025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:02,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43015 samples/s/p 3:33:34 } +2024-07-25 21:37:05,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1054/ 1625], loss: 1.008, per_step_time: 1471ms, lr: 1.974907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:05,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43545 samples/s/p 3:33:18 } +2024-07-25 21:37:08,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 5/ 10], step:[ 1056/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.9743113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:08,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43320 samples/s/p 3:33:21 } +2024-07-25 21:37:11,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1058/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.9737156e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:11,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43246 samples/s/p 3:33:20 } +2024-07-25 21:37:14,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1060/ 1625], loss: 1.250, per_step_time: 1480ms, lr: 1.9731197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:14,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.40235 samples/s/p 3:34:28 } +2024-07-25 21:37:17,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1062/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.972524e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:17,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43540 samples/s/p 3:33:07 } +2024-07-25 21:37:20,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1064/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 1.9719278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:20,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.42868 samples/s/p 3:33:20 } +2024-07-25 21:37:23,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1066/ 1625], loss: 1.407, per_step_time: 1471ms, lr: 1.971332e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:37:23,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43511 samples/s/p 3:33:02 } +2024-07-25 21:37:26,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1068/ 1625], loss: 0.973, per_step_time: 1471ms, lr: 1.9707357e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:26,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43508 samples/s/p 3:32:59 } +2024-07-25 21:37:29,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1070/ 1625], loss: 1.111, per_step_time: 1473ms, lr: 1.9701396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:29,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.42774 samples/s/p 3:33:13 } +2024-07-25 21:37:32,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1072/ 1625], loss: 1.250, per_step_time: 1470ms, lr: 1.9695433e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:32,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43936 samples/s/p 3:32:43 } +2024-07-25 21:37:35,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1074/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 1.968947e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:35,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43747 samples/s/p 3:32:44 } +2024-07-25 21:37:38,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1076/ 1625], loss: 1.285, per_step_time: 1472ms, lr: 1.9683506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:38,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% 
|███████████████████████ | 5.43443 samples/s/p 3:32:48 } +2024-07-25 21:37:41,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1078/ 1625], loss: 1.221, per_step_time: 1473ms, lr: 1.967754e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:41,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43041 samples/s/p 3:32:55 } +2024-07-25 21:37:44,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1080/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 1.9671574e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:44,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43812 samples/s/p 3:32:34 } +2024-07-25 21:37:47,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1082/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.966561e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:47,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43797 samples/s/p 3:32:31 } +2024-07-25 21:37:50,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1084/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 1.9659641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:50,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43303 samples/s/p 3:32:40 } +2024-07-25 21:37:53,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1086/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 1.9653671e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:53,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43460 samples/s/p 3:32:33 } +2024-07-25 21:37:56,119 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1088/ 1625], loss: 0.941, per_step_time: 1471ms, lr: 1.9647705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:56,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43544 samples/s/p 3:32:28 } +2024-07-25 21:37:59,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1090/ 1625], loss: 1.373, per_step_time: 1472ms, lr: 1.9641735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:59,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43285 samples/s/p 3:32:32 } +2024-07-25 21:38:02,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1092/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 1.9635765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:02,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43915 samples/s/p 3:32:14 } +2024-07-25 21:38:04,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1094/ 1625], loss: 0.972, per_step_time: 1471ms, lr: 1.9629793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:04,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43815 samples/s/p 3:32:13 } +2024-07-25 21:38:07,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1096/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 1.9623822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:07,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43435 samples/s/p 3:32:19 } +2024-07-25 21:38:10,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1098/ 1625], loss: 1.292, 
per_step_time: 1472ms, lr: 1.961785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:10,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43396 samples/s/p 3:32:17 } +2024-07-25 21:38:13,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1100/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 1.9611876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:13,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.42980 samples/s/p 3:32:24 } +2024-07-25 21:38:16,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1102/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 1.9605903e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:16,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43455 samples/s/p 3:32:10 } +2024-07-25 21:38:19,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1104/ 1625], loss: 0.958, per_step_time: 1471ms, lr: 1.9599927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:19,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43801 samples/s/p 3:31:59 } +2024-07-25 21:38:22,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1106/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 1.9593952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:22,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43275 samples/s/p 3:32:08 } +2024-07-25 21:38:25,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1108/ 1625], loss: 1.193, per_step_time: 1469ms, lr: 1.9587973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:25,624 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.44402 samples/s/p 3:31:39 } +2024-07-25 21:38:28,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1110/ 1625], loss: 0.976, per_step_time: 1471ms, lr: 1.9581998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:28,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43558 samples/s/p 3:31:56 } +2024-07-25 21:38:31,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1112/ 1625], loss: 1.302, per_step_time: 1473ms, lr: 1.9576019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:31,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43018 samples/s/p 3:32:05 } +2024-07-25 21:38:34,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1114/ 1625], loss: 1.304, per_step_time: 1473ms, lr: 1.957004e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:34,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.42820 samples/s/p 3:32:07 } +2024-07-25 21:38:37,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1116/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.956406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:37,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43685 samples/s/p 3:31:44 } +2024-07-25 21:38:40,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1118/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 1.955808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:40,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43597 samples/s/p 
3:31:43 } +2024-07-25 21:38:43,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1120/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 1.95521e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:43,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43036 samples/s/p 3:31:53 } +2024-07-25 21:38:46,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1122/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 1.954612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:46,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43580 samples/s/p 3:31:38 } +2024-07-25 21:38:49,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1124/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 1.9540135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:49,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43130 samples/s/p 3:31:45 } +2024-07-25 21:38:52,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1126/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 1.9534153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:52,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.42968 samples/s/p 3:31:46 } +2024-07-25 21:38:55,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1128/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 1.9528168e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:55,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43113 samples/s/p 3:31:40 } +2024-07-25 21:38:58,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], 
step:[ 1130/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 1.9522184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:58,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43950 samples/s/p 3:31:17 } +2024-07-25 21:39:01,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1132/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 1.95162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:01,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43503 samples/s/p 3:31:25 } +2024-07-25 21:39:03,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1134/ 1625], loss: 1.303, per_step_time: 1471ms, lr: 1.9510213e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:03,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43840 samples/s/p 3:31:14 } +2024-07-25 21:39:06,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1136/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 1.9504225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:06,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43630 samples/s/p 3:31:16 } +2024-07-25 21:39:09,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1138/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.9498239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:09,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43485 samples/s/p 3:31:16 } +2024-07-25 21:39:12,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1140/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 1.949225e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:39:12,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43680 samples/s/p 3:31:09 } +2024-07-25 21:39:15,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1142/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 1.948626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:15,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43696 samples/s/p 3:31:05 } +2024-07-25 21:39:18,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1144/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 1.948027e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:18,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43271 samples/s/p 3:31:12 } +2024-07-25 21:39:21,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1146/ 1625], loss: 1.294, per_step_time: 1471ms, lr: 1.947428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:21,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43691 samples/s/p 3:31:00 } +2024-07-25 21:39:24,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1148/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 1.9468289e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:24,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.42939 samples/s/p 3:31:14 } +2024-07-25 21:39:27,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1150/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 1.9462297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:27,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ 
| 5.43460 samples/s/p 3:30:59 } +2024-07-25 21:39:30,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1152/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.9456304e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:30,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43526 samples/s/p 3:30:55 } +2024-07-25 21:39:33,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1154/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 1.9450312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:33,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43680 samples/s/p 3:30:48 } +2024-07-25 21:39:36,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1156/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 1.9444315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:36,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43627 samples/s/p 3:30:46 } +2024-07-25 21:39:39,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1158/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.9438321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:39,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43675 samples/s/p 3:30:42 } +2024-07-25 21:39:42,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1160/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 1.9432326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:42,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.44001 samples/s/p 3:30:32 } +2024-07-25 21:39:45,299 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 5/ 10], step:[ 1162/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 1.942633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:45,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.44119 samples/s/p 3:30:26 } +2024-07-25 21:39:48,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1164/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 1.942033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:48,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43238 samples/s/p 3:30:44 } +2024-07-25 21:39:51,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1166/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.9414336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:51,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43651 samples/s/p 3:30:31 } +2024-07-25 21:39:54,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1168/ 1625], loss: 1.320, per_step_time: 1470ms, lr: 1.9408335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:54,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43981 samples/s/p 3:30:21 } +2024-07-25 21:39:57,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1170/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.9402336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:57,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43382 samples/s/p 3:30:31 } +2024-07-25 21:40:00,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1172/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.9396337e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:40:00,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43123 samples/s/p 3:30:35 } +2024-07-25 21:40:03,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1174/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 1.9390336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:03,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43038 samples/s/p 3:30:34 } +2024-07-25 21:40:05,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1176/ 1625], loss: 1.285, per_step_time: 1471ms, lr: 1.9384335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:05,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43715 samples/s/p 3:30:15 } +2024-07-25 21:40:08,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1178/ 1625], loss: 1.039, per_step_time: 1474ms, lr: 1.9378333e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:08,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.42569 samples/s/p 3:30:39 } +2024-07-25 21:40:11,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1180/ 1625], loss: 1.450, per_step_time: 1472ms, lr: 1.9372328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:11,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43455 samples/s/p 3:30:15 } +2024-07-25 21:40:14,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1182/ 1625], loss: 1.337, per_step_time: 1471ms, lr: 1.9366327e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:14,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% 
|███████████████████████ | 5.43829 samples/s/p 3:30:03 } +2024-07-25 21:40:17,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1184/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 1.9360323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:17,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43458 samples/s/p 3:30:09 } +2024-07-25 21:40:20,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1186/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 1.9354316e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:20,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43816 samples/s/p 3:29:58 } +2024-07-25 21:40:23,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1188/ 1625], loss: 1.164, per_step_time: 1469ms, lr: 1.934831e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:23,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.44549 samples/s/p 3:29:38 } +2024-07-25 21:40:26,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1190/ 1625], loss: 1.341, per_step_time: 1472ms, lr: 1.9342304e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:26,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43421 samples/s/p 3:30:01 } +2024-07-25 21:40:29,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1192/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.9336298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:29,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43726 samples/s/p 3:29:51 } +2024-07-25 21:40:32,514 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1194/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 1.933029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:32,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43340 samples/s/p 3:29:57 } +2024-07-25 21:40:35,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1196/ 1625], loss: 1.097, per_step_time: 1473ms, lr: 1.9324281e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:35,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43102 samples/s/p 3:30:00 } +2024-07-25 21:40:38,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1198/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 1.9318273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:38,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43280 samples/s/p 3:29:53 } +2024-07-25 21:40:41,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1200/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 1.9312261e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:41,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43377 samples/s/p 3:29:47 } +2024-07-25 21:40:44,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1202/ 1625], loss: 1.060, per_step_time: 1470ms, lr: 1.930625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:44,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43876 samples/s/p 3:29:33 } +2024-07-25 21:40:47,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1204/ 1625], loss: 1.120, 
per_step_time: 1473ms, lr: 1.930024e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:47,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43073 samples/s/p 3:29:49 } +2024-07-25 21:40:50,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1206/ 1625], loss: 1.134, per_step_time: 1470ms, lr: 1.9294228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:50,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.44142 samples/s/p 3:29:21 } +2024-07-25 21:40:53,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1208/ 1625], loss: 0.975, per_step_time: 1469ms, lr: 1.9288214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:53,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.44394 samples/s/p 3:29:12 } +2024-07-25 21:40:56,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1210/ 1625], loss: 1.076, per_step_time: 1472ms, lr: 1.92822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:56,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43468 samples/s/p 3:29:31 } +2024-07-25 21:40:59,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1212/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 1.9276187e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:59,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.44146 samples/s/p 3:29:12 } +2024-07-25 21:41:02,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1214/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 1.9270172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:02,018 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43389 samples/s/p 3:29:27 } +2024-07-25 21:41:04,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1216/ 1625], loss: 1.033, per_step_time: 1472ms, lr: 1.9264156e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:04,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43391 samples/s/p 3:29:24 } +2024-07-25 21:41:07,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1218/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 1.925814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:07,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43468 samples/s/p 3:29:19 } +2024-07-25 21:41:10,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1220/ 1625], loss: 1.007, per_step_time: 1473ms, lr: 1.9252126e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:10,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.42938 samples/s/p 3:29:28 } +2024-07-25 21:41:13,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1222/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.9246108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:13,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43620 samples/s/p 3:29:09 } +2024-07-25 21:41:16,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1224/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 1.9240086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:16,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43862 samples/s/p 
3:29:01 } +2024-07-25 21:41:19,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1226/ 1625], loss: 1.275, per_step_time: 1469ms, lr: 1.9234069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:19,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.44257 samples/s/p 3:28:49 } +2024-07-25 21:41:22,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1228/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 1.922805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:22,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43579 samples/s/p 3:29:02 } +2024-07-25 21:41:25,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1230/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 1.9222029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:25,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.44085 samples/s/p 3:28:47 } +2024-07-25 21:41:28,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1232/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.9216008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:28,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43787 samples/s/p 3:28:51 } +2024-07-25 21:41:31,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1234/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 1.9209985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:31,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43561 samples/s/p 3:28:53 } +2024-07-25 21:41:34,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], 
step:[ 1236/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 1.9203962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:34,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43599 samples/s/p 3:28:49 } +2024-07-25 21:41:37,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1238/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.919794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:37,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43757 samples/s/p 3:28:43 } +2024-07-25 21:41:40,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1240/ 1625], loss: 1.318, per_step_time: 1472ms, lr: 1.9191915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:40,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43434 samples/s/p 3:28:47 } +2024-07-25 21:41:43,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1242/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 1.918589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:43,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43430 samples/s/p 3:28:44 } +2024-07-25 21:41:46,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1244/ 1625], loss: 1.031, per_step_time: 1470ms, lr: 1.9179866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:46,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.44127 samples/s/p 3:28:25 } +2024-07-25 21:41:49,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1246/ 1625], loss: 1.304, per_step_time: 1472ms, lr: 1.917384e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:41:49,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43464 samples/s/p 3:28:38 } +2024-07-25 21:41:52,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1248/ 1625], loss: 1.049, per_step_time: 1473ms, lr: 1.9167815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:52,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43102 samples/s/p 3:28:43 } +2024-07-25 21:41:55,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1250/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 1.9161786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:55,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43890 samples/s/p 3:28:22 } +2024-07-25 21:41:58,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1252/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 1.915576e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:58,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43108 samples/s/p 3:28:37 } +2024-07-25 21:42:01,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1254/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 1.914973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:01,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43696 samples/s/p 3:28:21 } +2024-07-25 21:42:03,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1256/ 1625], loss: 1.296, per_step_time: 1472ms, lr: 1.9143701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:03,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ 
| 5.43130 samples/s/p 3:28:31 } +2024-07-25 21:42:06,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1258/ 1625], loss: 0.967, per_step_time: 1471ms, lr: 1.913767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:06,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43758 samples/s/p 3:28:13 } +2024-07-25 21:42:09,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1260/ 1625], loss: 1.028, per_step_time: 1469ms, lr: 1.9131641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:09,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.44222 samples/s/p 3:28:00 } +2024-07-25 21:42:12,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1262/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 1.9125608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:12,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43953 samples/s/p 3:28:03 } +2024-07-25 21:42:15,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1264/ 1625], loss: 1.270, per_step_time: 1473ms, lr: 1.9119578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:15,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43029 samples/s/p 3:28:21 } +2024-07-25 21:42:18,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1266/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 1.9113546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:18,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43539 samples/s/p 3:28:07 } +2024-07-25 21:42:21,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 5/ 10], step:[ 1268/ 1625], loss: 0.899, per_step_time: 1470ms, lr: 1.910751e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:21,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43997 samples/s/p 3:27:53 } +2024-07-25 21:42:24,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1270/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 1.9101477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:24,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43495 samples/s/p 3:28:02 } +2024-07-25 21:42:27,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1272/ 1625], loss: 1.277, per_step_time: 1471ms, lr: 1.9095443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:27,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43719 samples/s/p 3:27:54 } +2024-07-25 21:42:30,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1274/ 1625], loss: 1.303, per_step_time: 1472ms, lr: 1.9089408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:30,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43276 samples/s/p 3:28:01 } +2024-07-25 21:42:33,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1276/ 1625], loss: 1.111, per_step_time: 1471ms, lr: 1.908337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:33,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.43667 samples/s/p 3:27:49 } +2024-07-25 21:42:36,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1278/ 1625], loss: 1.248, per_step_time: 1473ms, lr: 1.9077335e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:42:36,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.42923 samples/s/p 3:28:03 } +2024-07-25 21:42:39,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1280/ 1625], loss: 0.998, per_step_time: 1473ms, lr: 1.9071298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:39,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.42965 samples/s/p 3:27:59 } +2024-07-25 21:42:42,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1282/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.9065259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:42,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.43660 samples/s/p 3:27:40 } +2024-07-25 21:42:45,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1284/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 1.9059222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:45,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.43600 samples/s/p 3:27:39 } +2024-07-25 21:42:48,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1286/ 1625], loss: 1.057, per_step_time: 1470ms, lr: 1.9053183e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:48,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.44158 samples/s/p 3:27:23 } +2024-07-25 21:42:51,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1288/ 1625], loss: 0.966, per_step_time: 1471ms, lr: 1.9047144e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:51,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% 
|███████████████████████ | 5.43739 samples/s/p 3:27:30 } +2024-07-25 21:42:54,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1290/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.9041101e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:54,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.43773 samples/s/p 3:27:26 } +2024-07-25 21:42:57,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1292/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.9035058e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:57,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.43627 samples/s/p 3:27:26 } +2024-07-25 21:43:00,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1294/ 1625], loss: 1.284, per_step_time: 1474ms, lr: 1.902902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:00,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.42638 samples/s/p 3:27:46 } +2024-07-25 21:43:02,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1296/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 1.9022977e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:02,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.43954 samples/s/p 3:27:13 } +2024-07-25 21:43:05,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1298/ 1625], loss: 0.944, per_step_time: 1471ms, lr: 1.9016934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:05,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.43687 samples/s/p 3:27:16 } +2024-07-25 21:43:08,887 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1300/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.901089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:08,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.43423 samples/s/p 3:27:19 } +2024-07-25 21:43:11,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1302/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 1.9004845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:11,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.42917 samples/s/p 3:27:28 } +2024-07-25 21:43:14,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1304/ 1625], loss: 1.236, per_step_time: 1473ms, lr: 1.8998799e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:14,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.43099 samples/s/p 3:27:21 } +2024-07-25 21:43:17,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1306/ 1625], loss: 1.195, per_step_time: 1470ms, lr: 1.8992752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:17,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.44136 samples/s/p 3:26:54 } +2024-07-25 21:43:20,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1308/ 1625], loss: 1.009, per_step_time: 1472ms, lr: 1.8986706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:20,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.43348 samples/s/p 3:27:09 } +2024-07-25 21:43:23,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1310/ 1625], loss: 1.085, 
per_step_time: 1473ms, lr: 1.8980661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:23,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.42823 samples/s/p 3:27:18 } +2024-07-25 21:43:26,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1312/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 1.8974612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:26,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.43805 samples/s/p 3:26:53 } +2024-07-25 21:43:29,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1314/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 1.8968563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:29,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.43583 samples/s/p 3:26:55 } +2024-07-25 21:43:32,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1316/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 1.8962515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:32,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.42853 samples/s/p 3:27:09 } +2024-07-25 21:43:35,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1318/ 1625], loss: 1.258, per_step_time: 1471ms, lr: 1.8956465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:35,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.43641 samples/s/p 3:26:48 } +2024-07-25 21:43:38,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1320/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 1.8950414e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:38,407 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.43043 samples/s/p 3:26:58 } +2024-07-25 21:43:41,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1322/ 1625], loss: 1.007, per_step_time: 1472ms, lr: 1.8944364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:41,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.43284 samples/s/p 3:26:50 } +2024-07-25 21:43:44,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1324/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 1.8938314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:44,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.42923 samples/s/p 3:26:55 } +2024-07-25 21:43:47,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1326/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 1.8932262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:47,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.42966 samples/s/p 3:26:51 } +2024-07-25 21:43:50,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1328/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 1.8926208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:50,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.43194 samples/s/p 3:26:43 } +2024-07-25 21:43:53,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1330/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 1.8920155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:53,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.44130 
samples/s/p 3:26:19 } +2024-07-25 21:43:56,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1332/ 1625], loss: 1.164, per_step_time: 1474ms, lr: 1.8914103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:56,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.42679 samples/s/p 3:26:49 } +2024-07-25 21:43:59,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1334/ 1625], loss: 1.034, per_step_time: 1470ms, lr: 1.8908046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:59,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.44073 samples/s/p 3:26:14 } +2024-07-25 21:44:02,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1336/ 1625], loss: 0.987, per_step_time: 1470ms, lr: 1.890199e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:02,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.43918 samples/s/p 3:26:15 } +2024-07-25 21:44:04,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1338/ 1625], loss: 1.290, per_step_time: 1472ms, lr: 1.8895937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:04,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.43346 samples/s/p 3:26:25 } +2024-07-25 21:44:07,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1340/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.888988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:07,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.43201 samples/s/p 3:26:25 } +2024-07-25 21:44:10,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 5/ 10], step:[ 1342/ 1625], loss: 1.301, per_step_time: 1471ms, lr: 1.888382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:10,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43824 samples/s/p 3:26:08 } +2024-07-25 21:44:13,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1344/ 1625], loss: 1.011, per_step_time: 1472ms, lr: 1.8877763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:13,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43350 samples/s/p 3:26:16 } +2024-07-25 21:44:16,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1346/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 1.8871706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:16,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43299 samples/s/p 3:26:14 } +2024-07-25 21:44:19,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1348/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 1.8865647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:19,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43088 samples/s/p 3:26:16 } +2024-07-25 21:44:22,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1350/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 1.8859586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:22,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43649 samples/s/p 3:26:00 } +2024-07-25 21:44:25,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1352/ 1625], loss: 1.028, per_step_time: 1474ms, lr: 1.8853527e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:44:25,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.42690 samples/s/p 3:26:19 } +2024-07-25 21:44:28,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1354/ 1625], loss: 0.906, per_step_time: 1472ms, lr: 1.8847466e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:28,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43397 samples/s/p 3:26:00 } +2024-07-25 21:44:31,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1356/ 1625], loss: 1.156, per_step_time: 1473ms, lr: 1.8841405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:31,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.42968 samples/s/p 3:26:07 } +2024-07-25 21:44:34,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1358/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 1.883534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:34,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.43297 samples/s/p 3:25:57 } +2024-07-25 21:44:37,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1360/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 1.882928e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:37,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.43450 samples/s/p 3:25:50 } +2024-07-25 21:44:40,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1362/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 1.8823217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:40,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% 
|████████████████████████ | 5.43521 samples/s/p 3:25:46 } +2024-07-25 21:44:43,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1364/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 1.8817153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:43,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.43549 samples/s/p 3:25:42 } +2024-07-25 21:44:46,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1366/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 1.8811088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:46,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.42868 samples/s/p 3:25:55 } +2024-07-25 21:44:49,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1368/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 1.8805022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:49,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.43445 samples/s/p 3:25:39 } +2024-07-25 21:44:52,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1370/ 1625], loss: 1.189, per_step_time: 1470ms, lr: 1.8798957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:52,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.43872 samples/s/p 3:25:26 } +2024-07-25 21:44:55,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1372/ 1625], loss: 1.286, per_step_time: 1469ms, lr: 1.8792889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:55,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.44295 samples/s/p 3:25:13 } +2024-07-25 21:44:58,096 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1374/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.8786823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:58,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43605 samples/s/p 3:25:26 } +2024-07-25 21:45:01,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1376/ 1625], loss: 1.055, per_step_time: 1473ms, lr: 1.8780756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:01,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43078 samples/s/p 3:25:35 } +2024-07-25 21:45:03,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1378/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 1.8774688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:03,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43831 samples/s/p 3:25:15 } +2024-07-25 21:45:06,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1380/ 1625], loss: 1.317, per_step_time: 1471ms, lr: 1.8768616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:06,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43661 samples/s/p 3:25:16 } +2024-07-25 21:45:09,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1382/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 1.876255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:09,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43352 samples/s/p 3:25:20 } +2024-07-25 21:45:12,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1384/ 1625], loss: 1.066, 
per_step_time: 1471ms, lr: 1.875648e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:12,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43814 samples/s/p 3:25:07 } +2024-07-25 21:45:15,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1386/ 1625], loss: 1.354, per_step_time: 1472ms, lr: 1.8750408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:15,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43282 samples/s/p 3:25:16 } +2024-07-25 21:45:18,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1388/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 1.8744337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:18,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43274 samples/s/p 3:25:13 } +2024-07-25 21:45:21,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1390/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 1.8738265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:21,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43325 samples/s/p 3:25:09 } +2024-07-25 21:45:24,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1392/ 1625], loss: 1.255, per_step_time: 1472ms, lr: 1.8732191e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:24,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43310 samples/s/p 3:25:06 } +2024-07-25 21:45:27,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1394/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.872612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:27,608 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43823 samples/s/p 3:24:52 } +2024-07-25 21:45:30,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1396/ 1625], loss: 1.383, per_step_time: 1472ms, lr: 1.8720046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:30,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43173 samples/s/p 3:25:04 } +2024-07-25 21:45:33,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1398/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.8713974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:33,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43241 samples/s/p 3:24:59 } +2024-07-25 21:45:36,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1400/ 1625], loss: 1.313, per_step_time: 1473ms, lr: 1.8707897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:36,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43084 samples/s/p 3:25:00 } +2024-07-25 21:45:39,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1402/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.870182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:39,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43421 samples/s/p 3:24:49 } +2024-07-25 21:45:42,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1404/ 1625], loss: 0.955, per_step_time: 1470ms, lr: 1.8695746e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:42,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.44076 
samples/s/p 3:24:31 } +2024-07-25 21:45:45,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1406/ 1625], loss: 1.150, per_step_time: 1473ms, lr: 1.8689669e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:45,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.42951 samples/s/p 3:24:54 } +2024-07-25 21:45:48,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1408/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 1.8683593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:48,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43334 samples/s/p 3:24:42 } +2024-07-25 21:45:51,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1410/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 1.8677512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:51,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43923 samples/s/p 3:24:26 } +2024-07-25 21:45:54,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1412/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 1.8671435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:54,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43381 samples/s/p 3:24:35 } +2024-07-25 21:45:57,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1414/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 1.8665356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:57,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43239 samples/s/p 3:24:35 } +2024-07-25 21:46:00,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 5/ 10], step:[ 1416/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 1.8659277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:00,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43681 samples/s/p 3:24:23 } +2024-07-25 21:46:03,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1418/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 1.8653196e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:03,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43029 samples/s/p 3:24:34 } +2024-07-25 21:46:05,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1420/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.8647115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:05,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43731 samples/s/p 3:24:16 } +2024-07-25 21:46:08,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1422/ 1625], loss: 1.319, per_step_time: 1473ms, lr: 1.8641036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:08,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43088 samples/s/p 3:24:27 } +2024-07-25 21:46:11,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1424/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.8634952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:11,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43794 samples/s/p 3:24:08 } +2024-07-25 21:46:14,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1426/ 1625], loss: 0.986, per_step_time: 1473ms, lr: 1.862887e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:46:14,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.42822 samples/s/p 3:24:27 } +2024-07-25 21:46:17,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1428/ 1625], loss: 1.176, per_step_time: 1474ms, lr: 1.8622788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:17,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.42645 samples/s/p 3:24:28 } +2024-07-25 21:46:20,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1430/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 1.8616704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:20,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43189 samples/s/p 3:24:13 } +2024-07-25 21:46:23,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1432/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 1.861062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:23,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43485 samples/s/p 3:24:03 } +2024-07-25 21:46:26,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1434/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 1.8604534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:26,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43517 samples/s/p 3:24:00 } +2024-07-25 21:46:29,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1436/ 1625], loss: 0.952, per_step_time: 1473ms, lr: 1.859845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:29,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% 
|████████████████████████ | 5.43058 samples/s/p 3:24:07 } +2024-07-25 21:46:32,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1438/ 1625], loss: 1.084, per_step_time: 1473ms, lr: 1.8592364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:32,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43064 samples/s/p 3:24:04 } +2024-07-25 21:46:35,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1440/ 1625], loss: 1.313, per_step_time: 1472ms, lr: 1.8586277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:35,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43306 samples/s/p 3:23:56 } +2024-07-25 21:46:38,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1442/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 1.858019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:38,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43671 samples/s/p 3:23:45 } +2024-07-25 21:46:41,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1444/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.8574103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:41,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43350 samples/s/p 3:23:49 } +2024-07-25 21:46:44,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1446/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 1.8568015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:44,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.44081 samples/s/p 3:23:29 } +2024-07-25 21:46:47,299 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1448/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 1.8561926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:47,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.44008 samples/s/p 3:23:28 } +2024-07-25 21:46:50,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1450/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 1.8555837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:50,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43441 samples/s/p 3:23:38 } +2024-07-25 21:46:53,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1452/ 1625], loss: 1.312, per_step_time: 1472ms, lr: 1.8549747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:53,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43473 samples/s/p 3:23:34 } +2024-07-25 21:46:56,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1454/ 1625], loss: 1.153, per_step_time: 1470ms, lr: 1.8543657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:56,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43899 samples/s/p 3:23:22 } +2024-07-25 21:46:59,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1456/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.8537567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:59,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43350 samples/s/p 3:23:31 } +2024-07-25 21:47:02,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1458/ 1625], loss: 1.175, 
per_step_time: 1472ms, lr: 1.8531473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:02,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43396 samples/s/p 3:23:27 } +2024-07-25 21:47:05,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1460/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 1.8525381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:05,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43832 samples/s/p 3:23:14 } +2024-07-25 21:47:07,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1462/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.8519288e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:07,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43714 samples/s/p 3:23:14 } +2024-07-25 21:47:10,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1464/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 1.8513196e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:10,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43668 samples/s/p 3:23:12 } +2024-07-25 21:47:13,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1466/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 1.8507104e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:13,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43685 samples/s/p 3:23:09 } +2024-07-25 21:47:16,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1468/ 1625], loss: 1.024, per_step_time: 1469ms, lr: 1.8501007e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:16,798 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.44429 samples/s/p 3:22:49 } +2024-07-25 21:47:19,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1470/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 1.8494913e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:19,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43727 samples/s/p 3:23:02 } +2024-07-25 21:47:22,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1472/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 1.8488818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:22,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.43179 samples/s/p 3:23:11 } +2024-07-25 21:47:25,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1474/ 1625], loss: 1.323, per_step_time: 1469ms, lr: 1.848272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:25,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.44321 samples/s/p 3:22:43 } +2024-07-25 21:47:28,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1476/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 1.8476625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:28,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.43310 samples/s/p 3:23:03 } +2024-07-25 21:47:31,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1478/ 1625], loss: 1.269, per_step_time: 1473ms, lr: 1.8470528e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:31,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.42960 
samples/s/p 3:23:07 } +2024-07-25 21:47:34,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1480/ 1625], loss: 1.130, per_step_time: 1473ms, lr: 1.846443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:34,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.43091 samples/s/p 3:23:02 } +2024-07-25 21:47:37,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1482/ 1625], loss: 1.064, per_step_time: 1470ms, lr: 1.8458331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:37,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.44150 samples/s/p 3:22:35 } +2024-07-25 21:47:40,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1484/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 1.8452232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:40,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.43664 samples/s/p 3:22:43 } +2024-07-25 21:47:43,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1486/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 1.8446133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:43,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.43115 samples/s/p 3:22:52 } +2024-07-25 21:47:46,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1488/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 1.8440034e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:46,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43701 samples/s/p 3:22:36 } +2024-07-25 21:47:49,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 5/ 10], step:[ 1490/ 1625], loss: 1.207, per_step_time: 1474ms, lr: 1.8433933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:49,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.42699 samples/s/p 3:22:56 } +2024-07-25 21:47:52,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1492/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 1.8427832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:52,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43834 samples/s/p 3:22:27 } +2024-07-25 21:47:55,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1494/ 1625], loss: 1.010, per_step_time: 1471ms, lr: 1.8421732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:55,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43648 samples/s/p 3:22:29 } +2024-07-25 21:47:58,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1496/ 1625], loss: 1.187, per_step_time: 1470ms, lr: 1.841563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:58,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43885 samples/s/p 3:22:20 } +2024-07-25 21:48:01,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1498/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.8409528e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:01,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43691 samples/s/p 3:22:22 } +2024-07-25 21:48:04,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1500/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 1.8403425e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:48:04,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43464 samples/s/p 3:22:24 } +2024-07-25 21:48:06,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1502/ 1625], loss: 0.982, per_step_time: 1472ms, lr: 1.839732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:06,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43452 samples/s/p 3:22:21 } +2024-07-25 21:48:09,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1504/ 1625], loss: 1.385, per_step_time: 1473ms, lr: 1.8391216e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:09,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.43060 samples/s/p 3:22:27 } +2024-07-25 21:48:12,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1506/ 1625], loss: 1.153, per_step_time: 1470ms, lr: 1.8385112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:12,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.44107 samples/s/p 3:22:01 } +2024-07-25 21:48:15,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1508/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 1.8379005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:15,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.43695 samples/s/p 3:22:07 } +2024-07-25 21:48:18,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1510/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 1.8372903e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:18,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% 
|████████████████████████ | 5.43870 samples/s/p 3:22:00 } +2024-07-25 21:48:21,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1512/ 1625], loss: 1.319, per_step_time: 1472ms, lr: 1.8366794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:21,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.43383 samples/s/p 3:22:08 } +2024-07-25 21:48:24,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1514/ 1625], loss: 1.263, per_step_time: 1473ms, lr: 1.8360686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:24,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.42973 samples/s/p 3:22:14 } +2024-07-25 21:48:27,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1516/ 1625], loss: 1.070, per_step_time: 1470ms, lr: 1.8354582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:27,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.44149 samples/s/p 3:21:45 } +2024-07-25 21:48:30,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1518/ 1625], loss: 1.164, per_step_time: 1472ms, lr: 1.8348474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:30,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.43253 samples/s/p 3:22:02 } +2024-07-25 21:48:33,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1520/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.8342364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:33,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43764 samples/s/p 3:21:48 } +2024-07-25 21:48:36,466 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1522/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 1.8336255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:36,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43613 samples/s/p 3:21:48 } +2024-07-25 21:48:39,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1524/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 1.8330145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:39,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43513 samples/s/p 3:21:47 } +2024-07-25 21:48:42,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1526/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.8324039e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:42,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43718 samples/s/p 3:21:40 } +2024-07-25 21:48:45,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1528/ 1625], loss: 1.280, per_step_time: 1472ms, lr: 1.8317924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:45,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43445 samples/s/p 3:21:43 } +2024-07-25 21:48:48,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1530/ 1625], loss: 1.245, per_step_time: 1471ms, lr: 1.8311814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:48,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43556 samples/s/p 3:21:38 } +2024-07-25 21:48:51,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1532/ 1625], loss: 1.274, 
per_step_time: 1471ms, lr: 1.8305704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:51,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43746 samples/s/p 3:21:30 } +2024-07-25 21:48:54,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1534/ 1625], loss: 0.995, per_step_time: 1470ms, lr: 1.8299592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:54,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.44181 samples/s/p 3:21:18 } +2024-07-25 21:48:57,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1536/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 1.8293478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:57,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43813 samples/s/p 3:21:23 } +2024-07-25 21:49:00,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1538/ 1625], loss: 1.015, per_step_time: 1471ms, lr: 1.8287366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:00,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43707 samples/s/p 3:21:22 } +2024-07-25 21:49:03,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1540/ 1625], loss: 1.409, per_step_time: 1472ms, lr: 1.8281251e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:03,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43118 samples/s/p 3:21:33 } +2024-07-25 21:49:05,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1542/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 1.8275137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:05,969 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43495 samples/s/p 3:21:21 } +2024-07-25 21:49:08,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1544/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.8269022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:08,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43420 samples/s/p 3:21:20 } +2024-07-25 21:49:11,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1546/ 1625], loss: 1.053, per_step_time: 1472ms, lr: 1.8262908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:11,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43435 samples/s/p 3:21:17 } +2024-07-25 21:49:14,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1548/ 1625], loss: 1.337, per_step_time: 1472ms, lr: 1.8256795e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:14,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43135 samples/s/p 3:21:20 } +2024-07-25 21:49:17,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1550/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 1.8250676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:17,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43325 samples/s/p 3:21:13 } +2024-07-25 21:49:20,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1552/ 1625], loss: 0.950, per_step_time: 1470ms, lr: 1.824456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:20,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.44109 
samples/s/p 3:20:53 } +2024-07-25 21:49:23,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1554/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 1.8238445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:23,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43459 samples/s/p 3:21:04 } +2024-07-25 21:49:26,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1556/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 1.8232326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:26,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43433 samples/s/p 3:21:02 } +2024-07-25 21:49:29,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1558/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.8226207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:29,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43224 samples/s/p 3:21:04 } +2024-07-25 21:49:32,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1560/ 1625], loss: 1.035, per_step_time: 1471ms, lr: 1.822009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:32,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43763 samples/s/p 3:20:49 } +2024-07-25 21:49:35,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1562/ 1625], loss: 0.939, per_step_time: 1471ms, lr: 1.8213968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:35,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43564 samples/s/p 3:20:50 } +2024-07-25 21:49:38,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 5/ 10], step:[ 1564/ 1625], loss: 1.295, per_step_time: 1473ms, lr: 1.820785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:38,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.42812 samples/s/p 3:21:04 } +2024-07-25 21:49:41,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1566/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 1.8201728e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:41,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43421 samples/s/p 3:20:48 } +2024-07-25 21:49:44,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1568/ 1625], loss: 1.305, per_step_time: 1469ms, lr: 1.8195607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:44,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.44228 samples/s/p 3:20:27 } +2024-07-25 21:49:47,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1570/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 1.8189487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:47,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43649 samples/s/p 3:20:37 } +2024-07-25 21:49:50,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1572/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 1.8183366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:50,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43191 samples/s/p 3:20:44 } +2024-07-25 21:49:53,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1574/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.8177245e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:49:53,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43348 samples/s/p 3:20:37 } +2024-07-25 21:49:56,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1576/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 1.8171122e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:56,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43393 samples/s/p 3:20:34 } +2024-07-25 21:49:59,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1578/ 1625], loss: 0.957, per_step_time: 1471ms, lr: 1.8165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:59,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43778 samples/s/p 3:20:22 } +2024-07-25 21:50:02,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1580/ 1625], loss: 1.067, per_step_time: 1471ms, lr: 1.8158873e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:02,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43845 samples/s/p 3:20:18 } +2024-07-25 21:50:04,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1582/ 1625], loss: 1.251, per_step_time: 1470ms, lr: 1.815275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:04,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.44014 samples/s/p 3:20:11 } +2024-07-25 21:50:07,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1584/ 1625], loss: 1.024, per_step_time: 1471ms, lr: 1.8146626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:07,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% 
|████████████████████████ | 5.43694 samples/s/p 3:20:15 } +2024-07-25 21:50:10,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1586/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 1.8140501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:10,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43932 samples/s/p 3:20:07 } +2024-07-25 21:50:13,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1588/ 1625], loss: 1.242, per_step_time: 1473ms, lr: 1.8134375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:13,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43061 samples/s/p 3:20:23 } +2024-07-25 21:50:16,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1590/ 1625], loss: 1.226, per_step_time: 1469ms, lr: 1.8128248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:16,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.44286 samples/s/p 3:19:53 } +2024-07-25 21:50:19,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1592/ 1625], loss: 1.091, per_step_time: 1470ms, lr: 1.8122122e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:19,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43853 samples/s/p 3:20:00 } +2024-07-25 21:50:22,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1594/ 1625], loss: 1.348, per_step_time: 1472ms, lr: 1.8115996e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:22,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43352 samples/s/p 3:20:08 } +2024-07-25 21:50:25,636 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1596/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 1.8109868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:25,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43451 samples/s/p 3:20:03 } +2024-07-25 21:50:28,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1598/ 1625], loss: 1.319, per_step_time: 1471ms, lr: 1.8103741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:28,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43497 samples/s/p 3:19:59 } +2024-07-25 21:50:31,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1600/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 1.8097613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:31,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43114 samples/s/p 3:20:04 } +2024-07-25 21:50:34,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1602/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 1.8091481e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:34,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43378 samples/s/p 3:19:56 } +2024-07-25 21:50:37,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1604/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 1.8085353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:37,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43451 samples/s/p 3:19:51 } +2024-07-25 21:50:40,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1606/ 1625], loss: 1.076, 
per_step_time: 1471ms, lr: 1.8079225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:40,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43609 samples/s/p 3:19:45 } +2024-07-25 21:50:43,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1608/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.8073093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:43,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43533 samples/s/p 3:19:43 } +2024-07-25 21:50:46,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1610/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 1.8066961e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:46,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43786 samples/s/p 3:19:35 } +2024-07-25 21:50:49,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1612/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 1.8060831e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:49,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43592 samples/s/p 3:19:36 } +2024-07-25 21:50:52,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1614/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 1.8054698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:52,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43735 samples/s/p 3:19:30 } +2024-07-25 21:50:55,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1616/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.8048568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:55,144 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43347 samples/s/p 3:19:36 } +2024-07-25 21:50:58,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1618/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 1.8042434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:58,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.43387 samples/s/p 3:19:32 } +2024-07-25 21:51:01,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1620/ 1625], loss: 1.042, per_step_time: 1469ms, lr: 1.8036299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:01,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.44229 samples/s/p 3:19:10 } +2024-07-25 21:51:03,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1622/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 1.8030169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:03,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.43364 samples/s/p 3:19:26 } +2024-07-25 21:51:06,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1624/ 1625], loss: 0.980, per_step_time: 1470ms, lr: 1.8024031e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:06,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.44216 samples/s/p 3:19:05 } +2024-07-25 21:51:09,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 1.80179e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:09,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.43659 samples/s/p 
3:19:14 } +2024-07-25 21:51:12,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 3/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.8011764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:12,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.43627 samples/s/p 3:19:12 } +2024-07-25 21:51:15,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 5/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 1.8005629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:15,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.43261 samples/s/p 3:19:17 } +2024-07-25 21:51:18,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 7/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.7999491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:18,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.43744 samples/s/p 3:19:03 } +2024-07-25 21:51:21,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 9/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 1.7993356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:21,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43347 samples/s/p 3:19:09 } +2024-07-25 21:51:24,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 11/ 1625], loss: 1.096, per_step_time: 1470ms, lr: 1.7987217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:24,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.44216 samples/s/p 3:18:47 } +2024-07-25 21:51:27,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], 
step:[ 13/ 1625], loss: 1.056, per_step_time: 1475ms, lr: 1.798108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:27,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.42204 samples/s/p 3:19:28 } +2024-07-25 21:51:30,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 15/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 1.7974944e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:30,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43328 samples/s/p 3:19:01 } +2024-07-25 21:51:33,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 17/ 1625], loss: 0.984, per_step_time: 1471ms, lr: 1.7968803e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:33,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43832 samples/s/p 3:18:47 } +2024-07-25 21:51:36,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 19/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 1.7962668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:36,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43007 samples/s/p 3:19:02 } +2024-07-25 21:51:39,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 21/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 1.7956525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:39,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43836 samples/s/p 3:18:41 } +2024-07-25 21:51:42,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 23/ 1625], loss: 1.355, per_step_time: 1471ms, lr: 1.7950388e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:51:42,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43549 samples/s/p 3:18:44 } +2024-07-25 21:51:45,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 25/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 1.7944249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:45,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43727 samples/s/p 3:18:37 } +2024-07-25 21:51:48,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 27/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 1.7938106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:48,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43920 samples/s/p 3:18:30 } +2024-07-25 21:51:51,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 29/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 1.7931965e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:51,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43442 samples/s/p 3:18:38 } +2024-07-25 21:51:54,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 31/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 1.7925824e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:54,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43370 samples/s/p 3:18:36 } +2024-07-25 21:51:57,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 33/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.7919681e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:57,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% 
|█████████████████████████ | 5.43113 samples/s/p 3:18:39 } +2024-07-25 21:52:00,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 35/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 1.7913539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:00,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43220 samples/s/p 3:18:34 } +2024-07-25 21:52:03,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 37/ 1625], loss: 1.025, per_step_time: 1473ms, lr: 1.7907396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:03,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43075 samples/s/p 3:18:34 } +2024-07-25 21:52:05,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 39/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 1.7901253e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:05,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43440 samples/s/p 3:18:23 } +2024-07-25 21:52:08,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 41/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 1.789511e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:08,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.43421 samples/s/p 3:18:20 } +2024-07-25 21:52:11,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 43/ 1625], loss: 1.354, per_step_time: 1470ms, lr: 1.7888964e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:11,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.44199 samples/s/p 3:18:00 } +2024-07-25 21:52:14,812 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 45/ 1625], loss: 1.080, per_step_time: 1470ms, lr: 1.788282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:14,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.44007 samples/s/p 3:18:02 } +2024-07-25 21:52:17,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 47/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 1.7876677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:17,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.43251 samples/s/p 3:18:15 } +2024-07-25 21:52:20,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 49/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.787053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:20,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.43568 samples/s/p 3:18:05 } +2024-07-25 21:52:23,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 51/ 1625], loss: 1.256, per_step_time: 1474ms, lr: 1.7864384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:23,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.42596 samples/s/p 3:18:24 } +2024-07-25 21:52:26,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 53/ 1625], loss: 1.194, per_step_time: 1469ms, lr: 1.7858238e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:26,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.44577 samples/s/p 3:17:38 } +2024-07-25 21:52:29,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 55/ 1625], loss: 1.111, 
per_step_time: 1472ms, lr: 1.7852091e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:29,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.43390 samples/s/p 3:18:00 } +2024-07-25 21:52:32,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 57/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.7845947e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:32,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43626 samples/s/p 3:17:52 } +2024-07-25 21:52:35,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 59/ 1625], loss: 1.319, per_step_time: 1473ms, lr: 1.7839797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:35,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43101 samples/s/p 3:18:01 } +2024-07-25 21:52:38,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 61/ 1625], loss: 1.065, per_step_time: 1473ms, lr: 1.7833649e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:38,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.42857 samples/s/p 3:18:03 } +2024-07-25 21:52:41,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 63/ 1625], loss: 1.351, per_step_time: 1473ms, lr: 1.78275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:41,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43087 samples/s/p 3:17:55 } +2024-07-25 21:52:44,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 65/ 1625], loss: 1.109, per_step_time: 1470ms, lr: 1.7821352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:44,328 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43864 samples/s/p 3:17:35 } +2024-07-25 21:52:47,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 67/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 1.78152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:47,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43817 samples/s/p 3:17:33 } +2024-07-25 21:52:50,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 69/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 1.7809052e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:50,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43677 samples/s/p 3:17:34 } +2024-07-25 21:52:53,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 71/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 1.7802902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:53,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43852 samples/s/p 3:17:27 } +2024-07-25 21:52:56,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 73/ 1625], loss: 1.242, per_step_time: 1482ms, lr: 1.7796752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:56,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.39697 samples/s/p 3:18:55 } +2024-07-25 21:52:59,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 75/ 1625], loss: 0.993, per_step_time: 1470ms, lr: 1.77906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:59,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43943 samples/s/p 
3:17:19 } +2024-07-25 21:53:02,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 77/ 1625], loss: 0.873, per_step_time: 1470ms, lr: 1.7784449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:02,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.44181 samples/s/p 3:17:11 } +2024-07-25 21:53:04,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 79/ 1625], loss: 1.275, per_step_time: 1470ms, lr: 1.7778299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:04,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43935 samples/s/p 3:17:13 } +2024-07-25 21:53:07,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 81/ 1625], loss: 1.112, per_step_time: 1469ms, lr: 1.7772145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:07,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.44320 samples/s/p 3:17:02 } +2024-07-25 21:53:10,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 83/ 1625], loss: 1.101, per_step_time: 1470ms, lr: 1.7765991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:10,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43899 samples/s/p 3:17:08 } +2024-07-25 21:53:13,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 85/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 1.775984e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:13,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43407 samples/s/p 3:17:16 } +2024-07-25 21:53:16,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], 
step:[ 87/ 1625], loss: 1.158, per_step_time: 1469ms, lr: 1.7753686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:16,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.44298 samples/s/p 3:16:54 } +2024-07-25 21:53:19,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 89/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 1.774753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:19,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43362 samples/s/p 3:17:11 } +2024-07-25 21:53:22,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 91/ 1625], loss: 1.184, per_step_time: 1469ms, lr: 1.7741377e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:22,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.44254 samples/s/p 3:16:49 } +2024-07-25 21:53:25,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 93/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 1.7735223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:25,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43392 samples/s/p 3:17:04 } +2024-07-25 21:53:28,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 95/ 1625], loss: 1.079, per_step_time: 1472ms, lr: 1.7729066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:28,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43283 samples/s/p 3:17:04 } +2024-07-25 21:53:31,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 97/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.772291e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:53:31,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43116 samples/s/p 3:17:05 } +2024-07-25 21:53:34,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 99/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 1.7716755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:34,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43154 samples/s/p 3:17:01 } +2024-07-25 21:53:37,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 101/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.77106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:37,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43757 samples/s/p 3:16:45 } +2024-07-25 21:53:40,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 103/ 1625], loss: 1.210, per_step_time: 1471ms, lr: 1.7704442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:40,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43724 samples/s/p 3:16:43 } +2024-07-25 21:53:43,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 105/ 1625], loss: 1.068, per_step_time: 1472ms, lr: 1.7698285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:43,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43416 samples/s/p 3:16:46 } +2024-07-25 21:53:46,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 107/ 1625], loss: 1.169, per_step_time: 1469ms, lr: 1.7692128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:46,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% 
|█████████████████████████ | 5.44233 samples/s/p 3:16:26 } +2024-07-25 21:53:49,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 109/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 1.768597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:49,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43843 samples/s/p 3:16:31 } +2024-07-25 21:53:52,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 111/ 1625], loss: 1.244, per_step_time: 1471ms, lr: 1.767981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:52,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43490 samples/s/p 3:16:36 } +2024-07-25 21:53:55,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 113/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 1.7673652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:55,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43579 samples/s/p 3:16:31 } +2024-07-25 21:53:58,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 115/ 1625], loss: 1.137, per_step_time: 1473ms, lr: 1.7667493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:58,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.42934 samples/s/p 3:16:42 } +2024-07-25 21:54:01,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 117/ 1625], loss: 1.038, per_step_time: 1473ms, lr: 1.7661332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:01,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43062 samples/s/p 3:16:36 } +2024-07-25 21:54:03,999 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 119/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.7655173e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:04,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43446 samples/s/p 3:16:25 } +2024-07-25 21:54:06,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 121/ 1625], loss: 1.184, per_step_time: 1473ms, lr: 1.764901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:06,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.42991 samples/s/p 3:16:32 } +2024-07-25 21:54:09,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 123/ 1625], loss: 1.144, per_step_time: 1473ms, lr: 1.7642853e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:09,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43103 samples/s/p 3:16:27 } +2024-07-25 21:54:12,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 125/ 1625], loss: 1.249, per_step_time: 1473ms, lr: 1.763669e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:12,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43035 samples/s/p 3:16:25 } +2024-07-25 21:54:15,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 127/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 1.7630528e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:15,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43804 samples/s/p 3:16:06 } +2024-07-25 21:54:18,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 129/ 1625], loss: 1.178, 
per_step_time: 1472ms, lr: 1.7624367e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:18,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43156 samples/s/p 3:16:17 } +2024-07-25 21:54:21,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 131/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.7618206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:21,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43326 samples/s/p 3:16:10 } +2024-07-25 21:54:24,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 133/ 1625], loss: 1.187, per_step_time: 1473ms, lr: 1.761204e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:24,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.42884 samples/s/p 3:16:17 } +2024-07-25 21:54:27,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 135/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 1.7605877e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:27,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43410 samples/s/p 3:16:02 } +2024-07-25 21:54:30,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 137/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 1.7599716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:30,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43127 samples/s/p 3:16:05 } +2024-07-25 21:54:33,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 139/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.759355e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:33,522 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43756 samples/s/p 3:15:49 } +2024-07-25 21:54:36,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 141/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 1.7587385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:36,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43824 samples/s/p 3:15:44 } +2024-07-25 21:54:39,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 143/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.7581222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:39,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43609 samples/s/p 3:15:46 } +2024-07-25 21:54:42,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 145/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 1.7575056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:42,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43767 samples/s/p 3:15:40 } +2024-07-25 21:54:45,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 147/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 1.756889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:45,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43416 samples/s/p 3:15:44 } +2024-07-25 21:54:48,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 149/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 1.7562725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:48,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43646 
samples/s/p 3:15:37 } +2024-07-25 21:54:51,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 151/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 1.7556558e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:51,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43556 samples/s/p 3:15:36 } +2024-07-25 21:54:54,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 153/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 1.7550392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:54,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43772 samples/s/p 3:15:28 } +2024-07-25 21:54:57,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 155/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 1.7544224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:57,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43282 samples/s/p 3:15:36 } +2024-07-25 21:55:00,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 157/ 1625], loss: 1.088, per_step_time: 1476ms, lr: 1.7538056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:00,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.41690 samples/s/p 3:16:07 } +2024-07-25 21:55:03,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 159/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 1.753189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:03,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43757 samples/s/p 3:15:19 } +2024-07-25 21:55:05,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 6/ 10], step:[ 161/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.7525721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:05,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43252 samples/s/p 3:15:27 } +2024-07-25 21:55:08,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 163/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 1.7519553e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:08,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43543 samples/s/p 3:15:18 } +2024-07-25 21:55:11,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 165/ 1625], loss: 0.986, per_step_time: 1471ms, lr: 1.7513383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:11,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43710 samples/s/p 3:15:12 } +2024-07-25 21:55:14,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 167/ 1625], loss: 1.230, per_step_time: 1473ms, lr: 1.7507215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:14,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43071 samples/s/p 3:15:22 } +2024-07-25 21:55:17,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 169/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.7501043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:17,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43336 samples/s/p 3:15:14 } +2024-07-25 21:55:20,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 171/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.7494875e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:55:20,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.43404 samples/s/p 3:15:09 } +2024-07-25 21:55:23,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 173/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 1.7488705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:23,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.43568 samples/s/p 3:15:03 } +2024-07-25 21:55:26,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 175/ 1625], loss: 1.275, per_step_time: 1469ms, lr: 1.7482535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:26,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.44292 samples/s/p 3:14:44 } +2024-07-25 21:55:29,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 177/ 1625], loss: 1.212, per_step_time: 1472ms, lr: 1.7476359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:29,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.43321 samples/s/p 3:15:02 } +2024-07-25 21:55:32,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 179/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 1.747019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:32,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.42860 samples/s/p 3:15:09 } +2024-07-25 21:55:35,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 181/ 1625], loss: 1.304, per_step_time: 1472ms, lr: 1.7464017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:35,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% 
|█████████████████████████ | 5.43202 samples/s/p 3:14:59 } +2024-07-25 21:55:38,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 183/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 1.7457845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:38,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.43585 samples/s/p 3:14:48 } +2024-07-25 21:55:41,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 185/ 1625], loss: 1.223, per_step_time: 1474ms, lr: 1.7451674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:41,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.42576 samples/s/p 3:15:07 } +2024-07-25 21:55:44,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 187/ 1625], loss: 1.056, per_step_time: 1472ms, lr: 1.74455e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:44,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43267 samples/s/p 3:14:49 } +2024-07-25 21:55:47,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 189/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 1.7439326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:47,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43735 samples/s/p 3:14:36 } +2024-07-25 21:55:50,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 191/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 1.7433153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:50,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43874 samples/s/p 3:14:30 } +2024-07-25 21:55:53,208 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 193/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 1.7426979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:53,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43314 samples/s/p 3:14:39 } +2024-07-25 21:55:56,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 195/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.7420805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:56,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43674 samples/s/p 3:14:28 } +2024-07-25 21:55:59,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 197/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 1.741463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:59,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.44049 samples/s/p 3:14:17 } +2024-07-25 21:56:02,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 199/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 1.7408454e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:02,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43503 samples/s/p 3:14:26 } +2024-07-25 21:56:05,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 201/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 1.740228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:05,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43221 samples/s/p 3:14:29 } +2024-07-25 21:56:07,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 203/ 1625], loss: 1.177, 
per_step_time: 1470ms, lr: 1.7396103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:07,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.44093 samples/s/p 3:14:08 } +2024-07-25 21:56:10,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 205/ 1625], loss: 1.142, per_step_time: 1473ms, lr: 1.7389928e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:10,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.42987 samples/s/p 3:14:28 } +2024-07-25 21:56:13,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 207/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.7383752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:13,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43563 samples/s/p 3:14:13 } +2024-07-25 21:56:16,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 209/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 1.7377573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:16,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43716 samples/s/p 3:14:07 } +2024-07-25 21:56:19,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 211/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 1.7371396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:19,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43168 samples/s/p 3:14:16 } +2024-07-25 21:56:22,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 213/ 1625], loss: 1.324, per_step_time: 1473ms, lr: 1.7365219e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:22,717 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43102 samples/s/p 3:14:14 } +2024-07-25 21:56:25,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 215/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 1.735904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:25,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43522 samples/s/p 3:14:02 } +2024-07-25 21:56:28,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 217/ 1625], loss: 1.055, per_step_time: 1473ms, lr: 1.7352862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:28,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43058 samples/s/p 3:14:09 } +2024-07-25 21:56:31,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 219/ 1625], loss: 1.014, per_step_time: 1471ms, lr: 1.7346685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:31,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43506 samples/s/p 3:13:57 } +2024-07-25 21:56:34,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 221/ 1625], loss: 1.076, per_step_time: 1473ms, lr: 1.7340506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:34,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.42898 samples/s/p 3:14:07 } +2024-07-25 21:56:37,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 223/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 1.7334327e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:37,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43362 
samples/s/p 3:13:54 } +2024-07-25 21:56:40,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 225/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 1.7328146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:40,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43872 samples/s/p 3:13:40 } +2024-07-25 21:56:43,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 227/ 1625], loss: 1.229, per_step_time: 1474ms, lr: 1.7321967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:43,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.42395 samples/s/p 3:14:09 } +2024-07-25 21:56:46,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 229/ 1625], loss: 0.899, per_step_time: 1471ms, lr: 1.7315788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:46,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43566 samples/s/p 3:13:41 } +2024-07-25 21:56:49,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 231/ 1625], loss: 0.989, per_step_time: 1469ms, lr: 1.7309607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:49,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.44375 samples/s/p 3:13:20 } +2024-07-25 21:56:52,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 233/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.7303424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:52,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43740 samples/s/p 3:13:31 } +2024-07-25 21:56:55,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 6/ 10], step:[ 235/ 1625], loss: 1.290, per_step_time: 1470ms, lr: 1.7297245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:55,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43882 samples/s/p 3:13:25 } +2024-07-25 21:56:58,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 237/ 1625], loss: 1.151, per_step_time: 1470ms, lr: 1.729106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:58,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43985 samples/s/p 3:13:20 } +2024-07-25 21:57:01,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 239/ 1625], loss: 1.328, per_step_time: 1472ms, lr: 1.728488e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:01,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43124 samples/s/p 3:13:35 } +2024-07-25 21:57:04,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 241/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 1.7278699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:04,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43285 samples/s/p 3:13:29 } +2024-07-25 21:57:06,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 243/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 1.7272516e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:06,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43349 samples/s/p 3:13:25 } +2024-07-25 21:57:09,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 245/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 1.7266331e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:57:09,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43908 samples/s/p 3:13:10 } +2024-07-25 21:57:12,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 247/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 1.7260149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:12,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.44178 samples/s/p 3:13:01 } +2024-07-25 21:57:15,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 249/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 1.7253966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:15,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43756 samples/s/p 3:13:07 } +2024-07-25 21:57:18,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 251/ 1625], loss: 1.072, per_step_time: 1470ms, lr: 1.7247781e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:18,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.44205 samples/s/p 3:12:55 } +2024-07-25 21:57:21,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 253/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 1.7241597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:21,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43172 samples/s/p 3:13:14 } +2024-07-25 21:57:24,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 255/ 1625], loss: 1.000, per_step_time: 1470ms, lr: 1.7235412e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:24,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% 
|█████████████████████████ | 5.44012 samples/s/p 3:12:53 } +2024-07-25 21:57:27,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 257/ 1625], loss: 1.069, per_step_time: 1474ms, lr: 1.722923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:27,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.42480 samples/s/p 3:13:23 } +2024-07-25 21:57:30,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 259/ 1625], loss: 1.322, per_step_time: 1470ms, lr: 1.7223043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:30,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.44003 samples/s/p 3:12:47 } +2024-07-25 21:57:33,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 261/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 1.7216857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:33,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43223 samples/s/p 3:13:01 } +2024-07-25 21:57:36,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 263/ 1625], loss: 1.325, per_step_time: 1471ms, lr: 1.7210672e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:36,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43810 samples/s/p 3:12:45 } +2024-07-25 21:57:39,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 265/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 1.7204486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:39,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43811 samples/s/p 3:12:42 } +2024-07-25 21:57:42,385 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 267/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.7198297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:42,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43342 samples/s/p 3:12:49 } +2024-07-25 21:57:45,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 269/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 1.7192113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:45,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43710 samples/s/p 3:12:39 } +2024-07-25 21:57:48,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 271/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 1.7185926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:48,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43416 samples/s/p 3:12:42 } +2024-07-25 21:57:51,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 273/ 1625], loss: 1.273, per_step_time: 1471ms, lr: 1.7179738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:51,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43795 samples/s/p 3:12:31 } +2024-07-25 21:57:54,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 275/ 1625], loss: 1.379, per_step_time: 1470ms, lr: 1.717355e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:54,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43857 samples/s/p 3:12:27 } +2024-07-25 21:57:54,186 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 21:58:30,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 277/ 1625], loss: 1.121, per_step_time: 1884ms, lr: 1.7167362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:30,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 4.24524 samples/s/p 4:06:29 } +2024-07-25 21:58:32,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 279/ 1625], loss: 1.205, per_step_time: 1473ms, lr: 1.7161175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:32,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43018 samples/s/p 3:12:39 } +2024-07-25 21:58:35,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 281/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 1.7154985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:36,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43682 samples/s/p 3:12:22 } +2024-07-25 21:58:39,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 283/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 1.7148795e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:39,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43746 samples/s/p 3:12:17 } +2024-07-25 21:58:42,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 285/ 1625], loss: 0.981, per_step_time: 1470ms, lr: 1.7142607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:42,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.44082 samples/s/p 3:12:07 } +2024-07-25 21:58:45,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], 
step:[ 287/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.7136417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:45,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43243 samples/s/p 3:12:22 } +2024-07-25 21:58:47,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 289/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.7130225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:47,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43818 samples/s/p 3:12:07 } +2024-07-25 21:58:50,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 291/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 1.7124037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:50,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43367 samples/s/p 3:12:14 } +2024-07-25 21:58:53,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 293/ 1625], loss: 1.123, per_step_time: 1470ms, lr: 1.7117847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:53,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.44100 samples/s/p 3:11:55 } +2024-07-25 21:58:56,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 295/ 1625], loss: 0.973, per_step_time: 1470ms, lr: 1.7111655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:56,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43898 samples/s/p 3:11:56 } +2024-07-25 21:58:59,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 297/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 1.7105465e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:58:59,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43715 samples/s/p 3:11:57 } +2024-07-25 21:59:02,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 299/ 1625], loss: 0.974, per_step_time: 1471ms, lr: 1.7099273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:02,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43509 samples/s/p 3:11:59 } +2024-07-25 21:59:05,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 301/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 1.7093083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:05,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.44065 samples/s/p 3:11:44 } +2024-07-25 21:59:08,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 303/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 1.708689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:08,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43523 samples/s/p 3:11:53 } +2024-07-25 21:59:11,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 305/ 1625], loss: 1.362, per_step_time: 1469ms, lr: 1.7080698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:11,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.44529 samples/s/p 3:11:28 } +2024-07-25 21:59:14,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 307/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 1.7074506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:14,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% 
|█████████████████████████ | 5.43671 samples/s/p 3:11:44 } +2024-07-25 21:59:17,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 309/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.7068312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:17,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43506 samples/s/p 3:11:44 } +2024-07-25 21:59:20,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 311/ 1625], loss: 1.137, per_step_time: 1470ms, lr: 1.7062119e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:20,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43901 samples/s/p 3:11:33 } +2024-07-25 21:59:23,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 313/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 1.7055927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:23,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43658 samples/s/p 3:11:35 } +2024-07-25 21:59:26,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 315/ 1625], loss: 1.022, per_step_time: 1472ms, lr: 1.7049733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:26,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43260 samples/s/p 3:11:40 } +2024-07-25 21:59:29,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 317/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.704354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:29,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.43231 samples/s/p 3:11:38 } +2024-07-25 21:59:32,239 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 319/ 1625], loss: 1.081, per_step_time: 1470ms, lr: 1.7037344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:32,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.43987 samples/s/p 3:11:19 } +2024-07-25 21:59:35,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 321/ 1625], loss: 1.310, per_step_time: 1474ms, lr: 1.703115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:35,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.42615 samples/s/p 3:11:45 } +2024-07-25 21:59:38,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 323/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 1.7024955e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:38,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.43389 samples/s/p 3:11:26 } +2024-07-25 21:59:41,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 325/ 1625], loss: 1.131, per_step_time: 1470ms, lr: 1.701876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:41,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.43864 samples/s/p 3:11:13 } +2024-07-25 21:59:44,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 327/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.7012564e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:44,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.43606 samples/s/p 3:11:15 } +2024-07-25 21:59:46,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 329/ 1625], loss: 1.033, 
per_step_time: 1470ms, lr: 1.7006369e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:46,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.43983 samples/s/p 3:11:05 } +2024-07-25 21:59:49,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 331/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 1.7000175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:49,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.43393 samples/s/p 3:11:14 } +2024-07-25 21:59:52,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 333/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.6993976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:52,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.43618 samples/s/p 3:11:06 } +2024-07-25 21:59:55,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 335/ 1625], loss: 1.087, per_step_time: 1470ms, lr: 1.698778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:55,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43919 samples/s/p 3:10:57 } +2024-07-25 21:59:58,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 337/ 1625], loss: 1.244, per_step_time: 1470ms, lr: 1.6981583e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:58,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.44027 samples/s/p 3:10:52 } +2024-07-25 22:00:01,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 339/ 1625], loss: 1.302, per_step_time: 1471ms, lr: 1.6975388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:01,743 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43635 samples/s/p 3:10:57 } +2024-07-25 22:00:04,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 341/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 1.6969188e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:04,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43831 samples/s/p 3:10:50 } +2024-07-25 22:00:07,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 343/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 1.6962991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:07,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43706 samples/s/p 3:10:50 } +2024-07-25 22:00:10,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 345/ 1625], loss: 1.281, per_step_time: 1470ms, lr: 1.6956794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:10,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43945 samples/s/p 3:10:42 } +2024-07-25 22:00:13,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 347/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.6950595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:13,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43324 samples/s/p 3:10:52 } +2024-07-25 22:00:16,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 349/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.6944396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:16,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43803 
samples/s/p 3:10:39 } +2024-07-25 22:00:19,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 351/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 1.69382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:19,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43844 samples/s/p 3:10:35 } +2024-07-25 22:00:22,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 353/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 1.6932001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:22,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43335 samples/s/p 3:10:43 } +2024-07-25 22:00:25,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 355/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 1.69258e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:25,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43782 samples/s/p 3:10:31 } +2024-07-25 22:00:28,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 357/ 1625], loss: 1.276, per_step_time: 1472ms, lr: 1.6919603e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:28,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43432 samples/s/p 3:10:35 } +2024-07-25 22:00:31,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 359/ 1625], loss: 1.077, per_step_time: 1471ms, lr: 1.6913402e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:31,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43702 samples/s/p 3:10:26 } +2024-07-25 22:00:34,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 6/ 10], step:[ 361/ 1625], loss: 1.336, per_step_time: 1471ms, lr: 1.6907201e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:34,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43629 samples/s/p 3:10:25 } +2024-07-25 22:00:37,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 363/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 1.6901002e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:37,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43856 samples/s/p 3:10:17 } +2024-07-25 22:00:40,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 365/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.68948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:40,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43557 samples/s/p 3:10:21 } +2024-07-25 22:00:43,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 367/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 1.68886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:43,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43273 samples/s/p 3:10:24 } +2024-07-25 22:00:45,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 369/ 1625], loss: 1.036, per_step_time: 1471ms, lr: 1.6882399e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:45,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43482 samples/s/p 3:10:16 } +2024-07-25 22:00:48,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 371/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.6876196e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:00:48,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43587 samples/s/p 3:10:11 } +2024-07-25 22:00:51,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 373/ 1625], loss: 1.123, per_step_time: 1474ms, lr: 1.6869997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:51,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.42471 samples/s/p 3:10:32 } +2024-07-25 22:00:54,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 375/ 1625], loss: 1.107, per_step_time: 1473ms, lr: 1.6863796e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:54,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.42826 samples/s/p 3:10:21 } +2024-07-25 22:00:57,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 377/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 1.6857595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:57,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43738 samples/s/p 3:09:59 } +2024-07-25 22:01:00,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 379/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 1.685139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:00,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43139 samples/s/p 3:10:09 } +2024-07-25 22:01:03,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 381/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.6845188e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:03,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
52.3% |██████████████████████████ | 5.43539 samples/s/p 3:09:57 } +2024-07-25 22:01:06,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 383/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 1.6838985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:06,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43103 samples/s/p 3:10:04 } +2024-07-25 22:01:09,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 385/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 1.6832782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:09,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.42912 samples/s/p 3:10:05 } +2024-07-25 22:01:12,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 387/ 1625], loss: 1.080, per_step_time: 1473ms, lr: 1.682658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:12,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.42757 samples/s/p 3:10:05 } +2024-07-25 22:01:15,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 389/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 1.6820375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:15,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43571 samples/s/p 3:09:45 } +2024-07-25 22:01:18,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 391/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 1.6814174e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:18,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43261 samples/s/p 3:09:49 } +2024-07-25 22:01:21,425 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 393/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 1.6807968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:21,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43823 samples/s/p 3:09:34 } +2024-07-25 22:01:24,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 395/ 1625], loss: 1.084, per_step_time: 1479ms, lr: 1.6801763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:24,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.40865 samples/s/p 3:10:33 } +2024-07-25 22:01:27,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 397/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 1.679556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:27,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43650 samples/s/p 3:09:32 } +2024-07-25 22:01:30,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 399/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 1.6789356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:30,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43628 samples/s/p 3:09:29 } +2024-07-25 22:01:33,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 401/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.678315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:33,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43290 samples/s/p 3:09:33 } +2024-07-25 22:01:36,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 403/ 1625], loss: 
1.256, per_step_time: 1470ms, lr: 1.6776945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:36,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43994 samples/s/p 3:09:16 } +2024-07-25 22:01:39,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 405/ 1625], loss: 1.144, per_step_time: 1470ms, lr: 1.6770739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:39,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.44095 samples/s/p 3:09:10 } +2024-07-25 22:01:42,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 407/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 1.6764534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:42,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43392 samples/s/p 3:09:22 } +2024-07-25 22:01:45,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 409/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.6758328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:45,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43562 samples/s/p 3:09:16 } +2024-07-25 22:01:48,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 411/ 1625], loss: 1.214, per_step_time: 1483ms, lr: 1.6752121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:48,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.39162 samples/s/p 3:10:45 } +2024-07-25 22:01:50,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 413/ 1625], loss: 0.987, per_step_time: 1471ms, lr: 1.6745917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:01:50,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43760 samples/s/p 3:09:06 } +2024-07-25 22:01:53,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 415/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 1.6739708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:53,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43437 samples/s/p 3:09:09 } +2024-07-25 22:01:56,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 417/ 1625], loss: 1.017, per_step_time: 1470ms, lr: 1.6733502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:56,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43996 samples/s/p 3:08:55 } +2024-07-25 22:01:59,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 419/ 1625], loss: 1.198, per_step_time: 1473ms, lr: 1.6727296e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:59,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.42987 samples/s/p 3:09:13 } +2024-07-25 22:02:02,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 421/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 1.672109e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:02,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43463 samples/s/p 3:09:00 } +2024-07-25 22:02:05,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 423/ 1625], loss: 1.291, per_step_time: 1474ms, lr: 1.671488e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:05,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% 
|██████████████████████████ | 5.42602 samples/s/p 3:09:15 } +2024-07-25 22:02:08,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 425/ 1625], loss: 0.963, per_step_time: 1471ms, lr: 1.6708673e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:08,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43715 samples/s/p 3:08:49 } +2024-07-25 22:02:11,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 427/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 1.6702465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:11,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43802 samples/s/p 3:08:44 } +2024-07-25 22:02:14,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 429/ 1625], loss: 1.089, per_step_time: 1473ms, lr: 1.6696256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:14,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.42990 samples/s/p 3:08:58 } +2024-07-25 22:02:17,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 431/ 1625], loss: 1.230, per_step_time: 1474ms, lr: 1.6690048e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:17,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.42551 samples/s/p 3:09:04 } +2024-07-25 22:02:20,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 433/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.6683838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:20,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43178 samples/s/p 3:08:48 } +2024-07-25 22:02:23,445 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 435/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 1.6677632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:23,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43533 samples/s/p 3:08:38 } +2024-07-25 22:02:26,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 437/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.6671422e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:26,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43319 samples/s/p 3:08:40 } +2024-07-25 22:02:29,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 439/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.6665212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:29,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43162 samples/s/p 3:08:40 } +2024-07-25 22:02:32,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 441/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 1.6659005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:32,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43525 samples/s/p 3:08:29 } +2024-07-25 22:02:35,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 443/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 1.6652793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:35,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43432 samples/s/p 3:08:28 } +2024-07-25 22:02:38,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 445/ 1625], loss: 
1.198, per_step_time: 1471ms, lr: 1.6646582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:38,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43604 samples/s/p 3:08:22 } +2024-07-25 22:02:41,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 447/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 1.6640375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:41,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43183 samples/s/p 3:08:28 } +2024-07-25 22:02:44,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 449/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.6634163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:44,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43244 samples/s/p 3:08:23 } +2024-07-25 22:02:47,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 451/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 1.6627953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:47,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43661 samples/s/p 3:08:12 } +2024-07-25 22:02:50,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 453/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.6621743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:50,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43132 samples/s/p 3:08:20 } +2024-07-25 22:02:52,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 455/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 1.661553e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:02:52,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43691 samples/s/p 3:08:05 } +2024-07-25 22:02:55,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 457/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 1.6609321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:55,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43611 samples/s/p 3:08:04 } +2024-07-25 22:02:58,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 459/ 1625], loss: 1.000, per_step_time: 1472ms, lr: 1.6603108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:58,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43386 samples/s/p 3:08:06 } +2024-07-25 22:03:01,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 461/ 1625], loss: 1.101, per_step_time: 1469ms, lr: 1.6596896e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:01,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.44322 samples/s/p 3:07:43 } +2024-07-25 22:03:04,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 463/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.6590686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:04,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43558 samples/s/p 3:07:56 } +2024-07-25 22:03:07,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 465/ 1625], loss: 1.186, per_step_time: 1473ms, lr: 1.6584474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:07,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% 
|██████████████████████████ | 5.42932 samples/s/p 3:08:06 } +2024-07-25 22:03:10,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 467/ 1625], loss: 0.951, per_step_time: 1471ms, lr: 1.657826e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:10,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43517 samples/s/p 3:07:51 } +2024-07-25 22:03:13,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 469/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 1.6572048e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:13,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43842 samples/s/p 3:07:42 } +2024-07-25 22:03:16,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 471/ 1625], loss: 1.016, per_step_time: 1473ms, lr: 1.6565837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:16,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43026 samples/s/p 3:07:56 } +2024-07-25 22:03:19,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 473/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 1.6559625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:19,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43168 samples/s/p 3:07:50 } +2024-07-25 22:03:22,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 475/ 1625], loss: 1.308, per_step_time: 1472ms, lr: 1.6553411e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:22,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43426 samples/s/p 3:07:41 } +2024-07-25 22:03:25,422 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 477/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.6547197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:25,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43510 samples/s/p 3:07:37 } +2024-07-25 22:03:28,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 479/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 1.6540986e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:28,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43655 samples/s/p 3:07:31 } +2024-07-25 22:03:31,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 481/ 1625], loss: 1.252, per_step_time: 1477ms, lr: 1.653477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:31,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.41524 samples/s/p 3:08:12 } +2024-07-25 22:03:34,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 483/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 1.6528556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:34,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43190 samples/s/p 3:07:35 } +2024-07-25 22:03:37,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 485/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 1.6522345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:37,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43411 samples/s/p 3:07:27 } +2024-07-25 22:03:40,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 487/ 1625], loss: 
1.072, per_step_time: 1483ms, lr: 1.651613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:40,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.39103 samples/s/p 3:08:54 } +2024-07-25 22:03:43,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 489/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 1.6509914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:43,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43284 samples/s/p 3:07:24 } +2024-07-25 22:03:46,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 491/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 1.6503702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:46,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43725 samples/s/p 3:07:12 } +2024-07-25 22:03:49,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 493/ 1625], loss: 1.224, per_step_time: 1471ms, lr: 1.6497484e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:49,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43841 samples/s/p 3:07:06 } +2024-07-25 22:03:52,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 495/ 1625], loss: 1.051, per_step_time: 1470ms, lr: 1.649127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:52,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43917 samples/s/p 3:07:02 } +2024-07-25 22:03:54,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 497/ 1625], loss: 1.268, per_step_time: 1471ms, lr: 1.6485055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:54,963 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43629 samples/s/p 3:07:05 } +2024-07-25 22:03:57,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 499/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 1.6478842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:57,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43745 samples/s/p 3:06:59 } +2024-07-25 22:04:00,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 501/ 1625], loss: 1.102, per_step_time: 1474ms, lr: 1.6472628e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:00,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.42397 samples/s/p 3:07:24 } +2024-07-25 22:04:03,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 503/ 1625], loss: 1.243, per_step_time: 1470ms, lr: 1.6466409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:03,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43972 samples/s/p 3:06:49 } +2024-07-25 22:04:06,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 505/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 1.6460193e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:06,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43241 samples/s/p 3:07:01 } +2024-07-25 22:04:09,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 507/ 1625], loss: 1.141, per_step_time: 1470ms, lr: 1.645398e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:09,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.44170 
samples/s/p 3:06:39 } +2024-07-25 22:04:12,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 509/ 1625], loss: 1.268, per_step_time: 1472ms, lr: 1.6447762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:12,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43240 samples/s/p 3:06:55 } +2024-07-25 22:04:15,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 511/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 1.6441545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:15,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43298 samples/s/p 3:06:51 } +2024-07-25 22:04:18,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 513/ 1625], loss: 1.055, per_step_time: 1471ms, lr: 1.6435331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:18,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43687 samples/s/p 3:06:40 } +2024-07-25 22:04:21,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 515/ 1625], loss: 1.060, per_step_time: 1471ms, lr: 1.6429112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:21,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43557 samples/s/p 3:06:40 } +2024-07-25 22:04:24,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 517/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 1.6422895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:24,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43168 samples/s/p 3:06:45 } +2024-07-25 22:04:27,428 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 6/ 10], step:[ 519/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 1.641668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:27,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43221 samples/s/p 3:06:41 } +2024-07-25 22:04:30,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 521/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 1.6410462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:30,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43437 samples/s/p 3:06:33 } +2024-07-25 22:04:33,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 523/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 1.6404245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:33,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43367 samples/s/p 3:06:32 } +2024-07-25 22:04:36,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 525/ 1625], loss: 1.376, per_step_time: 1473ms, lr: 1.6398028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:36,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.42753 samples/s/p 3:06:42 } +2024-07-25 22:04:39,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 527/ 1625], loss: 1.008, per_step_time: 1473ms, lr: 1.639181e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:39,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43055 samples/s/p 3:06:32 } +2024-07-25 22:04:42,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 529/ 1625], loss: 1.129, per_step_time: 1470ms, lr: 1.6385593e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 22:04:42,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.44042 samples/s/p 3:06:09 } +2024-07-25 22:04:45,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 531/ 1625], loss: 1.436, per_step_time: 1472ms, lr: 1.6379374e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:45,140 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.43152 samples/s/p 3:06:25 } +2024-07-25 22:04:48,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 533/ 1625], loss: 1.165, per_step_time: 1470ms, lr: 1.6373155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:48,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.44020 samples/s/p 3:06:04 } +2024-07-25 22:04:51,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 535/ 1625], loss: 1.201, per_step_time: 1470ms, lr: 1.6366937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:51,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.43878 samples/s/p 3:06:04 } +2024-07-25 22:04:53,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 537/ 1625], loss: 1.072, per_step_time: 1470ms, lr: 1.636072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:53,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.44113 samples/s/p 3:05:56 } +2024-07-25 22:04:56,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 539/ 1625], loss: 1.180, per_step_time: 1470ms, lr: 1.6354501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:56,934 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 53.3% |██████████████████████████ | 5.43871 samples/s/p 3:05:58 } +2024-07-25 22:04:59,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 541/ 1625], loss: 1.300, per_step_time: 1471ms, lr: 1.6348282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:59,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.43490 samples/s/p 3:06:03 } +2024-07-25 22:05:02,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 543/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.6342063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:02,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.43194 samples/s/p 3:06:06 } +2024-07-25 22:05:05,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 545/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 1.6335844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:05,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.44101 samples/s/p 3:05:44 } +2024-07-25 22:05:08,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 547/ 1625], loss: 1.291, per_step_time: 1472ms, lr: 1.6329626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:08,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43215 samples/s/p 3:06:00 } +2024-07-25 22:05:11,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 549/ 1625], loss: 1.330, per_step_time: 1471ms, lr: 1.6323405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:11,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43595 samples/s/p 3:05:49 } +2024-07-25 22:05:14,638 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 551/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 1.6317186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:14,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43657 samples/s/p 3:05:45 } +2024-07-25 22:05:17,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 553/ 1625], loss: 1.262, per_step_time: 1474ms, lr: 1.6310967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:17,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.42490 samples/s/p 3:06:06 } +2024-07-25 22:05:20,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 555/ 1625], loss: 1.357, per_step_time: 1471ms, lr: 1.6304746e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:20,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43800 samples/s/p 3:05:36 } +2024-07-25 22:05:23,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 557/ 1625], loss: 1.058, per_step_time: 1475ms, lr: 1.6298527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:23,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.42181 samples/s/p 3:06:06 } +2024-07-25 22:05:26,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 559/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 1.6292306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:26,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43589 samples/s/p 3:05:34 } +2024-07-25 22:05:29,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 561/ 1625], loss: 
1.229, per_step_time: 1473ms, lr: 1.6286087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:29,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.42800 samples/s/p 3:05:48 } +2024-07-25 22:05:32,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 563/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 1.6279866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:32,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.43544 samples/s/p 3:05:29 } +2024-07-25 22:05:35,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 565/ 1625], loss: 0.905, per_step_time: 1471ms, lr: 1.6273645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:35,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.43618 samples/s/p 3:05:25 } +2024-07-25 22:05:38,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 567/ 1625], loss: 1.168, per_step_time: 1473ms, lr: 1.6267424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:38,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.42853 samples/s/p 3:05:38 } +2024-07-25 22:05:41,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 569/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 1.6261205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:41,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.43280 samples/s/p 3:05:26 } +2024-07-25 22:05:44,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 571/ 1625], loss: 1.005, per_step_time: 1470ms, lr: 1.6254982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:05:44,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.43850 samples/s/p 3:05:11 } +2024-07-25 22:05:47,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 573/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 1.6248761e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:47,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.44089 samples/s/p 3:05:04 } +2024-07-25 22:05:50,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 575/ 1625], loss: 1.241, per_step_time: 1474ms, lr: 1.6242542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:50,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.42658 samples/s/p 3:05:30 } +2024-07-25 22:05:53,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 577/ 1625], loss: 1.043, per_step_time: 1472ms, lr: 1.623632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:53,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43199 samples/s/p 3:05:16 } +2024-07-25 22:05:55,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 579/ 1625], loss: 1.273, per_step_time: 1472ms, lr: 1.6230098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:55,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43309 samples/s/p 3:05:11 } +2024-07-25 22:05:58,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 581/ 1625], loss: 1.178, per_step_time: 1474ms, lr: 1.6223876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:58,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% 
|██████████████████████████ | 5.42706 samples/s/p 3:05:20 } +2024-07-25 22:06:01,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 583/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 1.6217655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:01,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43544 samples/s/p 3:05:00 } +2024-07-25 22:06:04,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 585/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 1.6211432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:04,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43326 samples/s/p 3:05:01 } +2024-07-25 22:06:07,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 587/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.6205211e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:07,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43730 samples/s/p 3:04:50 } +2024-07-25 22:06:10,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 589/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 1.6198988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:10,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43851 samples/s/p 3:04:45 } +2024-07-25 22:06:13,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 591/ 1625], loss: 0.934, per_step_time: 1470ms, lr: 1.6192767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:13,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.44141 samples/s/p 3:04:36 } +2024-07-25 22:06:16,624 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 593/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 1.6186543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:16,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43763 samples/s/p 3:04:41 } +2024-07-25 22:06:19,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 595/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 1.618032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:19,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43404 samples/s/p 3:04:45 } +2024-07-25 22:06:22,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 597/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 1.6174099e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:22,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43861 samples/s/p 3:04:33 } +2024-07-25 22:06:25,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 599/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 1.6167876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:25,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.44015 samples/s/p 3:04:27 } +2024-07-25 22:06:28,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 601/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 1.6161654e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:28,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43665 samples/s/p 3:04:31 } +2024-07-25 22:06:31,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 603/ 1625], loss: 
1.143, per_step_time: 1471ms, lr: 1.6155429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:31,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43492 samples/s/p 3:04:32 } +2024-07-25 22:06:34,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 605/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 1.6149206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:34,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43774 samples/s/p 3:04:23 } +2024-07-25 22:06:37,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 607/ 1625], loss: 1.029, per_step_time: 1472ms, lr: 1.6142983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:37,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43435 samples/s/p 3:04:27 } +2024-07-25 22:06:40,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 609/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 1.6136759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:40,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43335 samples/s/p 3:04:26 } +2024-07-25 22:06:43,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 611/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.6130536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:43,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.43953 samples/s/p 3:04:10 } +2024-07-25 22:06:46,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 613/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 1.6124313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:06:46,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.43130 samples/s/p 3:04:24 } +2024-07-25 22:06:49,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 615/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 1.6118087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:49,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.44096 samples/s/p 3:04:02 } +2024-07-25 22:06:52,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 617/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.6111862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:52,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.44092 samples/s/p 3:03:59 } +2024-07-25 22:06:54,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 619/ 1625], loss: 1.076, per_step_time: 1475ms, lr: 1.6105641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:54,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.42295 samples/s/p 3:04:32 } +2024-07-25 22:06:57,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 621/ 1625], loss: 1.093, per_step_time: 1473ms, lr: 1.6099417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:57,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.42958 samples/s/p 3:04:16 } +2024-07-25 22:07:00,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 623/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 1.609319e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:00,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% 
|██████████████████████████ | 5.43458 samples/s/p 3:04:03 } +2024-07-25 22:07:03,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 625/ 1625], loss: 1.006, per_step_time: 1472ms, lr: 1.6086968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:03,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.43397 samples/s/p 3:04:01 } +2024-07-25 22:07:06,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 627/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 1.6080743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:06,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43610 samples/s/p 3:03:54 } +2024-07-25 22:07:09,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 629/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.6074518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:09,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43222 samples/s/p 3:03:59 } +2024-07-25 22:07:12,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 631/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 1.6068294e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:12,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43402 samples/s/p 3:03:52 } +2024-07-25 22:07:15,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 633/ 1625], loss: 1.459, per_step_time: 1472ms, lr: 1.606207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:15,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43381 samples/s/p 3:03:50 } +2024-07-25 22:07:18,596 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 635/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 1.6055847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:18,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43180 samples/s/p 3:03:51 } +2024-07-25 22:07:21,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 637/ 1625], loss: 1.307, per_step_time: 1475ms, lr: 1.6049618e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:21,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.42211 samples/s/p 3:04:08 } +2024-07-25 22:07:24,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 639/ 1625], loss: 0.981, per_step_time: 1473ms, lr: 1.6043394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:24,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.42913 samples/s/p 3:03:50 } +2024-07-25 22:07:27,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 641/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 1.603717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:27,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43559 samples/s/p 3:03:34 } +2024-07-25 22:07:30,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 643/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.6030945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:30,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.43481 samples/s/p 3:03:33 } +2024-07-25 22:07:33,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 645/ 1625], loss: 
1.152, per_step_time: 1473ms, lr: 1.6024716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:33,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.43052 samples/s/p 3:03:39 } +2024-07-25 22:07:36,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 647/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.6018494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:36,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.43477 samples/s/p 3:03:27 } +2024-07-25 22:07:39,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 649/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.6012267e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:39,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.43159 samples/s/p 3:03:31 } +2024-07-25 22:07:42,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 651/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 1.600604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:42,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.43341 samples/s/p 3:03:24 } +2024-07-25 22:07:45,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 653/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 1.5999816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:45,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.43177 samples/s/p 3:03:24 } +2024-07-25 22:07:48,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 655/ 1625], loss: 1.053, per_step_time: 1470ms, lr: 1.599359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:07:48,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.44194 samples/s/p 3:03:01 } +2024-07-25 22:07:51,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 657/ 1625], loss: 1.057, per_step_time: 1470ms, lr: 1.5987367e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:51,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.44020 samples/s/p 3:03:01 } +2024-07-25 22:07:54,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 659/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.5981137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:54,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43181 samples/s/p 3:03:15 } +2024-07-25 22:07:56,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 661/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 1.597491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:56,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.44095 samples/s/p 3:02:54 } +2024-07-25 22:07:59,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 663/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 1.5968686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:59,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43889 samples/s/p 3:02:55 } +2024-07-25 22:08:02,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 665/ 1625], loss: 1.366, per_step_time: 1472ms, lr: 1.596246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:02,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% 
|███████████████████████████ | 5.43344 samples/s/p 3:03:03 } +2024-07-25 22:08:05,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 667/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 1.5956231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:05,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43499 samples/s/p 3:02:57 } +2024-07-25 22:08:08,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 669/ 1625], loss: 0.984, per_step_time: 1471ms, lr: 1.5950009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:08,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43664 samples/s/p 3:02:51 } +2024-07-25 22:08:11,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 671/ 1625], loss: 1.056, per_step_time: 1471ms, lr: 1.5943782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:11,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43841 samples/s/p 3:02:44 } +2024-07-25 22:08:14,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 673/ 1625], loss: 1.216, per_step_time: 1473ms, lr: 1.5937554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:14,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.42877 samples/s/p 3:03:01 } +2024-07-25 22:08:17,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 675/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.5931328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:17,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43816 samples/s/p 3:02:39 } +2024-07-25 22:08:20,572 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 677/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 1.59251e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:20,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43358 samples/s/p 3:02:45 } +2024-07-25 22:08:23,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 679/ 1625], loss: 1.321, per_step_time: 1471ms, lr: 1.5918875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:23,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43537 samples/s/p 3:02:39 } +2024-07-25 22:08:26,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 681/ 1625], loss: 1.239, per_step_time: 1470ms, lr: 1.5912645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:26,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43849 samples/s/p 3:02:30 } +2024-07-25 22:08:29,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 683/ 1625], loss: 1.316, per_step_time: 1471ms, lr: 1.5906418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:29,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43632 samples/s/p 3:02:31 } +2024-07-25 22:08:32,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 685/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.5900194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:32,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43115 samples/s/p 3:02:39 } +2024-07-25 22:08:35,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 687/ 1625], loss: 
1.299, per_step_time: 1471ms, lr: 1.5893967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:35,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43739 samples/s/p 3:02:23 } +2024-07-25 22:08:38,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 689/ 1625], loss: 1.229, per_step_time: 1470ms, lr: 1.5887737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:38,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43980 samples/s/p 3:02:15 } +2024-07-25 22:08:41,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 691/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 1.5881511e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:41,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43047 samples/s/p 3:02:31 } +2024-07-25 22:08:44,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 693/ 1625], loss: 0.993, per_step_time: 1471ms, lr: 1.5875283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:44,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43766 samples/s/p 3:02:14 } +2024-07-25 22:08:47,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 695/ 1625], loss: 1.366, per_step_time: 1473ms, lr: 1.5869056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:47,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43003 samples/s/p 3:02:26 } +2024-07-25 22:08:50,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 697/ 1625], loss: 1.421, per_step_time: 1472ms, lr: 1.586283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:08:50,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43196 samples/s/p 3:02:19 } +2024-07-25 22:08:53,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 699/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.5856602e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:53,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43111 samples/s/p 3:02:18 } +2024-07-25 22:08:55,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 701/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 1.5850375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:55,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43374 samples/s/p 3:02:10 } +2024-07-25 22:08:58,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 703/ 1625], loss: 1.276, per_step_time: 1472ms, lr: 1.5844147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:58,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43395 samples/s/p 3:02:06 } +2024-07-25 22:09:01,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 705/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 1.5837917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:01,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43642 samples/s/p 3:01:58 } +2024-07-25 22:09:04,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 707/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 1.583169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:04,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% 
|███████████████████████████ | 5.42877 samples/s/p 3:02:11 } +2024-07-25 22:09:07,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 709/ 1625], loss: 1.204, per_step_time: 1474ms, lr: 1.5825464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:07,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.42454 samples/s/p 3:02:16 } +2024-07-25 22:09:10,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 711/ 1625], loss: 1.307, per_step_time: 1472ms, lr: 1.5819236e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:10,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43273 samples/s/p 3:01:57 } +2024-07-25 22:09:13,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 713/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 1.5813008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:13,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43217 samples/s/p 3:01:55 } +2024-07-25 22:09:16,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 715/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 1.5806778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:16,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43661 samples/s/p 3:01:43 } +2024-07-25 22:09:19,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 717/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.580055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:19,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43542 samples/s/p 3:01:43 } +2024-07-25 22:09:22,556 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 719/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.5794321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:22,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43400 samples/s/p 3:01:43 } +2024-07-25 22:09:25,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 721/ 1625], loss: 1.109, per_step_time: 1470ms, lr: 1.5788095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:25,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43850 samples/s/p 3:01:31 } +2024-07-25 22:09:28,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 723/ 1625], loss: 1.309, per_step_time: 1473ms, lr: 1.5781865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:28,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.42949 samples/s/p 3:01:46 } +2024-07-25 22:09:31,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 725/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 1.5775639e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:31,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43404 samples/s/p 3:01:34 } +2024-07-25 22:09:34,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 727/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 1.5769408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:34,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43671 samples/s/p 3:01:25 } +2024-07-25 22:09:37,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 729/ 1625], 
loss: 1.188, per_step_time: 1471ms, lr: 1.576318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:37,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43626 samples/s/p 3:01:23 } +2024-07-25 22:09:40,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 731/ 1625], loss: 1.017, per_step_time: 1470ms, lr: 1.5756952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:40,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43878 samples/s/p 3:01:15 } +2024-07-25 22:09:43,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 733/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 1.5750724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:43,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43496 samples/s/p 3:01:20 } +2024-07-25 22:09:46,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 735/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 1.5744496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:46,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43383 samples/s/p 3:01:19 } +2024-07-25 22:09:49,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 737/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 1.5738266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:49,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43266 samples/s/p 3:01:19 } +2024-07-25 22:09:52,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 739/ 1625], loss: 1.012, per_step_time: 1470ms, lr: 1.5732037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:09:52,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43953 samples/s/p 3:01:02 } +2024-07-25 22:09:55,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 741/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 1.5725807e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:55,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.44055 samples/s/p 3:00:57 } +2024-07-25 22:09:57,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 743/ 1625], loss: 1.132, per_step_time: 1473ms, lr: 1.5719581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:57,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.43094 samples/s/p 3:01:14 } +2024-07-25 22:10:00,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 745/ 1625], loss: 1.328, per_step_time: 1472ms, lr: 1.571335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:00,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.43249 samples/s/p 3:01:07 } +2024-07-25 22:10:03,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 747/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 1.5707124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:03,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.42745 samples/s/p 3:01:15 } +2024-07-25 22:10:06,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 749/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 1.5700893e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:06,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% 
|███████████████████████████ | 5.43811 samples/s/p 3:00:50 } +2024-07-25 22:10:09,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 751/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 1.5694664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:09,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.43662 samples/s/p 3:00:50 } +2024-07-25 22:10:12,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 753/ 1625], loss: 1.100, per_step_time: 1473ms, lr: 1.5688438e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:12,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.42770 samples/s/p 3:01:05 } +2024-07-25 22:10:15,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 755/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 1.5682208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:15,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.43399 samples/s/p 3:00:50 } +2024-07-25 22:10:18,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 757/ 1625], loss: 1.340, per_step_time: 1472ms, lr: 1.5675978e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:18,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43126 samples/s/p 3:00:52 } +2024-07-25 22:10:21,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 759/ 1625], loss: 1.211, per_step_time: 1474ms, lr: 1.5669748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:21,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.42479 samples/s/p 3:01:02 } +2024-07-25 22:10:24,537 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 761/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 1.566352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:24,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43601 samples/s/p 3:00:37 } +2024-07-25 22:10:27,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 763/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 1.5657291e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:27,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43751 samples/s/p 3:00:31 } +2024-07-25 22:10:30,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 765/ 1625], loss: 1.094, per_step_time: 1473ms, lr: 1.5651061e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:30,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43002 samples/s/p 3:00:43 } +2024-07-25 22:10:33,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 767/ 1625], loss: 1.163, per_step_time: 1473ms, lr: 1.5644831e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:33,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.42832 samples/s/p 3:00:43 } +2024-07-25 22:10:36,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 769/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.5638603e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:36,347 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43370 samples/s/p 3:00:30 } +2024-07-25 22:10:39,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 771/ 1625], 
loss: 1.200, per_step_time: 1471ms, lr: 1.5632373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:39,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43635 samples/s/p 3:00:21 } +2024-07-25 22:10:42,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 773/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.5626145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:42,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43485 samples/s/p 3:00:22 } +2024-07-25 22:10:45,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 775/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.5619917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:45,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43634 samples/s/p 3:00:16 } +2024-07-25 22:10:48,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 777/ 1625], loss: 1.204, per_step_time: 1470ms, lr: 1.5613687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:48,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.44078 samples/s/p 3:00:04 } +2024-07-25 22:10:51,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 779/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 1.5607457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:51,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43644 samples/s/p 3:00:10 } +2024-07-25 22:10:54,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 781/ 1625], loss: 0.989, per_step_time: 1470ms, lr: 1.5601228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:10:54,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43972 samples/s/p 3:00:00 } +2024-07-25 22:10:56,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 783/ 1625], loss: 1.234, per_step_time: 1473ms, lr: 1.5594998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:56,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.42786 samples/s/p 3:00:21 } +2024-07-25 22:10:59,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 785/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 1.5588768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:59,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43413 samples/s/p 3:00:05 } +2024-07-25 22:11:02,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 787/ 1625], loss: 1.202, per_step_time: 1473ms, lr: 1.5582538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:02,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43089 samples/s/p 3:00:09 } +2024-07-25 22:11:05,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 789/ 1625], loss: 1.096, per_step_time: 1470ms, lr: 1.5576308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:05,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.44063 samples/s/p 2:59:46 } +2024-07-25 22:11:08,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 791/ 1625], loss: 1.030, per_step_time: 1470ms, lr: 1.5570082e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:08,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% 
|███████████████████████████ | 5.43848 samples/s/p 2:59:48 } +2024-07-25 22:11:11,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 793/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 1.5563852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:11,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.44054 samples/s/p 2:59:41 } +2024-07-25 22:11:14,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 795/ 1625], loss: 1.086, per_step_time: 1469ms, lr: 1.5557622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:14,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.44565 samples/s/p 2:59:28 } +2024-07-25 22:11:17,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 797/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 1.5551394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:17,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.43763 samples/s/p 2:59:41 } +2024-07-25 22:11:20,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 799/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 1.5545163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:20,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.43268 samples/s/p 2:59:48 } +2024-07-25 22:11:23,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 801/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.5538935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:23,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.43650 samples/s/p 2:59:37 } +2024-07-25 22:11:26,496 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 803/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 1.5532705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:26,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.43159 samples/s/p 2:59:44 } +2024-07-25 22:11:29,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 805/ 1625], loss: 1.086, per_step_time: 1473ms, lr: 1.5526475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:29,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.42885 samples/s/p 2:59:46 } +2024-07-25 22:11:32,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 807/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 1.5520245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:32,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43663 samples/s/p 2:59:28 } +2024-07-25 22:11:35,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 809/ 1625], loss: 0.976, per_step_time: 1472ms, lr: 1.5514017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:35,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43208 samples/s/p 2:59:34 } +2024-07-25 22:11:38,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 811/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 1.5507787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:38,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43311 samples/s/p 2:59:29 } +2024-07-25 22:11:41,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 813/ 1625], 
loss: 1.128, per_step_time: 1471ms, lr: 1.5501559e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:41,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43507 samples/s/p 2:59:22 } +2024-07-25 22:11:44,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 815/ 1625], loss: 1.127, per_step_time: 1469ms, lr: 1.5495329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:44,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.44242 samples/s/p 2:59:05 } +2024-07-25 22:11:47,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 817/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 1.5489097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:47,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43278 samples/s/p 2:59:21 } +2024-07-25 22:11:50,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 819/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 1.5482869e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:50,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43984 samples/s/p 2:59:04 } +2024-07-25 22:11:53,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 821/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 1.5476639e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:53,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.43072 samples/s/p 2:59:19 } +2024-07-25 22:11:56,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 823/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 1.5470408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:11:56,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.43691 samples/s/p 2:59:04 } +2024-07-25 22:11:58,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 825/ 1625], loss: 1.386, per_step_time: 1470ms, lr: 1.546418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:58,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.43851 samples/s/p 2:58:58 } +2024-07-25 22:12:01,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 827/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 1.5457952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:01,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.43483 samples/s/p 2:59:02 } +2024-07-25 22:12:04,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 829/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 1.545172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:04,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.44188 samples/s/p 2:58:45 } +2024-07-25 22:12:07,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 831/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 1.544549e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:07,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.43986 samples/s/p 2:58:46 } +2024-07-25 22:12:10,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 833/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 1.5439264e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:10,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% 
|███████████████████████████ | 5.43853 samples/s/p 2:58:46 } +2024-07-25 22:12:13,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 835/ 1625], loss: 1.101, per_step_time: 1473ms, lr: 1.5433032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:13,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.42995 samples/s/p 2:59:00 } +2024-07-25 22:12:16,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 837/ 1625], loss: 1.278, per_step_time: 1473ms, lr: 1.5426804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:16,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43034 samples/s/p 2:58:56 } +2024-07-25 22:12:19,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 839/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 1.5420575e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:19,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43639 samples/s/p 2:58:41 } +2024-07-25 22:12:22,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 841/ 1625], loss: 1.056, per_step_time: 1472ms, lr: 1.5414344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:22,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43363 samples/s/p 2:58:44 } +2024-07-25 22:12:25,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 843/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 1.5408115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:25,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43580 samples/s/p 2:58:37 } +2024-07-25 22:12:28,464 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 845/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 1.5401885e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:28,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.42980 samples/s/p 2:58:45 } +2024-07-25 22:12:31,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 847/ 1625], loss: 1.219, per_step_time: 1473ms, lr: 1.5395655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:31,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.42998 samples/s/p 2:58:42 } +2024-07-25 22:12:34,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 849/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 1.5389427e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:34,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43416 samples/s/p 2:58:31 } +2024-07-25 22:12:37,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 851/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 1.5383197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:37,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43736 samples/s/p 2:58:22 } +2024-07-25 22:12:40,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 853/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 1.5376969e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:40,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43504 samples/s/p 2:58:23 } +2024-07-25 22:12:43,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 855/ 1625], 
loss: 1.178, per_step_time: 1468ms, lr: 1.5370739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:43,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.44706 samples/s/p 2:57:57 } +2024-07-25 22:12:46,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 857/ 1625], loss: 1.029, per_step_time: 1470ms, lr: 1.5364512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:46,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43966 samples/s/p 2:58:08 } +2024-07-25 22:12:49,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 859/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 1.535828e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:49,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43663 samples/s/p 2:58:11 } +2024-07-25 22:12:52,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 861/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 1.535205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:52,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43089 samples/s/p 2:58:20 } +2024-07-25 22:12:55,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 863/ 1625], loss: 1.023, per_step_time: 1472ms, lr: 1.5345824e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:55,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43423 samples/s/p 2:58:10 } +2024-07-25 22:12:57,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 865/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 1.5339594e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:12:57,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43110 samples/s/p 2:58:13 } +2024-07-25 22:13:00,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 867/ 1625], loss: 1.138, per_step_time: 1473ms, lr: 1.5333366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:00,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.42890 samples/s/p 2:58:15 } +2024-07-25 22:13:03,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 869/ 1625], loss: 1.033, per_step_time: 1470ms, lr: 1.5327136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:03,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43878 samples/s/p 2:57:52 } +2024-07-25 22:13:06,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 871/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 1.5320908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:06,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.43706 samples/s/p 2:57:53 } +2024-07-25 22:13:09,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 873/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 1.5314678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:09,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.43540 samples/s/p 2:57:53 } +2024-07-25 22:13:12,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 875/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 1.5308447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:12,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% 
|███████████████████████████ | 5.43360 samples/s/p 2:57:54 } +2024-07-25 22:13:15,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 877/ 1625], loss: 1.084, per_step_time: 1469ms, lr: 1.5302221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:15,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.44237 samples/s/p 2:57:34 } +2024-07-25 22:13:18,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 879/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 1.529599e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:18,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.44123 samples/s/p 2:57:33 } +2024-07-25 22:13:21,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 881/ 1625], loss: 1.128, per_step_time: 1470ms, lr: 1.5289763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:21,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.44051 samples/s/p 2:57:31 } +2024-07-25 22:13:24,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 883/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 1.5283535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:24,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.44046 samples/s/p 2:57:29 } +2024-07-25 22:13:27,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 885/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 1.5277303e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:27,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.43231 samples/s/p 2:57:42 } +2024-07-25 22:13:30,418 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 887/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 1.5271076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:30,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43469 samples/s/p 2:57:34 } +2024-07-25 22:13:33,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 889/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 1.5264846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:33,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43276 samples/s/p 2:57:35 } +2024-07-25 22:13:36,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 891/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 1.5258617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:36,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43635 samples/s/p 2:57:25 } +2024-07-25 22:13:39,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 893/ 1625], loss: 1.068, per_step_time: 1473ms, lr: 1.525239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:39,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.42816 samples/s/p 2:57:38 } +2024-07-25 22:13:42,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 895/ 1625], loss: 1.454, per_step_time: 1473ms, lr: 1.5246163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:42,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43032 samples/s/p 2:57:31 } +2024-07-25 22:13:45,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 897/ 1625], 
loss: 1.099, per_step_time: 1469ms, lr: 1.52399325e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:45,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.44266 samples/s/p 2:57:04 } +2024-07-25 22:13:48,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 899/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 1.5233704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:48,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43162 samples/s/p 2:57:22 } +2024-07-25 22:13:51,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 901/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 1.5227477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:51,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43344 samples/s/p 2:57:16 } +2024-07-25 22:13:54,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 903/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 1.5221247e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:54,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.44020 samples/s/p 2:57:00 } +2024-07-25 22:13:56,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 905/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 1.5215018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:56,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43223 samples/s/p 2:57:12 } +2024-07-25 22:13:59,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 907/ 1625], loss: 1.248, per_step_time: 1473ms, lr: 1.5208791e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 22:13:59,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43058 samples/s/p 2:57:13 } +2024-07-25 22:14:02,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 909/ 1625], loss: 1.398, per_step_time: 1471ms, lr: 1.5202561e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:02,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43756 samples/s/p 2:56:56 } +2024-07-25 22:14:05,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 911/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 1.5196335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:05,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43640 samples/s/p 2:56:55 } +2024-07-25 22:14:08,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 913/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 1.5190108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:08,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43576 samples/s/p 2:56:54 } +2024-07-25 22:14:11,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 915/ 1625], loss: 1.169, per_step_time: 1472ms, lr: 1.518388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:11,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43354 samples/s/p 2:56:55 } +2024-07-25 22:14:14,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 917/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.517765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:14,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% 
|███████████████████████████ | 5.43572 samples/s/p 2:56:48 } +2024-07-25 22:14:17,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 919/ 1625], loss: 1.329, per_step_time: 1471ms, lr: 1.5171423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:17,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43698 samples/s/p 2:56:42 } +2024-07-25 22:14:20,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 921/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.5165197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:20,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43424 samples/s/p 2:56:45 } +2024-07-25 22:14:23,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 923/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 1.5158967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:23,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43253 samples/s/p 2:56:45 } +2024-07-25 22:14:26,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 925/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.5152741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:26,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43630 samples/s/p 2:56:35 } +2024-07-25 22:14:29,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 927/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 1.5146513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:29,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43312 samples/s/p 2:56:38 } +2024-07-25 22:14:32,390 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 929/ 1625], loss: 1.015, per_step_time: 1470ms, lr: 1.5140283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:32,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43950 samples/s/p 2:56:23 } +2024-07-25 22:14:35,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 931/ 1625], loss: 1.250, per_step_time: 1473ms, lr: 1.5134057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:35,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.42946 samples/s/p 2:56:39 } +2024-07-25 22:14:38,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 933/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 1.512783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:38,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43383 samples/s/p 2:56:28 } +2024-07-25 22:14:41,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 935/ 1625], loss: 0.977, per_step_time: 1469ms, lr: 1.51216e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:41,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.44335 samples/s/p 2:56:07 } +2024-07-25 22:14:44,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 937/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 1.51153745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:44,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.42819 samples/s/p 2:56:33 } +2024-07-25 22:14:47,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 939/ 1625], loss: 
1.120, per_step_time: 1471ms, lr: 1.5109149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:47,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43844 samples/s/p 2:56:10 } +2024-07-25 22:14:50,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 941/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.510292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:50,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43789 samples/s/p 2:56:08 } +2024-07-25 22:14:53,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 943/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 1.5096692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:53,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.42988 samples/s/p 2:56:21 } +2024-07-25 22:14:56,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 945/ 1625], loss: 1.348, per_step_time: 1473ms, lr: 1.5090467e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:56,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43044 samples/s/p 2:56:17 } +2024-07-25 22:14:58,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 947/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 1.5084238e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:58,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43389 samples/s/p 2:56:07 } +2024-07-25 22:15:01,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 949/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 1.5078011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:15:01,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43791 samples/s/p 2:55:56 } +2024-07-25 22:15:04,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 951/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 1.5071786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:04,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43574 samples/s/p 2:55:58 } +2024-07-25 22:15:07,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 953/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 1.5065557e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:07,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43550 samples/s/p 2:55:55 } +2024-07-25 22:15:10,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 955/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.5059332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:10,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43364 samples/s/p 2:55:56 } +2024-07-25 22:15:13,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 957/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 1.5053105e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:13,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43497 samples/s/p 2:55:50 } +2024-07-25 22:15:16,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 959/ 1625], loss: 0.950, per_step_time: 1471ms, lr: 1.5046878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:16,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% 
|███████████████████████████ | 5.43740 samples/s/p 2:55:43 } +2024-07-25 22:15:19,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 961/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.5040652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:19,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43390 samples/s/p 2:55:47 } +2024-07-25 22:15:22,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 963/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 1.5034426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:22,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.42831 samples/s/p 2:55:55 } +2024-07-25 22:15:25,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 965/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 1.5028201e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:25,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43797 samples/s/p 2:55:33 } +2024-07-25 22:15:28,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 967/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.5021974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:28,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.43511 samples/s/p 2:55:35 } +2024-07-25 22:15:31,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 969/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 1.5015748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:31,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.43591 samples/s/p 2:55:31 } +2024-07-25 22:15:34,362 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 971/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 1.5009523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:34,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.43842 samples/s/p 2:55:23 } +2024-07-25 22:15:37,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 973/ 1625], loss: 1.243, per_step_time: 1470ms, lr: 1.5003295e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:37,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.44145 samples/s/p 2:55:14 } +2024-07-25 22:15:40,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 975/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 1.499707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:40,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.43260 samples/s/p 2:55:29 } +2024-07-25 22:15:43,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 977/ 1625], loss: 0.963, per_step_time: 1472ms, lr: 1.4990845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:43,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.43337 samples/s/p 2:55:24 } +2024-07-25 22:15:46,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 979/ 1625], loss: 1.103, per_step_time: 1471ms, lr: 1.4984617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:46,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.43481 samples/s/p 2:55:18 } +2024-07-25 22:15:49,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 981/ 1625], 
loss: 1.077, per_step_time: 1471ms, lr: 1.4978394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:49,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.43636 samples/s/p 2:55:12 } +2024-07-25 22:15:52,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 983/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 1.4972169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:52,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.43035 samples/s/p 2:55:21 } +2024-07-25 22:15:55,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 985/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 1.4965942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:55,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43642 samples/s/p 2:55:06 } +2024-07-25 22:15:57,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 987/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 1.4959717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:57,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43463 samples/s/p 2:55:07 } +2024-07-25 22:16:00,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 989/ 1625], loss: 1.030, per_step_time: 1472ms, lr: 1.49534935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:00,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43336 samples/s/p 2:55:06 } +2024-07-25 22:16:03,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 991/ 1625], loss: 1.453, per_step_time: 1470ms, lr: 1.4947266e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 22:16:03,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.44036 samples/s/p 2:54:50 } +2024-07-25 22:16:06,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 993/ 1625], loss: 0.994, per_step_time: 1471ms, lr: 1.4941042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:06,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43493 samples/s/p 2:54:58 } +2024-07-25 22:16:09,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 995/ 1625], loss: 1.162, per_step_time: 1474ms, lr: 1.4934818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:09,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.42404 samples/s/p 2:55:16 } +2024-07-25 22:16:12,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 997/ 1625], loss: 1.350, per_step_time: 1471ms, lr: 1.4928592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:12,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43724 samples/s/p 2:54:47 } +2024-07-25 22:16:15,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 999/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 1.4922369e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:15,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43084 samples/s/p 2:54:57 } +2024-07-25 22:16:18,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1001/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 1.4916144e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:18,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% 
|████████████████████████████ | 5.43347 samples/s/p 2:54:49 } +2024-07-25 22:16:21,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1003/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 1.4909918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:21,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43549 samples/s/p 2:54:42 } +2024-07-25 22:16:24,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1005/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.4903695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:24,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43951 samples/s/p 2:54:31 } +2024-07-25 22:16:27,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1007/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 1.48974705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:27,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43248 samples/s/p 2:54:42 } +2024-07-25 22:16:30,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1009/ 1625], loss: 1.273, per_step_time: 1472ms, lr: 1.4891244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:30,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43162 samples/s/p 2:54:40 } +2024-07-25 22:16:33,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1011/ 1625], loss: 1.242, per_step_time: 1473ms, lr: 1.4885022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:33,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.42872 samples/s/p 2:54:43 } +2024-07-25 22:16:36,343 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1013/ 1625], loss: 1.160, per_step_time: 1473ms, lr: 1.4878799e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:36,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43002 samples/s/p 2:54:38 } +2024-07-25 22:16:39,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1015/ 1625], loss: 1.013, per_step_time: 1472ms, lr: 1.4872577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:39,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43250 samples/s/p 2:54:30 } +2024-07-25 22:16:42,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1017/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 1.4866351e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:42,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43509 samples/s/p 2:54:22 } +2024-07-25 22:16:45,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1019/ 1625], loss: 1.061, per_step_time: 1470ms, lr: 1.4860129e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:45,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.44007 samples/s/p 2:54:09 } +2024-07-25 22:16:48,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1021/ 1625], loss: 0.952, per_step_time: 1471ms, lr: 1.4853906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:48,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43649 samples/s/p 2:54:13 } +2024-07-25 22:16:51,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1023/ 
1625], loss: 1.159, per_step_time: 1472ms, lr: 1.4847682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:51,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43144 samples/s/p 2:54:20 } +2024-07-25 22:16:54,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1025/ 1625], loss: 1.158, per_step_time: 1470ms, lr: 1.4841458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:54,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.44079 samples/s/p 2:53:59 } +2024-07-25 22:16:56,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1027/ 1625], loss: 1.285, per_step_time: 1473ms, lr: 1.4835237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:56,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43089 samples/s/p 2:54:15 } +2024-07-25 22:16:59,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1029/ 1625], loss: 1.255, per_step_time: 1473ms, lr: 1.4829013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:59,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.42942 samples/s/p 2:54:15 } +2024-07-25 22:17:02,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1031/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.4822789e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:02,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43589 samples/s/p 2:54:00 } +2024-07-25 22:17:05,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1033/ 1625], loss: 1.072, per_step_time: 1470ms, lr: 1.4816568e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:17:05,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43883 samples/s/p 2:53:51 } +2024-07-25 22:17:08,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1035/ 1625], loss: 1.042, per_step_time: 1470ms, lr: 1.4810344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:08,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.44162 samples/s/p 2:53:43 } +2024-07-25 22:17:11,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1037/ 1625], loss: 0.982, per_step_time: 1470ms, lr: 1.4804124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:11,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43930 samples/s/p 2:53:44 } +2024-07-25 22:17:14,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1039/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 1.4797901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:14,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43523 samples/s/p 2:53:49 } +2024-07-25 22:17:17,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1041/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 1.4791677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:17,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.42906 samples/s/p 2:53:58 } +2024-07-25 22:17:20,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1043/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 1.4785456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:20,604 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43471 samples/s/p 2:53:44 } +2024-07-25 22:17:23,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1045/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 1.4779234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:23,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43843 samples/s/p 2:53:34 } +2024-07-25 22:17:26,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1047/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.4773011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:26,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43227 samples/s/p 2:53:43 } +2024-07-25 22:17:29,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1049/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 1.4766791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:29,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.44044 samples/s/p 2:53:25 } +2024-07-25 22:17:32,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1051/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 1.4760571e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:32,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.44062 samples/s/p 2:53:21 } +2024-07-25 22:17:35,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1053/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 1.4754348e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:35,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% 
|████████████████████████████ | 5.43141 samples/s/p 2:53:36 } +2024-07-25 22:17:38,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1055/ 1625], loss: 1.296, per_step_time: 1469ms, lr: 1.4748127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:38,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.44307 samples/s/p 2:53:11 } +2024-07-25 22:17:41,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1057/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.4741907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:41,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.43516 samples/s/p 2:53:23 } +2024-07-25 22:17:44,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1059/ 1625], loss: 1.049, per_step_time: 1472ms, lr: 1.4735684e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:44,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.43299 samples/s/p 2:53:24 } +2024-07-25 22:17:47,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1061/ 1625], loss: 1.281, per_step_time: 1473ms, lr: 1.4729463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:47,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.42841 samples/s/p 2:53:30 } +2024-07-25 22:17:50,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1063/ 1625], loss: 1.011, per_step_time: 1472ms, lr: 1.4723245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:50,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.43326 samples/s/p 2:53:18 } +2024-07-25 22:17:53,058 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1065/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 1.4717026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:53,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.43883 samples/s/p 2:53:04 } +2024-07-25 22:17:56,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1067/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 1.4710804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:56,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.43081 samples/s/p 2:53:16 } +2024-07-25 22:17:58,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1069/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 1.4704584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:58,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.44030 samples/s/p 2:52:55 } +2024-07-25 22:18:01,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1071/ 1625], loss: 1.319, per_step_time: 1473ms, lr: 1.4698364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:01,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.42786 samples/s/p 2:53:16 } +2024-07-25 22:18:04,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1073/ 1625], loss: 1.048, per_step_time: 1474ms, lr: 1.4692143e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:04,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.42626 samples/s/p 2:53:16 } +2024-07-25 22:18:07,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1075/ 
1625], loss: 1.139, per_step_time: 1472ms, lr: 1.4685923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:07,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.43322 samples/s/p 2:53:00 } +2024-07-25 22:18:10,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1077/ 1625], loss: 1.056, per_step_time: 1471ms, lr: 1.4679705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:10,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.43603 samples/s/p 2:52:52 } +2024-07-25 22:18:13,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1079/ 1625], loss: 1.306, per_step_time: 1473ms, lr: 1.4673484e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:13,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.42907 samples/s/p 2:53:02 } +2024-07-25 22:18:16,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1081/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 1.4667266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:16,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.42872 samples/s/p 2:53:00 } +2024-07-25 22:18:19,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1083/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 1.4661047e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:19,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43524 samples/s/p 2:52:44 } +2024-07-25 22:18:22,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1085/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 1.46548255e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:18:22,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43103 samples/s/p 2:52:50 } +2024-07-25 22:18:25,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1087/ 1625], loss: 1.125, per_step_time: 1473ms, lr: 1.4648608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:25,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43089 samples/s/p 2:52:47 } +2024-07-25 22:18:28,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1089/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 1.464239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:28,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43788 samples/s/p 2:52:31 } +2024-07-25 22:18:31,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1091/ 1625], loss: 1.007, per_step_time: 1472ms, lr: 1.4636169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:31,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43265 samples/s/p 2:52:38 } +2024-07-25 22:18:34,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1093/ 1625], loss: 1.229, per_step_time: 1474ms, lr: 1.4629953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:34,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.42665 samples/s/p 2:52:46 } +2024-07-25 22:18:37,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1095/ 1625], loss: 1.141, per_step_time: 1470ms, lr: 1.4623735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:37,344 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43907 samples/s/p 2:52:20 } +2024-07-25 22:18:40,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1097/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.4617516e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:40,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43469 samples/s/p 2:52:25 } +2024-07-25 22:18:43,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1099/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 1.4611298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:43,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43925 samples/s/p 2:52:13 } +2024-07-25 22:18:46,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1101/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 1.46050825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:46,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43893 samples/s/p 2:52:11 } +2024-07-25 22:18:49,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1103/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 1.4598862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:49,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43248 samples/s/p 2:52:20 } +2024-07-25 22:18:52,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1105/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.4592645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:52,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% 
|████████████████████████████ | 5.43296 samples/s/p 2:52:16 } +2024-07-25 22:18:55,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1107/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 1.458643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:55,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43737 samples/s/p 2:52:05 } +2024-07-25 22:18:57,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1109/ 1625], loss: 0.965, per_step_time: 1471ms, lr: 1.45802105e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:57,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43525 samples/s/p 2:52:06 } +2024-07-25 22:19:00,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1111/ 1625], loss: 1.025, per_step_time: 1470ms, lr: 1.4573995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:00,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.44039 samples/s/p 2:51:53 } +2024-07-25 22:19:03,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1113/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.4567779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:03,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43605 samples/s/p 2:51:59 } +2024-07-25 22:19:06,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1115/ 1625], loss: 0.994, per_step_time: 1469ms, lr: 1.456156e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:06,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.44278 samples/s/p 2:51:43 } +2024-07-25 22:19:09,790 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1117/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.4555345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:09,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43769 samples/s/p 2:51:50 } +2024-07-25 22:19:12,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1119/ 1625], loss: 1.343, per_step_time: 1471ms, lr: 1.45491285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:12,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43719 samples/s/p 2:51:48 } +2024-07-25 22:19:15,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1121/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 1.4542915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:15,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43614 samples/s/p 2:51:47 } +2024-07-25 22:19:18,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1123/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 1.4536697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:18,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43148 samples/s/p 2:51:53 } +2024-07-25 22:19:21,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1125/ 1625], loss: 1.374, per_step_time: 1473ms, lr: 1.4530483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:21,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43062 samples/s/p 2:51:51 } +2024-07-25 22:19:24,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1127/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 1.45242675e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:24,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43375 samples/s/p 2:51:43 } +2024-07-25 22:19:27,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1129/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.451805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:27,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43433 samples/s/p 2:51:38 } +2024-07-25 22:19:30,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1131/ 1625], loss: 1.150, per_step_time: 1470ms, lr: 1.45118365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:30,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43957 samples/s/p 2:51:26 } +2024-07-25 22:19:33,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1133/ 1625], loss: 1.132, per_step_time: 1473ms, lr: 1.4505621e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:33,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.42839 samples/s/p 2:51:44 } +2024-07-25 22:19:36,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1135/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.4499405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:36,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43358 samples/s/p 2:51:31 } +2024-07-25 22:19:39,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1137/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 1.4493192e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:19:39,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43489 samples/s/p 2:51:26 } +2024-07-25 22:19:42,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1139/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 1.4486979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:42,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43496 samples/s/p 2:51:23 } +2024-07-25 22:19:45,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1141/ 1625], loss: 1.429, per_step_time: 1471ms, lr: 1.4480763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:45,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43501 samples/s/p 2:51:20 } +2024-07-25 22:19:48,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1143/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.4474548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:48,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43639 samples/s/p 2:51:14 } +2024-07-25 22:19:51,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1145/ 1625], loss: 0.981, per_step_time: 1470ms, lr: 1.4468337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:51,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.44097 samples/s/p 2:51:02 } +2024-07-25 22:19:54,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1147/ 1625], loss: 1.031, per_step_time: 1472ms, lr: 1.4462121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:54,058 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43302 samples/s/p 2:51:14 } +2024-07-25 22:19:57,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1149/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 1.4455908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:57,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43509 samples/s/p 2:51:08 } +2024-07-25 22:19:59,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1151/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 1.4449695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:59,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43464 samples/s/p 2:51:05 } +2024-07-25 22:20:02,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1153/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 1.4443482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:02,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43582 samples/s/p 2:51:00 } +2024-07-25 22:20:05,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1155/ 1625], loss: 1.054, per_step_time: 1474ms, lr: 1.443727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:05,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.42739 samples/s/p 2:51:13 } +2024-07-25 22:20:08,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1157/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 1.4431057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:08,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% 
|████████████████████████████ | 5.43751 samples/s/p 2:50:51 } +2024-07-25 22:20:11,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1159/ 1625], loss: 1.060, per_step_time: 1472ms, lr: 1.4424842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:11,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43354 samples/s/p 2:50:56 } +2024-07-25 22:20:14,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1161/ 1625], loss: 1.329, per_step_time: 1471ms, lr: 1.4418632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:14,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43723 samples/s/p 2:50:46 } +2024-07-25 22:20:17,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1163/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 1.441242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:17,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43691 samples/s/p 2:50:44 } +2024-07-25 22:20:20,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1165/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 1.4406206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:20,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43222 samples/s/p 2:50:49 } +2024-07-25 22:20:23,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1167/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 1.4399996e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:23,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43540 samples/s/p 2:50:41 } +2024-07-25 22:20:26,522 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1169/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 1.4393786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:26,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43442 samples/s/p 2:50:39 } +2024-07-25 22:20:29,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1171/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 1.4387574e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:29,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43856 samples/s/p 2:50:29 } +2024-07-25 22:20:32,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1173/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.4381362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:32,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43240 samples/s/p 2:50:37 } +2024-07-25 22:20:35,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1175/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 1.4375152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:35,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43206 samples/s/p 2:50:35 } +2024-07-25 22:20:38,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1177/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.4368942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:38,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43671 samples/s/p 2:50:23 } +2024-07-25 22:20:41,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1179/ 
1625], loss: 1.121, per_step_time: 1472ms, lr: 1.4362731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:41,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43312 samples/s/p 2:50:27 } +2024-07-25 22:20:44,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1181/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 1.435652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:44,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43634 samples/s/p 2:50:18 } +2024-07-25 22:20:47,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1183/ 1625], loss: 1.148, per_step_time: 1474ms, lr: 1.4350312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:47,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.42589 samples/s/p 2:50:35 } +2024-07-25 22:20:50,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1185/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 1.4344101e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:50,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43406 samples/s/p 2:50:17 } +2024-07-25 22:20:53,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1187/ 1625], loss: 1.237, per_step_time: 1475ms, lr: 1.4337891e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:53,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.42236 samples/s/p 2:50:36 } +2024-07-25 22:20:56,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1189/ 1625], loss: 1.042, per_step_time: 1471ms, lr: 1.4331683e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 22:20:56,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43772 samples/s/p 2:50:04 } +2024-07-25 22:20:58,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1191/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 1.4325473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:58,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43312 samples/s/p 2:50:09 } +2024-07-25 22:21:01,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1193/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.4319266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:01,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43619 samples/s/p 2:50:01 } +2024-07-25 22:21:04,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1195/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 1.4313056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:04,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43865 samples/s/p 2:49:53 } +2024-07-25 22:21:07,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1197/ 1625], loss: 1.136, per_step_time: 1474ms, lr: 1.43068455e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:07,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.42482 samples/s/p 2:50:16 } +2024-07-25 22:21:10,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1199/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.4300639e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:10,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 57.4% |████████████████████████████ | 5.43592 samples/s/p 2:49:52 } +2024-07-25 22:21:13,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1201/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 1.4294431e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:13,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43283 samples/s/p 2:49:55 } +2024-07-25 22:21:16,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1203/ 1625], loss: 0.930, per_step_time: 1471ms, lr: 1.4288221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:16,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43528 samples/s/p 2:49:48 } +2024-07-25 22:21:19,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1205/ 1625], loss: 1.274, per_step_time: 1471ms, lr: 1.4282015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:19,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43753 samples/s/p 2:49:41 } +2024-07-25 22:21:22,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1207/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 1.4275809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:22,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43342 samples/s/p 2:49:45 } +2024-07-25 22:21:25,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1209/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 1.42696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:25,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43224 samples/s/p 2:49:45 } +2024-07-25 22:21:28,507 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1211/ 1625], loss: 1.000, per_step_time: 1470ms, lr: 1.42633935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:28,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43932 samples/s/p 2:49:28 } +2024-07-25 22:21:31,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1213/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 1.4257189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:31,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43924 samples/s/p 2:49:26 } +2024-07-25 22:21:34,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1215/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 1.425098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:34,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43219 samples/s/p 2:49:36 } +2024-07-25 22:21:37,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1217/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 1.4244773e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:37,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43887 samples/s/p 2:49:20 } +2024-07-25 22:21:40,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1219/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.423857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:40,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43594 samples/s/p 2:49:23 } +2024-07-25 22:21:43,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1221/ 
1625], loss: 0.899, per_step_time: 1470ms, lr: 1.4232365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:43,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43887 samples/s/p 2:49:15 } +2024-07-25 22:21:46,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1223/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 1.4226158e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:46,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43239 samples/s/p 2:49:24 } +2024-07-25 22:21:49,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1225/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.4219952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:49,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43546 samples/s/p 2:49:15 } +2024-07-25 22:21:52,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1227/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.4213749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:52,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43234 samples/s/p 2:49:18 } +2024-07-25 22:21:55,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1229/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 1.4207542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:55,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.42859 samples/s/p 2:49:22 } +2024-07-25 22:21:58,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1231/ 1625], loss: 1.247, per_step_time: 1470ms, lr: 1.4201337e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:21:58,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43948 samples/s/p 2:48:59 } +2024-07-25 22:22:00,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1233/ 1625], loss: 0.931, per_step_time: 1470ms, lr: 1.4195134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:00,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.44051 samples/s/p 2:48:54 } +2024-07-25 22:22:03,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1235/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 1.4188929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:03,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43367 samples/s/p 2:49:04 } +2024-07-25 22:22:06,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1237/ 1625], loss: 1.022, per_step_time: 1471ms, lr: 1.4182727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:06,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43787 samples/s/p 2:48:53 } +2024-07-25 22:22:09,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1239/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 1.4176523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:09,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.44065 samples/s/p 2:48:45 } +2024-07-25 22:22:12,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1241/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 1.4170318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:12,764 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43759 samples/s/p 2:48:48 } +2024-07-25 22:22:15,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1243/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 1.4164116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:15,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43287 samples/s/p 2:48:53 } +2024-07-25 22:22:18,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1245/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.4157913e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:18,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43487 samples/s/p 2:48:47 } +2024-07-25 22:22:21,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1247/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 1.41517085e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:21,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43131 samples/s/p 2:48:50 } +2024-07-25 22:22:24,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1249/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 1.41455075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:24,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43770 samples/s/p 2:48:36 } +2024-07-25 22:22:27,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1251/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 1.4139307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:27,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% 
|████████████████████████████ | 5.43523 samples/s/p 2:48:37 } +2024-07-25 22:22:30,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1253/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 1.4133103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:30,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43056 samples/s/p 2:48:43 } +2024-07-25 22:22:33,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1255/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 1.4126901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:33,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43581 samples/s/p 2:48:30 } +2024-07-25 22:22:36,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1257/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 1.4120702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:36,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43234 samples/s/p 2:48:34 } +2024-07-25 22:22:39,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1259/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.4114499e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:39,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43400 samples/s/p 2:48:28 } +2024-07-25 22:22:42,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1261/ 1625], loss: 1.102, per_step_time: 1474ms, lr: 1.4108297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:42,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.42609 samples/s/p 2:48:39 } +2024-07-25 22:22:45,235 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1263/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.4102098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:45,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43348 samples/s/p 2:48:23 } +2024-07-25 22:22:48,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1265/ 1625], loss: 1.264, per_step_time: 1471ms, lr: 1.4095896e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:48,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43498 samples/s/p 2:48:17 } +2024-07-25 22:22:51,140 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1267/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 1.4089698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:51,140 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.42914 samples/s/p 2:48:25 } +2024-07-25 22:22:54,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1269/ 1625], loss: 1.280, per_step_time: 1470ms, lr: 1.4083497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:54,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.44177 samples/s/p 2:47:59 } +2024-07-25 22:22:57,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1271/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 1.40773e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:57,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43463 samples/s/p 2:48:09 } +2024-07-25 22:22:59,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1273/ 
1625], loss: 1.070, per_step_time: 1471ms, lr: 1.4071099e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:59,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43790 samples/s/p 2:48:00 } +2024-07-25 22:23:02,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1275/ 1625], loss: 1.249, per_step_time: 1470ms, lr: 1.40649e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:02,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43876 samples/s/p 2:47:55 } +2024-07-25 22:23:05,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1277/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 1.4058703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:05,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.43396 samples/s/p 2:48:01 } +2024-07-25 22:23:08,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1279/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 1.4052503e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:08,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.43950 samples/s/p 2:47:48 } +2024-07-25 22:23:11,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1281/ 1625], loss: 1.175, per_step_time: 1470ms, lr: 1.4046305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:11,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.43884 samples/s/p 2:47:46 } +2024-07-25 22:23:14,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1283/ 1625], loss: 1.002, per_step_time: 1469ms, lr: 1.4040107e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 22:23:14,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.44275 samples/s/p 2:47:36 } +2024-07-25 22:23:17,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1285/ 1625], loss: 1.079, per_step_time: 1470ms, lr: 1.4033908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:17,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.44211 samples/s/p 2:47:34 } +2024-07-25 22:23:20,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1287/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 1.4027712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:20,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.43591 samples/s/p 2:47:43 } +2024-07-25 22:23:23,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1289/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 1.4021515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:23,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.43248 samples/s/p 2:47:46 } +2024-07-25 22:23:26,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1291/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 1.4015315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:26,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.44210 samples/s/p 2:47:26 } +2024-07-25 22:23:29,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1293/ 1625], loss: 1.012, per_step_time: 1473ms, lr: 1.4009121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:29,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
58.0% |████████████████████████████ | 5.42947 samples/s/p 2:47:46 } +2024-07-25 22:23:32,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1295/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 1.4002926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:32,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.43658 samples/s/p 2:47:30 } +2024-07-25 22:23:35,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1297/ 1625], loss: 1.238, per_step_time: 1470ms, lr: 1.3996728e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:35,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.43997 samples/s/p 2:47:21 } +2024-07-25 22:23:38,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1299/ 1625], loss: 1.187, per_step_time: 1474ms, lr: 1.3990531e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:38,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.42426 samples/s/p 2:47:47 } +2024-07-25 22:23:41,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1301/ 1625], loss: 1.221, per_step_time: 1470ms, lr: 1.3984339e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:41,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.43939 samples/s/p 2:47:16 } +2024-07-25 22:23:44,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1303/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 1.39781405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:44,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.43965 samples/s/p 2:47:12 } +2024-07-25 
22:23:47,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1305/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.3971946e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:47,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.43298 samples/s/p 2:47:22 } +2024-07-25 22:23:50,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1307/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 1.3965752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:50,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.43697 samples/s/p 2:47:12 } +2024-07-25 22:23:53,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1309/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 1.3959557e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:53,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43374 samples/s/p 2:47:15 } +2024-07-25 22:23:56,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1311/ 1625], loss: 1.327, per_step_time: 1474ms, lr: 1.3953364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:56,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.42630 samples/s/p 2:47:25 } +2024-07-25 22:23:58,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1313/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 1.39471695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:58,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43729 samples/s/p 2:47:02 } +2024-07-25 22:24:01,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
6/ 10], step:[ 1315/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 1.3940975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:01,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43966 samples/s/p 2:46:55 } +2024-07-25 22:24:04,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1317/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 1.3934783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:04,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43815 samples/s/p 2:46:55 } +2024-07-25 22:24:07,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1319/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 1.3928589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:07,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43746 samples/s/p 2:46:53 } +2024-07-25 22:24:10,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1321/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 1.3922399e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:10,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43524 samples/s/p 2:46:54 } +2024-07-25 22:24:13,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1323/ 1625], loss: 1.333, per_step_time: 1472ms, lr: 1.3916205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:13,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43268 samples/s/p 2:46:56 } +2024-07-25 22:24:16,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1325/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 1.3910014e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:16,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43424 samples/s/p 2:46:50 } +2024-07-25 22:24:19,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1327/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.3903823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:19,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43324 samples/s/p 2:46:49 } +2024-07-25 22:24:22,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1329/ 1625], loss: 1.335, per_step_time: 1470ms, lr: 1.3897629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:22,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.44183 samples/s/p 2:46:30 } +2024-07-25 22:24:25,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1331/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 1.3891439e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:25,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43621 samples/s/p 2:46:38 } +2024-07-25 22:24:28,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1333/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 1.3885248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:28,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43481 samples/s/p 2:46:37 } +2024-07-25 22:24:31,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1335/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 1.38790565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:31,447 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43860 samples/s/p 2:46:27 } +2024-07-25 22:24:34,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1337/ 1625], loss: 1.012, per_step_time: 1472ms, lr: 1.3872867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:34,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43227 samples/s/p 2:46:36 } +2024-07-25 22:24:37,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1339/ 1625], loss: 1.116, per_step_time: 1470ms, lr: 1.3866679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:37,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43875 samples/s/p 2:46:21 } +2024-07-25 22:24:40,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1341/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 1.3860487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:40,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43226 samples/s/p 2:46:30 } +2024-07-25 22:24:43,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1343/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.3854297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:43,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43615 samples/s/p 2:46:20 } +2024-07-25 22:24:46,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1345/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 1.384811e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:46,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% 
|█████████████████████████████ | 5.43602 samples/s/p 2:46:17 } +2024-07-25 22:24:49,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1347/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 1.3841919e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:49,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43595 samples/s/p 2:46:15 } +2024-07-25 22:24:52,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1349/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 1.3835732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:52,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43123 samples/s/p 2:46:20 } +2024-07-25 22:24:55,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1351/ 1625], loss: 1.178, per_step_time: 1469ms, lr: 1.3829544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:55,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.44246 samples/s/p 2:45:57 } +2024-07-25 22:24:58,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1353/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 1.38233545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:58,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.42807 samples/s/p 2:46:20 } +2024-07-25 22:25:00,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1355/ 1625], loss: 0.868, per_step_time: 1471ms, lr: 1.3817168e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:00,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43670 samples/s/p 2:46:01 } +2024-07-25 22:25:03,907 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1357/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.3810981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:03,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43369 samples/s/p 2:46:04 } +2024-07-25 22:25:06,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1359/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 1.3804793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:06,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43756 samples/s/p 2:45:54 } +2024-07-25 22:25:09,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1361/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 1.3798607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:09,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43383 samples/s/p 2:45:58 } +2024-07-25 22:25:12,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1363/ 1625], loss: 1.025, per_step_time: 1470ms, lr: 1.3792423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:12,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43855 samples/s/p 2:45:46 } +2024-07-25 22:25:15,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1365/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 1.3786234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:15,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43674 samples/s/p 2:45:47 } +2024-07-25 22:25:18,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], 
step:[ 1367/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 1.3780049e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:18,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43627 samples/s/p 2:45:45 } +2024-07-25 22:25:21,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1369/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 1.3773865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:21,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43350 samples/s/p 2:45:47 } +2024-07-25 22:25:24,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1371/ 1625], loss: 1.344, per_step_time: 1472ms, lr: 1.376768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:24,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43269 samples/s/p 2:45:45 } +2024-07-25 22:25:27,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1373/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.3761493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:27,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43281 samples/s/p 2:45:42 } +2024-07-25 22:25:30,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1375/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 1.3755311e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:30,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43015 samples/s/p 2:45:44 } +2024-07-25 22:25:33,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1377/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 1.3749128e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:25:33,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43055 samples/s/p 2:45:40 } +2024-07-25 22:25:36,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1379/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 1.3742942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:36,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43015 samples/s/p 2:45:38 } +2024-07-25 22:25:39,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1381/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 1.3736759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:39,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43563 samples/s/p 2:45:25 } +2024-07-25 22:25:42,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1383/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 1.3730578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:42,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43511 samples/s/p 2:45:23 } +2024-07-25 22:25:45,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1385/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 1.3724393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:45,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43505 samples/s/p 2:45:20 } +2024-07-25 22:25:48,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1387/ 1625], loss: 1.092, per_step_time: 1470ms, lr: 1.371821e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:48,175 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43944 samples/s/p 2:45:09 } +2024-07-25 22:25:51,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1389/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.371203e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:51,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43789 samples/s/p 2:45:09 } +2024-07-25 22:25:54,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1391/ 1625], loss: 1.341, per_step_time: 1472ms, lr: 1.3705846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:54,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43472 samples/s/p 2:45:12 } +2024-07-25 22:25:57,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1393/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 1.3699666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:57,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.42982 samples/s/p 2:45:18 } +2024-07-25 22:25:59,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1395/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.3693485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:59,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43246 samples/s/p 2:45:10 } +2024-07-25 22:26:02,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1397/ 1625], loss: 1.101, per_step_time: 1472ms, lr: 1.3687302e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:02,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% 
|█████████████████████████████ | 5.43430 samples/s/p 2:45:04 } +2024-07-25 22:26:05,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1399/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 1.3681123e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:05,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43489 samples/s/p 2:45:00 } +2024-07-25 22:26:08,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1401/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 1.3674943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:08,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43355 samples/s/p 2:44:59 } +2024-07-25 22:26:11,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1403/ 1625], loss: 1.364, per_step_time: 1473ms, lr: 1.366876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:11,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43027 samples/s/p 2:45:03 } +2024-07-25 22:26:14,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1405/ 1625], loss: 0.935, per_step_time: 1470ms, lr: 1.3662583e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:14,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43883 samples/s/p 2:44:44 } +2024-07-25 22:26:17,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1407/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 1.3656406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:17,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43558 samples/s/p 2:44:47 } +2024-07-25 22:26:20,639 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1409/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 1.3650226e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:20,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43463 samples/s/p 2:44:46 } +2024-07-25 22:26:23,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1411/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 1.3644046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:23,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43961 samples/s/p 2:44:34 } +2024-07-25 22:26:26,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1413/ 1625], loss: 1.189, per_step_time: 1474ms, lr: 1.363787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:26,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.42706 samples/s/p 2:44:54 } +2024-07-25 22:26:29,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1415/ 1625], loss: 1.102, per_step_time: 1475ms, lr: 1.363169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:29,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.42288 samples/s/p 2:44:58 } +2024-07-25 22:26:32,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1417/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.3625513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:32,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43706 samples/s/p 2:44:30 } +2024-07-25 22:26:35,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1419/ 1625], loss: 1.315, per_step_time: 1471ms, lr: 1.3619338e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:35,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43591 samples/s/p 2:44:29 } +2024-07-25 22:26:38,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1421/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 1.3613162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:38,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43670 samples/s/p 2:44:24 } +2024-07-25 22:26:41,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1423/ 1625], loss: 0.930, per_step_time: 1471ms, lr: 1.3606985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:41,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43721 samples/s/p 2:44:20 } +2024-07-25 22:26:44,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1425/ 1625], loss: 1.023, per_step_time: 1471ms, lr: 1.36008075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:44,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43655 samples/s/p 2:44:19 } +2024-07-25 22:26:47,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1427/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 1.3594635e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:47,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.44175 samples/s/p 2:44:06 } +2024-07-25 22:26:50,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1429/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 1.3588457e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:26:50,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43091 samples/s/p 2:44:23 } +2024-07-25 22:26:53,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1431/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 1.3582282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:53,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43141 samples/s/p 2:44:19 } +2024-07-25 22:26:56,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1433/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.3576108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:56,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43532 samples/s/p 2:44:09 } +2024-07-25 22:26:59,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1435/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 1.3569933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:59,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43390 samples/s/p 2:44:09 } +2024-07-25 22:27:01,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1437/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 1.356376e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:01,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43549 samples/s/p 2:44:03 } +2024-07-25 22:27:04,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1439/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.35575865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:04,907 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43568 samples/s/p 2:44:00 } +2024-07-25 22:27:07,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1441/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 1.3551411e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:07,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43197 samples/s/p 2:44:03 } +2024-07-25 22:27:10,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1443/ 1625], loss: 1.201, per_step_time: 1474ms, lr: 1.3545241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:10,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.42520 samples/s/p 2:44:13 } +2024-07-25 22:27:13,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1445/ 1625], loss: 1.307, per_step_time: 1471ms, lr: 1.3539068e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:13,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43704 samples/s/p 2:43:48 } +2024-07-25 22:27:16,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1447/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.3532894e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:16,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43788 samples/s/p 2:43:44 } +2024-07-25 22:27:19,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1449/ 1625], loss: 1.323, per_step_time: 1475ms, lr: 1.3526724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:19,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% 
|█████████████████████████████ | 5.42296 samples/s/p 2:44:08 } +2024-07-25 22:27:22,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1451/ 1625], loss: 1.318, per_step_time: 1471ms, lr: 1.3520554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:22,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43799 samples/s/p 2:43:38 } +2024-07-25 22:27:25,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1453/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.3514381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:25,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43548 samples/s/p 2:43:39 } +2024-07-25 22:27:28,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1455/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.350821e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:28,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43339 samples/s/p 2:43:40 } +2024-07-25 22:27:31,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1457/ 1625], loss: 1.119, per_step_time: 1470ms, lr: 1.3502042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:31,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43879 samples/s/p 2:43:28 } +2024-07-25 22:27:34,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1459/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 1.349587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:34,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.42802 samples/s/p 2:43:44 } +2024-07-25 22:27:37,381 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1461/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 1.34897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:37,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.42894 samples/s/p 2:43:39 } +2024-07-25 22:27:40,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1463/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 1.3483533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:40,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43305 samples/s/p 2:43:29 } +2024-07-25 22:27:43,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1465/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 1.3477362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:43,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43719 samples/s/p 2:43:19 } +2024-07-25 22:27:46,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1467/ 1625], loss: 1.072, per_step_time: 1474ms, lr: 1.3471195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:46,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.42544 samples/s/p 2:43:37 } +2024-07-25 22:27:49,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1469/ 1625], loss: 1.321, per_step_time: 1472ms, lr: 1.3465027e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:49,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43252 samples/s/p 2:43:21 } +2024-07-25 22:27:52,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1471/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 1.3458862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:52,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.43509 samples/s/p 2:43:14 } +2024-07-25 22:27:55,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1473/ 1625], loss: 1.191, per_step_time: 1473ms, lr: 1.3452693e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:55,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.42923 samples/s/p 2:43:21 } +2024-07-25 22:27:58,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1475/ 1625], loss: 1.164, per_step_time: 1473ms, lr: 1.34465245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:58,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.42935 samples/s/p 2:43:18 } +2024-07-25 22:28:01,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1477/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 1.344036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:01,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.42940 samples/s/p 2:43:15 } +2024-07-25 22:28:03,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1479/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 1.3434192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:03,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.43684 samples/s/p 2:42:59 } +2024-07-25 22:28:06,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1481/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 1.3428028e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:28:06,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.43609 samples/s/p 2:42:57 } +2024-07-25 22:28:09,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1483/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 1.3421862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:09,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.43249 samples/s/p 2:43:01 } +2024-07-25 22:28:12,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1485/ 1625], loss: 1.308, per_step_time: 1473ms, lr: 1.3415694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:12,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.42768 samples/s/p 2:43:06 } +2024-07-25 22:28:15,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1487/ 1625], loss: 1.019, per_step_time: 1470ms, lr: 1.3409533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:15,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.44029 samples/s/p 2:42:41 } +2024-07-25 22:28:18,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1489/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.3403368e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:18,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43847 samples/s/p 2:42:41 } +2024-07-25 22:28:21,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1491/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 1.3397202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:21,661 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43184 samples/s/p 2:42:50 } +2024-07-25 22:28:24,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1493/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 1.3391041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:24,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43566 samples/s/p 2:42:40 } +2024-07-25 22:28:27,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1495/ 1625], loss: 1.274, per_step_time: 1470ms, lr: 1.3384878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:27,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.44170 samples/s/p 2:42:26 } +2024-07-25 22:28:30,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1497/ 1625], loss: 1.022, per_step_time: 1471ms, lr: 1.3378714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:30,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43561 samples/s/p 2:42:34 } +2024-07-25 22:28:33,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1499/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 1.33725525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:33,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.44115 samples/s/p 2:42:22 } +2024-07-25 22:28:36,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1501/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 1.3366392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:36,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% 
|█████████████████████████████ | 5.43786 samples/s/p 2:42:25 } +2024-07-25 22:28:39,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1503/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 1.3360228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:39,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43385 samples/s/p 2:42:29 } +2024-07-25 22:28:42,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1505/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.3354069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:42,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43677 samples/s/p 2:42:21 } +2024-07-25 22:28:45,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1507/ 1625], loss: 1.030, per_step_time: 1469ms, lr: 1.3347908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:45,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.44421 samples/s/p 2:42:04 } +2024-07-25 22:28:48,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1509/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 1.3341745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:48,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43482 samples/s/p 2:42:18 } +2024-07-25 22:28:51,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1511/ 1625], loss: 1.040, per_step_time: 1472ms, lr: 1.3335588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:51,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43124 samples/s/p 2:42:22 } +2024-07-25 22:28:54,111 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1513/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.3329428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:54,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43177 samples/s/p 2:42:18 } +2024-07-25 22:28:57,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1515/ 1625], loss: 1.112, per_step_time: 1470ms, lr: 1.3323266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:57,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.44019 samples/s/p 2:42:00 } +2024-07-25 22:29:00,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1517/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.331711e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:00,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43686 samples/s/p 2:42:03 } +2024-07-25 22:29:02,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1519/ 1625], loss: 0.962, per_step_time: 1470ms, lr: 1.3310952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:02,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43870 samples/s/p 2:41:57 } +2024-07-25 22:29:05,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1521/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 1.3304794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:05,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43449 samples/s/p 2:42:01 } +2024-07-25 22:29:08,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1523/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 1.3298636e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:08,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.44072 samples/s/p 2:41:47 } +2024-07-25 22:29:11,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1525/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.329248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:11,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43199 samples/s/p 2:42:00 } +2024-07-25 22:29:14,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1527/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.3286323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:14,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43241 samples/s/p 2:41:56 } +2024-07-25 22:29:17,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1529/ 1625], loss: 1.232, per_step_time: 1470ms, lr: 1.3280165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:17,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43974 samples/s/p 2:41:40 } +2024-07-25 22:29:20,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1531/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 1.3274011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:20,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43117 samples/s/p 2:41:52 } +2024-07-25 22:29:23,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1533/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 1.3267857e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:29:23,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43410 samples/s/p 2:41:44 } +2024-07-25 22:29:26,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1535/ 1625], loss: 1.312, per_step_time: 1473ms, lr: 1.32617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:26,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43015 samples/s/p 2:41:48 } +2024-07-25 22:29:29,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1537/ 1625], loss: 1.220, per_step_time: 1473ms, lr: 1.3255545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:29,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.42941 samples/s/p 2:41:47 } +2024-07-25 22:29:32,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1539/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.3249392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:32,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43355 samples/s/p 2:41:36 } +2024-07-25 22:29:35,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1541/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 1.3243237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:35,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43679 samples/s/p 2:41:28 } +2024-07-25 22:29:38,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1543/ 1625], loss: 1.092, per_step_time: 1470ms, lr: 1.3237083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:38,372 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.44021 samples/s/p 2:41:19 } +2024-07-25 22:29:41,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1545/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.32309315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:41,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43391 samples/s/p 2:41:27 } +2024-07-25 22:29:44,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1547/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 1.3224778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:44,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43206 samples/s/p 2:41:27 } +2024-07-25 22:29:47,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1549/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.3218627e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:47,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43235 samples/s/p 2:41:24 } +2024-07-25 22:29:50,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1551/ 1625], loss: 1.002, per_step_time: 1472ms, lr: 1.3212475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:50,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43429 samples/s/p 2:41:17 } +2024-07-25 22:29:53,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1553/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 1.3206322e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:53,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% 
|█████████████████████████████ | 5.43665 samples/s/p 2:41:10 } +2024-07-25 22:29:56,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1555/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 1.3200172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:56,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.43577 samples/s/p 2:41:09 } +2024-07-25 22:29:59,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1557/ 1625], loss: 1.169, per_step_time: 1473ms, lr: 1.3194022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:59,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.43003 samples/s/p 2:41:16 } +2024-07-25 22:30:01,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1559/ 1625], loss: 1.376, per_step_time: 1474ms, lr: 1.31878705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:01,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.42561 samples/s/p 2:41:21 } +2024-07-25 22:30:04,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1561/ 1625], loss: 1.270, per_step_time: 1473ms, lr: 1.3181722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:04,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.42850 samples/s/p 2:41:13 } +2024-07-25 22:30:07,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1563/ 1625], loss: 1.315, per_step_time: 1471ms, lr: 1.3175575e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:07,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.43828 samples/s/p 2:40:53 } +2024-07-25 22:30:10,848 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1565/ 1625], loss: 1.237, per_step_time: 1474ms, lr: 1.3169424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:10,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.42728 samples/s/p 2:41:09 } +2024-07-25 22:30:13,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1567/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 1.3163276e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:13,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.43091 samples/s/p 2:41:00 } +2024-07-25 22:30:16,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1569/ 1625], loss: 0.974, per_step_time: 1472ms, lr: 1.315713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:16,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43382 samples/s/p 2:40:52 } +2024-07-25 22:30:19,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1571/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 1.3150981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:19,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43830 samples/s/p 2:40:41 } +2024-07-25 22:30:22,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1573/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 1.3144833e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:22,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43527 samples/s/p 2:40:43 } +2024-07-25 22:30:25,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1575/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.3138689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:25,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43640 samples/s/p 2:40:38 } +2024-07-25 22:30:28,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1577/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.3132543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:28,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43503 samples/s/p 2:40:38 } +2024-07-25 22:30:31,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1579/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.3126396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:31,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43553 samples/s/p 2:40:34 } +2024-07-25 22:30:34,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1581/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.31202505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:34,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43150 samples/s/p 2:40:38 } +2024-07-25 22:30:37,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1583/ 1625], loss: 1.098, per_step_time: 1473ms, lr: 1.3114108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:37,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.42933 samples/s/p 2:40:39 } +2024-07-25 22:30:40,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1585/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 1.3107961e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:30:40,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43553 samples/s/p 2:40:25 } +2024-07-25 22:30:43,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1587/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 1.3101817e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:43,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43449 samples/s/p 2:40:24 } +2024-07-25 22:30:46,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1589/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 1.3095676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:46,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43844 samples/s/p 2:40:14 } +2024-07-25 22:30:49,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1591/ 1625], loss: 1.035, per_step_time: 1471ms, lr: 1.30895305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:49,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43483 samples/s/p 2:40:17 } +2024-07-25 22:30:52,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1593/ 1625], loss: 1.059, per_step_time: 1475ms, lr: 1.3083389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:52,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.42256 samples/s/p 2:40:36 } +2024-07-25 22:30:55,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1595/ 1625], loss: 1.291, per_step_time: 1472ms, lr: 1.3077247e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:55,124 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43346 samples/s/p 2:40:14 } +2024-07-25 22:30:58,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1597/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.3071103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:58,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43543 samples/s/p 2:40:08 } +2024-07-25 22:31:01,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1599/ 1625], loss: 1.297, per_step_time: 1473ms, lr: 1.3064964e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:01,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43081 samples/s/p 2:40:13 } +2024-07-25 22:31:03,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1601/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 1.3058823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:03,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43291 samples/s/p 2:40:06 } +2024-07-25 22:31:06,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1603/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 1.30526805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:06,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.44060 samples/s/p 2:39:50 } +2024-07-25 22:31:09,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1605/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.3046542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:09,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% 
|█████████████████████████████ | 5.43283 samples/s/p 2:40:00 } +2024-07-25 22:31:12,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1607/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 1.3040404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:12,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43384 samples/s/p 2:39:56 } +2024-07-25 22:31:15,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1609/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 1.3034263e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:15,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43369 samples/s/p 2:39:53 } +2024-07-25 22:31:18,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1611/ 1625], loss: 1.346, per_step_time: 1472ms, lr: 1.3028125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:18,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43409 samples/s/p 2:39:49 } +2024-07-25 22:31:21,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1613/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 1.3021988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:21,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43443 samples/s/p 2:39:46 } +2024-07-25 22:31:24,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1615/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 1.301585e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:24,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43561 samples/s/p 2:39:41 } +2024-07-25 22:31:27,584 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1617/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 1.3009712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:27,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.43937 samples/s/p 2:39:31 } +2024-07-25 22:31:30,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1619/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 1.3003577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:30,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.42933 samples/s/p 2:39:46 } +2024-07-25 22:31:33,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1621/ 1625], loss: 1.197, per_step_time: 1473ms, lr: 1.2997442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:33,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.43035 samples/s/p 2:39:41 } +2024-07-25 22:31:36,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1623/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 1.2991304e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:36,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.43779 samples/s/p 2:39:25 } +2024-07-25 22:31:39,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1625/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 1.2985169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:39,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.43086 samples/s/p 2:39:34 } +2024-07-25 22:31:42,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
2/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 1.2979036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:42,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.43692 samples/s/p 2:39:21 } +2024-07-25 22:31:45,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 4/ 1625], loss: 1.063, per_step_time: 1470ms, lr: 1.29729e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:45,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.43923 samples/s/p 2:39:14 } +2024-07-25 22:31:48,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 6/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 1.2966765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:48,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.43565 samples/s/p 2:39:17 } +2024-07-25 22:31:51,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 8/ 1625], loss: 1.054, per_step_time: 1470ms, lr: 1.2960634e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:51,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.44037 samples/s/p 2:39:06 } +2024-07-25 22:31:54,140 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 10/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 1.2954499e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:54,140 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43798 samples/s/p 2:39:07 } +2024-07-25 22:31:57,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 12/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 1.2948367e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 22:31:57,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.44019 samples/s/p 2:39:00 } +2024-07-25 22:32:00,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 14/ 1625], loss: 1.305, per_step_time: 1469ms, lr: 1.2942235e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:00,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.44341 samples/s/p 2:38:52 } +2024-07-25 22:32:02,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 16/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 1.2936102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:02,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43450 samples/s/p 2:39:04 } +2024-07-25 22:32:05,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 18/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 1.2929972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:05,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43859 samples/s/p 2:38:54 } +2024-07-25 22:32:08,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 20/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 1.29238415e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:08,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43513 samples/s/p 2:38:57 } +2024-07-25 22:32:11,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 22/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 1.2917709e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:11,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 60.1% |██████████████████████████████ | 5.43250 samples/s/p 2:38:59 } +2024-07-25 22:32:14,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 24/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 1.29115815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:14,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43357 samples/s/p 2:38:54 } +2024-07-25 22:32:17,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 26/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 1.2905453e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:17,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43360 samples/s/p 2:38:51 } +2024-07-25 22:32:20,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 28/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 1.2899323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:20,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43743 samples/s/p 2:38:42 } +2024-07-25 22:32:23,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 30/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 1.2893195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:23,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43485 samples/s/p 2:38:43 } +2024-07-25 22:32:26,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 32/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 1.2887069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:26,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43611 samples/s/p 2:38:38 } +2024-07-25 
22:32:29,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 34/ 1625], loss: 1.296, per_step_time: 1473ms, lr: 1.288094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:29,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43059 samples/s/p 2:38:45 } +2024-07-25 22:32:32,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 36/ 1625], loss: 0.999, per_step_time: 1472ms, lr: 1.28748125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:32,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43459 samples/s/p 2:38:35 } +2024-07-25 22:32:35,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 38/ 1625], loss: 1.306, per_step_time: 1473ms, lr: 1.2868688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:35,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.42977 samples/s/p 2:38:40 } +2024-07-25 22:32:38,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 40/ 1625], loss: 1.321, per_step_time: 1470ms, lr: 1.286256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:38,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43925 samples/s/p 2:38:21 } +2024-07-25 22:32:41,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 42/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 1.2856436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:41,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43442 samples/s/p 2:38:26 } +2024-07-25 22:32:44,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 
10], step:[ 44/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.2850312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:44,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43507 samples/s/p 2:38:22 } +2024-07-25 22:32:47,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 46/ 1625], loss: 1.196, per_step_time: 1470ms, lr: 1.2844189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:47,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43853 samples/s/p 2:38:13 } +2024-07-25 22:32:50,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 48/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 1.2838063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:50,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43455 samples/s/p 2:38:17 } +2024-07-25 22:32:53,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 50/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 1.2831941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:53,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.42940 samples/s/p 2:38:23 } +2024-07-25 22:32:53,156 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 22:33:28,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 52/ 1625], loss: 1.058, per_step_time: 1769ms, lr: 1.2825818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:28,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 4.52033 samples/s/p 3:10:11 } +2024-07-25 22:33:31,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 54/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.2819694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:31,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43322 samples/s/p 2:38:11 } +2024-07-25 22:33:34,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 56/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 1.2813573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:34,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.42958 samples/s/p 2:38:14 } +2024-07-25 22:33:37,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 58/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 1.2807452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:37,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43214 samples/s/p 2:38:07 } +2024-07-25 22:33:40,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 60/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 1.280133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:40,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43181 samples/s/p 2:38:04 } +2024-07-25 22:33:43,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 62/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 1.2795211e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:43,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43229 samples/s/p 2:38:01 } +2024-07-25 22:33:46,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 64/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 1.2789093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:46,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43829 samples/s/p 2:37:47 } +2024-07-25 22:33:49,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 66/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 1.2782971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:49,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43382 samples/s/p 2:37:52 } +2024-07-25 22:33:52,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 68/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.2776852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:52,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43187 samples/s/p 2:37:52 } +2024-07-25 22:33:55,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 70/ 1625], loss: 1.314, per_step_time: 1471ms, lr: 1.2770735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:55,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43567 samples/s/p 2:37:43 } +2024-07-25 22:33:58,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 72/ 1625], loss: 1.026, per_step_time: 1469ms, lr: 1.2764615e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:58,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.44407 samples/s/p 2:37:25 } +2024-07-25 22:34:01,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 74/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 1.2758497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:01,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43744 samples/s/p 2:37:34 } +2024-07-25 22:34:04,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 76/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 1.2752383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:04,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43675 samples/s/p 2:37:32 } +2024-07-25 22:34:07,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 78/ 1625], loss: 1.090, per_step_time: 1474ms, lr: 1.27462645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:07,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.42731 samples/s/p 2:37:46 } +2024-07-25 22:34:10,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 80/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.274015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:10,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43747 samples/s/p 2:37:25 } +2024-07-25 22:34:13,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 82/ 1625], loss: 1.343, per_step_time: 1470ms, lr: 1.27340345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:13,207 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43906 samples/s/p 2:37:19 } +2024-07-25 22:34:16,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 84/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 1.2727917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:16,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43314 samples/s/p 2:37:27 } +2024-07-25 22:34:19,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 86/ 1625], loss: 1.037, per_step_time: 1472ms, lr: 1.27218045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:19,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43146 samples/s/p 2:37:27 } +2024-07-25 22:34:22,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 88/ 1625], loss: 1.059, per_step_time: 1471ms, lr: 1.2715691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:22,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43497 samples/s/p 2:37:18 } +2024-07-25 22:34:25,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 90/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.27095755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:25,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43314 samples/s/p 2:37:18 } +2024-07-25 22:34:27,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 92/ 1625], loss: 0.967, per_step_time: 1471ms, lr: 1.2703464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:27,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% 
|██████████████████████████████ | 5.43670 samples/s/p 2:37:09 } +2024-07-25 22:34:30,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 94/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 1.2697354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:30,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43738 samples/s/p 2:37:05 } +2024-07-25 22:34:33,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 96/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.2691242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:33,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43355 samples/s/p 2:37:08 } +2024-07-25 22:34:36,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 98/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 1.2685128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:37,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43448 samples/s/p 2:37:04 } +2024-07-25 22:34:40,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 100/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 1.2679019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:40,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43780 samples/s/p 2:36:55 } +2024-07-25 22:34:43,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 102/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 1.2672909e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:43,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43263 samples/s/p 2:37:01 } +2024-07-25 22:34:46,166 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 104/ 1625], loss: 0.993, per_step_time: 1470ms, lr: 1.2666797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:46,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43976 samples/s/p 2:36:46 } +2024-07-25 22:34:49,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 106/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 1.266069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:49,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43463 samples/s/p 2:36:52 } +2024-07-25 22:34:52,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 108/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 1.2654583e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:52,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43344 samples/s/p 2:36:51 } +2024-07-25 22:34:55,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 110/ 1625], loss: 1.074, per_step_time: 1470ms, lr: 1.2648473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:55,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43908 samples/s/p 2:36:38 } +2024-07-25 22:34:57,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 112/ 1625], loss: 1.006, per_step_time: 1472ms, lr: 1.2642366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:57,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43199 samples/s/p 2:36:47 } +2024-07-25 22:35:00,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
114/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 1.263626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:00,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43379 samples/s/p 2:36:41 } +2024-07-25 22:35:03,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 116/ 1625], loss: 1.261, per_step_time: 1470ms, lr: 1.2630152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:03,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43939 samples/s/p 2:36:29 } +2024-07-25 22:35:06,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 118/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 1.2624045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:06,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43391 samples/s/p 2:36:35 } +2024-07-25 22:35:09,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 120/ 1625], loss: 1.198, per_step_time: 1473ms, lr: 1.2617941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:09,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.42823 samples/s/p 2:36:42 } +2024-07-25 22:35:12,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 122/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 1.2611835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:12,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43500 samples/s/p 2:36:28 } +2024-07-25 22:35:15,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 124/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 1.2605732e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:35:15,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43171 samples/s/p 2:36:30 } +2024-07-25 22:35:18,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 126/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 1.2599628e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:18,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43810 samples/s/p 2:36:16 } +2024-07-25 22:35:21,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 128/ 1625], loss: 0.983, per_step_time: 1471ms, lr: 1.2593522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:21,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43514 samples/s/p 2:36:18 } +2024-07-25 22:35:24,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 130/ 1625], loss: 0.971, per_step_time: 1470ms, lr: 1.2587421e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:24,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.44060 samples/s/p 2:36:06 } +2024-07-25 22:35:27,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 132/ 1625], loss: 1.032, per_step_time: 1471ms, lr: 1.25813185e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:27,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43795 samples/s/p 2:36:08 } +2024-07-25 22:35:30,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 134/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 1.2575216e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:30,428 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43609 samples/s/p 2:36:08 } +2024-07-25 22:35:33,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 136/ 1625], loss: 0.975, per_step_time: 1472ms, lr: 1.2569116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:33,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43449 samples/s/p 2:36:08 } +2024-07-25 22:35:36,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 138/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.2563017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:36,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43204 samples/s/p 2:36:09 } +2024-07-25 22:35:39,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 140/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 1.2556915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:39,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43588 samples/s/p 2:36:00 } +2024-07-25 22:35:42,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 142/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 1.2550816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:42,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.44118 samples/s/p 2:35:47 } +2024-07-25 22:35:45,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 144/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 1.2544717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:45,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% 
|██████████████████████████████ | 5.43199 samples/s/p 2:36:00 } +2024-07-25 22:35:48,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 146/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 1.2538619e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:48,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43513 samples/s/p 2:35:52 } +2024-07-25 22:35:51,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 148/ 1625], loss: 1.145, per_step_time: 1470ms, lr: 1.2532519e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:51,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.44003 samples/s/p 2:35:41 } +2024-07-25 22:35:54,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 150/ 1625], loss: 1.064, per_step_time: 1473ms, lr: 1.2526423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:54,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43096 samples/s/p 2:35:53 } +2024-07-25 22:35:56,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 152/ 1625], loss: 1.047, per_step_time: 1471ms, lr: 1.2520328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:56,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43613 samples/s/p 2:35:41 } +2024-07-25 22:35:59,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 154/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 1.2514231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:59,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43419 samples/s/p 2:35:42 } +2024-07-25 22:36:02,887 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 156/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 1.2508134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:02,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43531 samples/s/p 2:35:37 } +2024-07-25 22:36:05,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 158/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 1.2502041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:05,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43360 samples/s/p 2:35:37 } +2024-07-25 22:36:08,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 160/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.2495944e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:08,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43223 samples/s/p 2:35:36 } +2024-07-25 22:36:11,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 162/ 1625], loss: 1.198, per_step_time: 1470ms, lr: 1.248985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:11,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43980 samples/s/p 2:35:20 } +2024-07-25 22:36:14,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 164/ 1625], loss: 1.026, per_step_time: 1473ms, lr: 1.2483758e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:14,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.42819 samples/s/p 2:35:37 } +2024-07-25 22:36:17,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
166/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 1.2477663e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:17,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43301 samples/s/p 2:35:26 } +2024-07-25 22:36:20,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 168/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.24715725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:20,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43213 samples/s/p 2:35:25 } +2024-07-25 22:36:23,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 170/ 1625], loss: 1.299, per_step_time: 1473ms, lr: 1.2465481e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:23,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.42773 samples/s/p 2:35:29 } +2024-07-25 22:36:26,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 172/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 1.2459387e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:26,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43191 samples/s/p 2:35:19 } +2024-07-25 22:36:29,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 174/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 1.2453298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:29,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43466 samples/s/p 2:35:12 } +2024-07-25 22:36:32,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 176/ 1625], loss: 1.009, per_step_time: 1472ms, lr: 1.2447208e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:36:32,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43172 samples/s/p 2:35:14 } +2024-07-25 22:36:35,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 178/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 1.2441116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:35,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.42930 samples/s/p 2:35:15 } +2024-07-25 22:36:38,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 180/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 1.2435029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:38,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43701 samples/s/p 2:34:59 } +2024-07-25 22:36:41,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 182/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.2428942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:41,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43381 samples/s/p 2:35:01 } +2024-07-25 22:36:44,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 184/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 1.2422852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:44,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43608 samples/s/p 2:34:54 } +2024-07-25 22:36:47,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 186/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 1.24167655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:47,166 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43532 samples/s/p 2:34:53 } +2024-07-25 22:36:50,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 188/ 1625], loss: 1.239, per_step_time: 1470ms, lr: 1.241068e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:50,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43903 samples/s/p 2:34:44 } +2024-07-25 22:36:53,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 190/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 1.2404592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:53,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43227 samples/s/p 2:34:52 } +2024-07-25 22:36:56,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 192/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.23985055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:56,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43310 samples/s/p 2:34:48 } +2024-07-25 22:36:58,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 194/ 1625], loss: 1.022, per_step_time: 1470ms, lr: 1.2392423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:58,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43889 samples/s/p 2:34:35 } +2024-07-25 22:37:01,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 196/ 1625], loss: 0.987, per_step_time: 1471ms, lr: 1.2386339e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:01,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% 
|██████████████████████████████ | 5.43625 samples/s/p 2:34:36 } +2024-07-25 22:37:04,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 198/ 1625], loss: 1.417, per_step_time: 1473ms, lr: 1.2380254e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:04,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43097 samples/s/p 2:34:43 } +2024-07-25 22:37:07,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 200/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 1.237417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:07,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43692 samples/s/p 2:34:29 } +2024-07-25 22:37:10,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 202/ 1625], loss: 1.109, per_step_time: 1470ms, lr: 1.2368088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:10,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.44008 samples/s/p 2:34:21 } +2024-07-25 22:37:13,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 204/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 1.2362005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:13,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.43172 samples/s/p 2:34:32 } +2024-07-25 22:37:16,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 206/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 1.2355923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:16,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.43708 samples/s/p 2:34:20 } +2024-07-25 22:37:19,620 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 208/ 1625], loss: 1.164, per_step_time: 1470ms, lr: 1.2349844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:19,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.44002 samples/s/p 2:34:12 } +2024-07-25 22:37:22,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 210/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 1.2343762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:22,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.43377 samples/s/p 2:34:20 } +2024-07-25 22:37:25,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 212/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.2337684e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:25,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.43575 samples/s/p 2:34:14 } +2024-07-25 22:37:28,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 214/ 1625], loss: 1.160, per_step_time: 1474ms, lr: 1.2331604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:28,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.42591 samples/s/p 2:34:28 } +2024-07-25 22:37:31,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 216/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 1.2325523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:31,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.43045 samples/s/p 2:34:17 } +2024-07-25 22:37:34,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
218/ 1625], loss: 1.169, per_step_time: 1474ms, lr: 1.2319448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:34,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.42625 samples/s/p 2:34:21 } +2024-07-25 22:37:37,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 220/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 1.2313371e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:37,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43540 samples/s/p 2:34:03 } +2024-07-25 22:37:40,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 222/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 1.2307292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:40,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.42869 samples/s/p 2:34:11 } +2024-07-25 22:37:43,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 224/ 1625], loss: 0.964, per_step_time: 1483ms, lr: 1.2301216e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:43,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.39234 samples/s/p 2:35:10 } +2024-07-25 22:37:46,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 226/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 1.22951415e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:46,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43581 samples/s/p 2:33:53 } +2024-07-25 22:37:49,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 228/ 1625], loss: 1.149, per_step_time: 1469ms, lr: 1.2289065e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:37:49,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.44220 samples/s/p 2:33:39 } +2024-07-25 22:37:52,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 230/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 1.2282991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:52,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43697 samples/s/p 2:33:45 } +2024-07-25 22:37:55,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 232/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 1.2276918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:55,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43756 samples/s/p 2:33:41 } +2024-07-25 22:37:58,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 234/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 1.2270843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:58,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43250 samples/s/p 2:33:47 } +2024-07-25 22:38:00,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 236/ 1625], loss: 1.137, per_step_time: 1470ms, lr: 1.2264772e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:00,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.44153 samples/s/p 2:33:29 } +2024-07-25 22:38:03,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 238/ 1625], loss: 1.280, per_step_time: 1472ms, lr: 1.2258699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:03,915 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43302 samples/s/p 2:33:40 } +2024-07-25 22:38:06,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 240/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.2252626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:06,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43137 samples/s/p 2:33:40 } +2024-07-25 22:38:09,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 242/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 1.2246556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:09,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43818 samples/s/p 2:33:26 } +2024-07-25 22:38:12,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 244/ 1625], loss: 1.029, per_step_time: 1472ms, lr: 1.2240485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:12,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43426 samples/s/p 2:33:29 } +2024-07-25 22:38:15,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 246/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 1.2234417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:15,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43126 samples/s/p 2:33:31 } +2024-07-25 22:38:18,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 248/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.2228347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:18,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% 
|██████████████████████████████ | 5.43728 samples/s/p 2:33:18 } +2024-07-25 22:38:21,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 250/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 1.222228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:21,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43560 samples/s/p 2:33:18 } +2024-07-25 22:38:24,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 252/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 1.2216211e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:24,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43263 samples/s/p 2:33:20 } +2024-07-25 22:38:27,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 254/ 1625], loss: 1.171, per_step_time: 1483ms, lr: 1.2210142e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:27,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.39239 samples/s/p 2:34:26 } +2024-07-25 22:38:30,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 256/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 1.22040765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:30,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43730 samples/s/p 2:33:06 } +2024-07-25 22:38:33,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 258/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 1.2198011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:33,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43366 samples/s/p 2:33:10 } +2024-07-25 22:38:36,401 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 260/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 1.2191943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:36,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43777 samples/s/p 2:33:00 } +2024-07-25 22:38:39,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 262/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 1.218588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:39,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43170 samples/s/p 2:33:07 } +2024-07-25 22:38:42,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 264/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.21798175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:42,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43672 samples/s/p 2:32:56 } +2024-07-25 22:38:45,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 266/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 1.2173752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:45,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43063 samples/s/p 2:33:03 } +2024-07-25 22:38:48,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 268/ 1625], loss: 1.041, per_step_time: 1470ms, lr: 1.2167689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:48,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43864 samples/s/p 2:32:46 } +2024-07-25 22:38:51,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], 
step:[ 270/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 1.2161628e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:51,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.44176 samples/s/p 2:32:38 } +2024-07-25 22:38:54,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 272/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.2155563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:54,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43564 samples/s/p 2:32:46 } +2024-07-25 22:38:57,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 274/ 1625], loss: 1.170, per_step_time: 1473ms, lr: 1.2149503e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:57,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43028 samples/s/p 2:32:52 } +2024-07-25 22:39:00,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 276/ 1625], loss: 1.289, per_step_time: 1470ms, lr: 1.2143444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:00,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43883 samples/s/p 2:32:34 } +2024-07-25 22:39:02,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 278/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.2137382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:02,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43746 samples/s/p 2:32:34 } +2024-07-25 22:39:05,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 280/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.2131324e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:39:05,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43695 samples/s/p 2:32:32 } +2024-07-25 22:39:08,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 282/ 1625], loss: 0.942, per_step_time: 1471ms, lr: 1.2125265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:08,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43666 samples/s/p 2:32:29 } +2024-07-25 22:39:11,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 284/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 1.2119205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:11,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43546 samples/s/p 2:32:28 } +2024-07-25 22:39:14,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 286/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 1.2113149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:14,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.42990 samples/s/p 2:32:35 } +2024-07-25 22:39:17,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 288/ 1625], loss: 1.149, per_step_time: 1473ms, lr: 1.2107092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:17,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.42998 samples/s/p 2:32:32 } +2024-07-25 22:39:20,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 290/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 1.2101034e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:20,667 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.43255 samples/s/p 2:32:24 } +2024-07-25 22:39:23,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 292/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 1.209498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:23,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.43407 samples/s/p 2:32:19 } +2024-07-25 22:39:26,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 294/ 1625], loss: 1.100, per_step_time: 1474ms, lr: 1.2088927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:26,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.42738 samples/s/p 2:32:27 } +2024-07-25 22:39:29,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 296/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.2082872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:29,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.43592 samples/s/p 2:32:10 } +2024-07-25 22:39:32,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 298/ 1625], loss: 1.039, per_step_time: 1472ms, lr: 1.2076816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:32,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.43254 samples/s/p 2:32:13 } +2024-07-25 22:39:35,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 300/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 1.20707655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:35,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% 
|██████████████████████████████ | 5.43678 samples/s/p 2:32:03 } +2024-07-25 22:39:38,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 302/ 1625], loss: 1.079, per_step_time: 1471ms, lr: 1.2064713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:38,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.43561 samples/s/p 2:32:02 } +2024-07-25 22:39:41,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 304/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.2058658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:41,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.43553 samples/s/p 2:31:59 } +2024-07-25 22:39:44,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 306/ 1625], loss: 1.210, per_step_time: 1471ms, lr: 1.2052609e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:44,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.43677 samples/s/p 2:31:54 } +2024-07-25 22:39:47,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 308/ 1625], loss: 1.281, per_step_time: 1473ms, lr: 1.204656e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:47,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.42975 samples/s/p 2:32:03 } +2024-07-25 22:39:50,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 310/ 1625], loss: 1.238, per_step_time: 1469ms, lr: 1.2040508e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:50,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.44319 samples/s/p 2:31:37 } +2024-07-25 22:39:53,129 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 312/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 1.2034459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:53,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.43525 samples/s/p 2:31:47 } +2024-07-25 22:39:56,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 314/ 1625], loss: 1.315, per_step_time: 1470ms, lr: 1.2028412e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:56,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.44021 samples/s/p 2:31:36 } +2024-07-25 22:39:59,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 316/ 1625], loss: 1.227, per_step_time: 1473ms, lr: 1.2022362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:59,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.42897 samples/s/p 2:31:52 } +2024-07-25 22:40:01,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 318/ 1625], loss: 0.986, per_step_time: 1471ms, lr: 1.2016315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:01,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.43724 samples/s/p 2:31:35 } +2024-07-25 22:40:04,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 320/ 1625], loss: 1.050, per_step_time: 1470ms, lr: 1.20102695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:04,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.43883 samples/s/p 2:31:30 } +2024-07-25 22:40:07,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
322/ 1625], loss: 1.316, per_step_time: 1473ms, lr: 1.2004221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:07,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.43068 samples/s/p 2:31:40 } +2024-07-25 22:40:10,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 324/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 1.1998178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:10,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.43187 samples/s/p 2:31:35 } +2024-07-25 22:40:13,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 326/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 1.1992133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:13,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.43764 samples/s/p 2:31:23 } +2024-07-25 22:40:16,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 328/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.1986087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:16,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.43564 samples/s/p 2:31:23 } +2024-07-25 22:40:19,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 330/ 1625], loss: 1.036, per_step_time: 1472ms, lr: 1.1980044e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:19,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.43255 samples/s/p 2:31:25 } +2024-07-25 22:40:22,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 332/ 1625], loss: 1.238, per_step_time: 1474ms, lr: 1.1974002e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:40:22,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.42713 samples/s/p 2:31:32 } +2024-07-25 22:40:25,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 334/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.1967958e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:25,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43358 samples/s/p 2:31:18 } +2024-07-25 22:40:28,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 336/ 1625], loss: 1.379, per_step_time: 1472ms, lr: 1.1961917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:28,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43395 samples/s/p 2:31:14 } +2024-07-25 22:40:31,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 338/ 1625], loss: 0.951, per_step_time: 1471ms, lr: 1.1955879e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:31,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43718 samples/s/p 2:31:06 } +2024-07-25 22:40:34,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 340/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.1949837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:34,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43446 samples/s/p 2:31:08 } +2024-07-25 22:40:37,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 342/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 1.1943797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:37,400 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43507 samples/s/p 2:31:04 } +2024-07-25 22:40:40,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 344/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 1.1937759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:40,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43252 samples/s/p 2:31:05 } +2024-07-25 22:40:43,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 346/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 1.1931721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:43,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43121 samples/s/p 2:31:04 } +2024-07-25 22:40:46,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 348/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.1925681e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:46,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43592 samples/s/p 2:30:53 } +2024-07-25 22:40:49,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 350/ 1625], loss: 1.044, per_step_time: 1473ms, lr: 1.1919647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:49,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.42860 samples/s/p 2:31:03 } +2024-07-25 22:40:52,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 352/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 1.1913612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:52,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% 
|███████████████████████████████ | 5.43504 samples/s/p 2:30:49 } +2024-07-25 22:40:55,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 354/ 1625], loss: 1.036, per_step_time: 1472ms, lr: 1.1907574e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:55,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43353 samples/s/p 2:30:49 } +2024-07-25 22:40:58,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 356/ 1625], loss: 1.104, per_step_time: 1469ms, lr: 1.1901539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:58,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.44291 samples/s/p 2:30:30 } +2024-07-25 22:41:01,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 358/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.1895506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:01,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43125 samples/s/p 2:30:46 } +2024-07-25 22:41:03,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 360/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 1.1889471e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:03,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43704 samples/s/p 2:30:34 } +2024-07-25 22:41:06,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 362/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 1.1883438e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:06,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43602 samples/s/p 2:30:33 } +2024-07-25 
22:41:09,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 364/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 1.1877407e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:09,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43197 samples/s/p 2:30:36 } +2024-07-25 22:41:12,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 366/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 1.1871373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:12,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43488 samples/s/p 2:30:29 } +2024-07-25 22:41:15,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 368/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 1.1865344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:15,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43465 samples/s/p 2:30:26 } +2024-07-25 22:41:18,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 370/ 1625], loss: 1.003, per_step_time: 1471ms, lr: 1.1859313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:18,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43540 samples/s/p 2:30:22 } +2024-07-25 22:41:21,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 372/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 1.1853283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:21,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43861 samples/s/p 2:30:14 } +2024-07-25 22:41:24,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 374/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 1.1847255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:24,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43158 samples/s/p 2:30:22 } +2024-07-25 22:41:27,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 376/ 1625], loss: 0.970, per_step_time: 1472ms, lr: 1.1841228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:27,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43257 samples/s/p 2:30:18 } +2024-07-25 22:41:30,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 378/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 1.1835199e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:30,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43138 samples/s/p 2:30:17 } +2024-07-25 22:41:33,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 380/ 1625], loss: 1.070, per_step_time: 1473ms, lr: 1.1829171e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:33,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.42770 samples/s/p 2:30:20 } +2024-07-25 22:41:36,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 382/ 1625], loss: 1.006, per_step_time: 1471ms, lr: 1.1823147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:36,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43809 samples/s/p 2:30:00 } +2024-07-25 22:41:39,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 384/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 
1.181712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:39,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43882 samples/s/p 2:29:56 } +2024-07-25 22:41:42,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 386/ 1625], loss: 1.296, per_step_time: 1471ms, lr: 1.1811094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:42,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43611 samples/s/p 2:29:57 } +2024-07-25 22:41:45,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 388/ 1625], loss: 1.060, per_step_time: 1468ms, lr: 1.1805072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:45,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.44615 samples/s/p 2:29:38 } +2024-07-25 22:41:48,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 390/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 1.1799047e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:48,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43365 samples/s/p 2:29:55 } +2024-07-25 22:41:51,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 392/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 1.1793026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:51,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43600 samples/s/p 2:29:48 } +2024-07-25 22:41:54,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 394/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 1.1787003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:54,126 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43468 samples/s/p 2:29:48 } +2024-07-25 22:41:57,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 396/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 1.1780983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:57,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43378 samples/s/p 2:29:46 } +2024-07-25 22:42:00,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 398/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.1774961e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:00,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43128 samples/s/p 2:29:47 } +2024-07-25 22:42:02,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 400/ 1625], loss: 1.342, per_step_time: 1472ms, lr: 1.1768941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:02,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43124 samples/s/p 2:29:45 } +2024-07-25 22:42:05,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 402/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 1.17629215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:05,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43728 samples/s/p 2:29:32 } +2024-07-25 22:42:08,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 404/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.17569025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:08,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% 
|███████████████████████████████ | 5.43529 samples/s/p 2:29:32 } +2024-07-25 22:42:11,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 406/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 1.1750886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:11,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43422 samples/s/p 2:29:31 } +2024-07-25 22:42:14,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 408/ 1625], loss: 1.109, per_step_time: 1469ms, lr: 1.1744868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:14,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.44246 samples/s/p 2:29:14 } +2024-07-25 22:42:17,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 410/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 1.173885e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:17,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.44078 samples/s/p 2:29:14 } +2024-07-25 22:42:20,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 412/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 1.17328345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:20,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43203 samples/s/p 2:29:26 } +2024-07-25 22:42:23,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 414/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.1726819e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:23,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43460 samples/s/p 2:29:18 } +2024-07-25 
22:42:26,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 416/ 1625], loss: 1.134, per_step_time: 1482ms, lr: 1.1720804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:26,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.39591 samples/s/p 2:30:20 } +2024-07-25 22:42:29,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 418/ 1625], loss: 1.040, per_step_time: 1471ms, lr: 1.1714791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:29,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.43777 samples/s/p 2:29:07 } +2024-07-25 22:42:32,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 420/ 1625], loss: 1.119, per_step_time: 1473ms, lr: 1.1708779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:32,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.42742 samples/s/p 2:29:21 } +2024-07-25 22:42:35,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 422/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 1.1702766e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:35,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.43234 samples/s/p 2:29:10 } +2024-07-25 22:42:38,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 424/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 1.1696753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:38,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.43625 samples/s/p 2:29:01 } +2024-07-25 22:42:41,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 426/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.1690743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:41,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.43458 samples/s/p 2:29:01 } +2024-07-25 22:42:44,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 428/ 1625], loss: 1.312, per_step_time: 1477ms, lr: 1.1684731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:44,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.41567 samples/s/p 2:29:29 } +2024-07-25 22:42:47,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 430/ 1625], loss: 1.188, per_step_time: 1470ms, lr: 1.1678721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:47,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.44128 samples/s/p 2:28:44 } +2024-07-25 22:42:50,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 432/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 1.1672715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:50,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43508 samples/s/p 2:28:51 } +2024-07-25 22:42:53,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 434/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.1666704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:53,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43370 samples/s/p 2:28:50 } +2024-07-25 22:42:56,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 436/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 
1.1660698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:56,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43397 samples/s/p 2:28:47 } +2024-07-25 22:42:59,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 438/ 1625], loss: 1.297, per_step_time: 1472ms, lr: 1.1654692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:59,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43477 samples/s/p 2:28:43 } +2024-07-25 22:43:02,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 440/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 1.16486835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:02,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43527 samples/s/p 2:28:39 } +2024-07-25 22:43:04,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 442/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.164268e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:04,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43835 samples/s/p 2:28:31 } +2024-07-25 22:43:07,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 444/ 1625], loss: 0.998, per_step_time: 1472ms, lr: 1.1636675e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:07,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43421 samples/s/p 2:28:35 } +2024-07-25 22:43:10,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 446/ 1625], loss: 1.330, per_step_time: 1471ms, lr: 1.1630674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:10,881 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43527 samples/s/p 2:28:30 } +2024-07-25 22:43:13,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 448/ 1625], loss: 1.176, per_step_time: 1472ms, lr: 1.1624667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:13,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43205 samples/s/p 2:28:33 } +2024-07-25 22:43:16,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 450/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 1.1618667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:16,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43377 samples/s/p 2:28:27 } +2024-07-25 22:43:19,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 452/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 1.1612665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:19,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43465 samples/s/p 2:28:22 } +2024-07-25 22:43:22,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 454/ 1625], loss: 1.051, per_step_time: 1470ms, lr: 1.1606662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:22,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.44003 samples/s/p 2:28:11 } +2024-07-25 22:43:25,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 456/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 1.1600662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:25,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% 
|███████████████████████████████ | 5.44063 samples/s/p 2:28:07 } +2024-07-25 22:43:28,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 458/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 1.1594662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:28,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43206 samples/s/p 2:28:18 } +2024-07-25 22:43:31,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 460/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.1588663e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:31,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43796 samples/s/p 2:28:05 } +2024-07-25 22:43:34,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 462/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 1.1582666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:34,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43804 samples/s/p 2:28:02 } +2024-07-25 22:43:37,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 464/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 1.157667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:37,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.44077 samples/s/p 2:27:55 } +2024-07-25 22:43:40,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 466/ 1625], loss: 1.144, per_step_time: 1470ms, lr: 1.1570671e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:40,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.44031 samples/s/p 2:27:53 } +2024-07-25 
22:43:43,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 468/ 1625], loss: 1.305, per_step_time: 1474ms, lr: 1.1564674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:43,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.42611 samples/s/p 2:28:13 } +2024-07-25 22:43:46,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 470/ 1625], loss: 1.021, per_step_time: 1469ms, lr: 1.1558682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:46,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.44269 samples/s/p 2:27:43 } +2024-07-25 22:43:49,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 472/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.15526855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:49,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.43223 samples/s/p 2:27:57 } +2024-07-25 22:43:52,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 474/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.1546691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:52,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.43541 samples/s/p 2:27:49 } +2024-07-25 22:43:55,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 476/ 1625], loss: 1.129, per_step_time: 1473ms, lr: 1.1540699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:55,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.42911 samples/s/p 2:27:56 } +2024-07-25 22:43:58,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 478/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 1.1534705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:58,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.43880 samples/s/p 2:27:37 } +2024-07-25 22:44:01,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 480/ 1625], loss: 1.042, per_step_time: 1471ms, lr: 1.1528715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:01,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43500 samples/s/p 2:27:41 } +2024-07-25 22:44:03,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 482/ 1625], loss: 1.275, per_step_time: 1470ms, lr: 1.1522724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:03,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43851 samples/s/p 2:27:32 } +2024-07-25 22:44:06,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 484/ 1625], loss: 1.166, per_step_time: 1470ms, lr: 1.1516731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:06,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43992 samples/s/p 2:27:27 } +2024-07-25 22:44:09,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 486/ 1625], loss: 1.041, per_step_time: 1472ms, lr: 1.1510744e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:09,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43425 samples/s/p 2:27:33 } +2024-07-25 22:44:12,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 488/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 
1.1504755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:12,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43920 samples/s/p 2:27:22 } +2024-07-25 22:44:15,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 490/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.1498765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:15,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43383 samples/s/p 2:27:28 } +2024-07-25 22:44:18,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 492/ 1625], loss: 1.266, per_step_time: 1473ms, lr: 1.149278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:18,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.42824 samples/s/p 2:27:34 } +2024-07-25 22:44:21,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 494/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 1.1486794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:21,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43254 samples/s/p 2:27:24 } +2024-07-25 22:44:24,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 496/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 1.1480808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:24,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.43381 samples/s/p 2:27:19 } +2024-07-25 22:44:27,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 498/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 1.1474822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:27,601 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.42943 samples/s/p 2:27:23 } +2024-07-25 22:44:30,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 500/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 1.1468839e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:30,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.42941 samples/s/p 2:27:20 } +2024-07-25 22:44:33,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 502/ 1625], loss: 1.107, per_step_time: 1473ms, lr: 1.1462855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:33,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.42870 samples/s/p 2:27:18 } +2024-07-25 22:44:36,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 504/ 1625], loss: 1.083, per_step_time: 1473ms, lr: 1.1456871e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:36,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.42920 samples/s/p 2:27:15 } +2024-07-25 22:44:39,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 506/ 1625], loss: 1.135, per_step_time: 1482ms, lr: 1.145089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:39,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.39793 samples/s/p 2:28:03 } +2024-07-25 22:44:42,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 508/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 1.144491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:42,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% 
|███████████████████████████████ | 5.42907 samples/s/p 2:27:09 } +2024-07-25 22:44:45,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 510/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 1.1438929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:45,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.43243 samples/s/p 2:27:01 } +2024-07-25 22:44:48,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 512/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 1.1432948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:48,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43748 samples/s/p 2:26:49 } +2024-07-25 22:44:51,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 514/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 1.1426971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:51,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43414 samples/s/p 2:26:52 } +2024-07-25 22:44:54,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 516/ 1625], loss: 1.334, per_step_time: 1470ms, lr: 1.142099e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:54,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.44091 samples/s/p 2:26:38 } +2024-07-25 22:44:57,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 518/ 1625], loss: 1.101, per_step_time: 1469ms, lr: 1.14150125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:57,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.44336 samples/s/p 2:26:31 } +2024-07-25 
22:45:00,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 520/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 1.1409037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:00,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43483 samples/s/p 2:26:42 } +2024-07-25 22:45:03,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 522/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 1.140306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:03,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43897 samples/s/p 2:26:32 } +2024-07-25 22:45:05,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 524/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.1397086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:05,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43767 samples/s/p 2:26:31 } +2024-07-25 22:45:08,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 526/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 1.1391111e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:08,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43462 samples/s/p 2:26:33 } +2024-07-25 22:45:11,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 528/ 1625], loss: 1.398, per_step_time: 1471ms, lr: 1.1385136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:11,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43638 samples/s/p 2:26:28 } +2024-07-25 22:45:14,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 530/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 1.1379165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:14,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.44056 samples/s/p 2:26:18 } +2024-07-25 22:45:17,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 532/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 1.1373192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:17,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.44120 samples/s/p 2:26:14 } +2024-07-25 22:45:20,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 534/ 1625], loss: 1.329, per_step_time: 1472ms, lr: 1.136722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:20,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.43475 samples/s/p 2:26:22 } +2024-07-25 22:45:23,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 536/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.136125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:23,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.43307 samples/s/p 2:26:21 } +2024-07-25 22:45:26,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 538/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 1.13552815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:26,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.42751 samples/s/p 2:26:27 } +2024-07-25 22:45:29,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 540/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 
1.134931e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:29,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.43127 samples/s/p 2:26:18 } +2024-07-25 22:45:32,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 542/ 1625], loss: 1.105, per_step_time: 1469ms, lr: 1.1343341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:32,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.44233 samples/s/p 2:25:58 } +2024-07-25 22:45:35,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 544/ 1625], loss: 1.318, per_step_time: 1472ms, lr: 1.1337375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:35,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.43284 samples/s/p 2:26:10 } +2024-07-25 22:45:38,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 546/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 1.1331409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:38,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43069 samples/s/p 2:26:10 } +2024-07-25 22:45:41,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 548/ 1625], loss: 1.302, per_step_time: 1471ms, lr: 1.1325442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:41,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43674 samples/s/p 2:25:58 } +2024-07-25 22:45:44,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 550/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 1.13194765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:44,348 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43205 samples/s/p 2:26:02 } +2024-07-25 22:45:47,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 552/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.1313513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:47,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43804 samples/s/p 2:25:50 } +2024-07-25 22:45:50,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 554/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 1.13075475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:50,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43564 samples/s/p 2:25:51 } +2024-07-25 22:45:53,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 556/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 1.1301585e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:53,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43694 samples/s/p 2:25:46 } +2024-07-25 22:45:56,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 558/ 1625], loss: 1.312, per_step_time: 1473ms, lr: 1.1295624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:56,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43018 samples/s/p 2:25:54 } +2024-07-25 22:45:59,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 560/ 1625], loss: 1.206, per_step_time: 1472ms, lr: 1.1289661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:59,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% 
|███████████████████████████████ | 5.43346 samples/s/p 2:25:45 } +2024-07-25 22:46:02,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 562/ 1625], loss: 1.105, per_step_time: 1470ms, lr: 1.12837015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:02,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.44174 samples/s/p 2:25:29 } +2024-07-25 22:46:05,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 564/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 1.1277741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:05,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43427 samples/s/p 2:25:38 } +2024-07-25 22:46:07,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 566/ 1625], loss: 1.033, per_step_time: 1472ms, lr: 1.127178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:07,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43394 samples/s/p 2:25:36 } +2024-07-25 22:46:10,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 568/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 1.1265823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:10,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43787 samples/s/p 2:25:26 } +2024-07-25 22:46:13,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 570/ 1625], loss: 1.018, per_step_time: 1471ms, lr: 1.1259866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:13,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43668 samples/s/p 2:25:25 } +2024-07-25 
22:46:16,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 572/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 1.1253907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:16,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43520 samples/s/p 2:25:25 } +2024-07-25 22:46:19,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 574/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 1.1247953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:19,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43772 samples/s/p 2:25:18 } +2024-07-25 22:46:22,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 576/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 1.1241998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:22,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43620 samples/s/p 2:25:17 } +2024-07-25 22:46:25,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 578/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 1.1236043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:25,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.42786 samples/s/p 2:25:28 } +2024-07-25 22:46:28,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 580/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.1230089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:28,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43420 samples/s/p 2:25:15 } +2024-07-25 22:46:31,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 582/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 1.1224138e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:31,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.42837 samples/s/p 2:25:21 } +2024-07-25 22:46:34,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 584/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.1218183e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:34,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43412 samples/s/p 2:25:09 } +2024-07-25 22:46:37,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 586/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 1.12122325e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:37,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43221 samples/s/p 2:25:09 } +2024-07-25 22:46:40,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 588/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.12062835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:40,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43705 samples/s/p 2:24:58 } +2024-07-25 22:46:43,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 590/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 1.1200332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:43,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43146 samples/s/p 2:25:04 } +2024-07-25 22:46:46,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 592/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 
1.1194385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:46,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43498 samples/s/p 2:24:56 } +2024-07-25 22:46:49,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 594/ 1625], loss: 0.902, per_step_time: 1468ms, lr: 1.11884365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:49,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.44602 samples/s/p 2:24:35 } +2024-07-25 22:46:52,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 596/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.118249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:52,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.43505 samples/s/p 2:24:50 } +2024-07-25 22:46:55,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 598/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 1.1176542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:55,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.43945 samples/s/p 2:24:40 } +2024-07-25 22:46:58,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 600/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 1.1170596e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:58,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.43026 samples/s/p 2:24:52 } +2024-07-25 22:47:01,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 602/ 1625], loss: 1.317, per_step_time: 1474ms, lr: 1.1164652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:01,074 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.42590 samples/s/p 2:24:56 } +2024-07-25 22:47:04,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 604/ 1625], loss: 1.273, per_step_time: 1473ms, lr: 1.1158707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:04,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.43002 samples/s/p 2:24:46 } +2024-07-25 22:47:06,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 606/ 1625], loss: 1.083, per_step_time: 1470ms, lr: 1.1152764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:06,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.43979 samples/s/p 2:24:27 } +2024-07-25 22:47:09,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 608/ 1625], loss: 1.287, per_step_time: 1470ms, lr: 1.1146822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:09,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.44037 samples/s/p 2:24:24 } +2024-07-25 22:47:12,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 610/ 1625], loss: 1.255, per_step_time: 1473ms, lr: 1.1140879e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:12,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43076 samples/s/p 2:24:36 } +2024-07-25 22:47:15,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 612/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.1134939e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:15,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% 
|███████████████████████████████ | 5.43659 samples/s/p 2:24:24 } +2024-07-25 22:47:18,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 614/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 1.1128999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:18,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43664 samples/s/p 2:24:21 } +2024-07-25 22:47:21,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 616/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.1123058e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:21,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43336 samples/s/p 2:24:23 } +2024-07-25 22:47:24,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 618/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.111712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:24,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43372 samples/s/p 2:24:20 } +2024-07-25 22:47:27,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 620/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 1.1111185e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:27,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43289 samples/s/p 2:24:18 } +2024-07-25 22:47:30,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 622/ 1625], loss: 1.071, per_step_time: 1470ms, lr: 1.1105246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:30,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43867 samples/s/p 2:24:06 } +2024-07-25 
22:47:33,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 624/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 1.109931e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:33,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43570 samples/s/p 2:24:08 } +2024-07-25 22:47:36,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 626/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 1.1093375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:36,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43347 samples/s/p 2:24:08 } +2024-07-25 22:47:39,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 628/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.108744e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:39,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43129 samples/s/p 2:24:09 } +2024-07-25 22:47:42,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 630/ 1625], loss: 0.976, per_step_time: 1469ms, lr: 1.1081505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:42,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.44239 samples/s/p 2:23:48 } +2024-07-25 22:47:45,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 632/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 1.10755755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:45,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43545 samples/s/p 2:23:56 } +2024-07-25 22:47:48,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 634/ 1625], loss: 1.039, per_step_time: 1472ms, lr: 1.1069641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:48,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43455 samples/s/p 2:23:55 } +2024-07-25 22:47:51,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 636/ 1625], loss: 1.036, per_step_time: 1471ms, lr: 1.1063711e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:51,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43536 samples/s/p 2:23:50 } +2024-07-25 22:47:54,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 638/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.105778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:54,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.44033 samples/s/p 2:23:40 } +2024-07-25 22:47:57,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 640/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 1.10518495e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:57,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43482 samples/s/p 2:23:45 } +2024-07-25 22:48:00,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 642/ 1625], loss: 1.280, per_step_time: 1472ms, lr: 1.1045922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:00,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.43350 samples/s/p 2:23:45 } +2024-07-25 22:48:03,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 644/ 1625], loss: 1.153, per_step_time: 1483ms, lr: 
1.1039994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:03,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.39421 samples/s/p 2:24:44 } +2024-07-25 22:48:06,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 646/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 1.1034069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:06,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.43477 samples/s/p 2:23:37 } +2024-07-25 22:48:08,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 648/ 1625], loss: 1.085, per_step_time: 1469ms, lr: 1.1028141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:08,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.44514 samples/s/p 2:23:17 } +2024-07-25 22:48:11,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 650/ 1625], loss: 1.193, per_step_time: 1471ms, lr: 1.1022217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:11,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43689 samples/s/p 2:23:27 } +2024-07-25 22:48:14,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 652/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 1.1016292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:14,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43385 samples/s/p 2:23:29 } +2024-07-25 22:48:17,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 654/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 1.10103665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:17,812 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43018 samples/s/p 2:23:32 } +2024-07-25 22:48:20,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 656/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 1.1004445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:20,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43818 samples/s/p 2:23:16 } +2024-07-25 22:48:23,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 658/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.0998522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:23,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43304 samples/s/p 2:23:22 } +2024-07-25 22:48:26,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 660/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 1.09926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:26,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43398 samples/s/p 2:23:17 } +2024-07-25 22:48:29,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 662/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 1.098668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:29,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43699 samples/s/p 2:23:10 } +2024-07-25 22:48:32,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 664/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 1.0980762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:32,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% 
|████████████████████████████████ | 5.43378 samples/s/p 2:23:12 } +2024-07-25 22:48:35,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 666/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 1.0974843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:35,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43391 samples/s/p 2:23:09 } +2024-07-25 22:48:38,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 668/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.0968924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:38,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43691 samples/s/p 2:23:01 } +2024-07-25 22:48:41,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 670/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 1.0963008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:41,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.44124 samples/s/p 2:22:51 } +2024-07-25 22:48:44,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 672/ 1625], loss: 1.151, per_step_time: 1473ms, lr: 1.095709e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:44,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.42966 samples/s/p 2:23:06 } +2024-07-25 22:48:47,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 674/ 1625], loss: 1.031, per_step_time: 1471ms, lr: 1.0951174e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:47,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43545 samples/s/p 2:22:54 } +2024-07-25 
22:48:50,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 676/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 1.0945262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:50,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43465 samples/s/p 2:22:53 } +2024-07-25 22:48:53,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 678/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.0939346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:53,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43685 samples/s/p 2:22:46 } +2024-07-25 22:48:56,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 680/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 1.0933434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:56,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43323 samples/s/p 2:22:49 } +2024-07-25 22:48:59,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 682/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 1.0927522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:59,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43054 samples/s/p 2:22:50 } +2024-07-25 22:49:02,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 684/ 1625], loss: 1.053, per_step_time: 1472ms, lr: 1.0921609e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:02,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43465 samples/s/p 2:22:41 } +2024-07-25 22:49:05,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 7/ 10], step:[ 686/ 1625], loss: 1.262, per_step_time: 1473ms, lr: 1.0915701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:05,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43105 samples/s/p 2:22:44 } +2024-07-25 22:49:07,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 688/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.0909791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:07,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43259 samples/s/p 2:22:38 } +2024-07-25 22:49:10,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 690/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.0903882e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:10,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43663 samples/s/p 2:22:29 } +2024-07-25 22:49:13,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 692/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 1.0897974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:13,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43877 samples/s/p 2:22:23 } +2024-07-25 22:49:16,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 694/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.08920685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:16,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43568 samples/s/p 2:22:25 } +2024-07-25 22:49:19,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 696/ 1625], loss: 1.368, per_step_time: 1472ms, lr: 
1.088616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:19,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43442 samples/s/p 2:22:24 } +2024-07-25 22:49:22,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 698/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 1.0880255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:22,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43528 samples/s/p 2:22:19 } +2024-07-25 22:49:25,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 700/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 1.0874353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:25,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43497 samples/s/p 2:22:17 } +2024-07-25 22:49:28,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 702/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 1.086845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:28,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43299 samples/s/p 2:22:17 } +2024-07-25 22:49:31,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 704/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.0862545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:31,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43437 samples/s/p 2:22:12 } +2024-07-25 22:49:34,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 706/ 1625], loss: 1.132, per_step_time: 1473ms, lr: 1.0856644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:34,539 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43033 samples/s/p 2:22:15 } +2024-07-25 22:49:37,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 708/ 1625], loss: 1.209, per_step_time: 1473ms, lr: 1.0850745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:37,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.43049 samples/s/p 2:22:12 } +2024-07-25 22:49:40,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 710/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 1.0844842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:40,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.43814 samples/s/p 2:21:57 } +2024-07-25 22:49:43,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 712/ 1625], loss: 1.160, per_step_time: 1470ms, lr: 1.0838942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:43,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.43860 samples/s/p 2:21:53 } +2024-07-25 22:49:46,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 714/ 1625], loss: 1.252, per_step_time: 1473ms, lr: 1.0833046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:46,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.42832 samples/s/p 2:22:07 } +2024-07-25 22:49:49,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 716/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 1.0827147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:49,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% 
|████████████████████████████████ | 5.43374 samples/s/p 2:21:55 } +2024-07-25 22:49:52,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 718/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 1.0821252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:52,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.43778 samples/s/p 2:21:46 } +2024-07-25 22:49:55,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 720/ 1625], loss: 1.165, per_step_time: 1469ms, lr: 1.08153545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:55,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.44333 samples/s/p 2:21:34 } +2024-07-25 22:49:58,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 722/ 1625], loss: 1.249, per_step_time: 1471ms, lr: 1.0809458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:58,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.43819 samples/s/p 2:21:39 } +2024-07-25 22:50:01,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 724/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 1.0803566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:01,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43200 samples/s/p 2:21:46 } +2024-07-25 22:50:04,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 726/ 1625], loss: 0.949, per_step_time: 1472ms, lr: 1.0797673e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:04,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43246 samples/s/p 2:21:42 } +2024-07-25 
22:50:06,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 728/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 1.0791779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:06,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43412 samples/s/p 2:21:37 } +2024-07-25 22:50:09,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 730/ 1625], loss: 1.182, per_step_time: 1470ms, lr: 1.0785889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:09,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43853 samples/s/p 2:21:27 } +2024-07-25 22:50:12,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 732/ 1625], loss: 1.101, per_step_time: 1474ms, lr: 1.0779999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:12,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.42548 samples/s/p 2:21:45 } +2024-07-25 22:50:15,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 734/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.0774107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:15,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43997 samples/s/p 2:21:19 } +2024-07-25 22:50:18,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 736/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 1.0768219e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:18,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43190 samples/s/p 2:21:29 } +2024-07-25 22:50:21,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 7/ 10], step:[ 738/ 1625], loss: 1.001, per_step_time: 1470ms, lr: 1.0762332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:21,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.44051 samples/s/p 2:21:12 } +2024-07-25 22:50:24,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 740/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.0756443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:24,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43687 samples/s/p 2:21:15 } +2024-07-25 22:50:27,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 742/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 1.0750557e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:27,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43032 samples/s/p 2:21:22 } +2024-07-25 22:50:30,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 744/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 1.0744673e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:30,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43627 samples/s/p 2:21:10 } +2024-07-25 22:50:33,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 746/ 1625], loss: 1.217, per_step_time: 1473ms, lr: 1.0738787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:33,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.42909 samples/s/p 2:21:18 } +2024-07-25 22:50:36,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 748/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 
1.0732904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:36,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43313 samples/s/p 2:21:09 } +2024-07-25 22:50:39,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 750/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.0727022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:39,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43541 samples/s/p 2:21:03 } +2024-07-25 22:50:42,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 752/ 1625], loss: 1.028, per_step_time: 1472ms, lr: 1.0721141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:42,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43333 samples/s/p 2:21:03 } +2024-07-25 22:50:45,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 754/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 1.0715258e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:45,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43579 samples/s/p 2:20:56 } +2024-07-25 22:50:48,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 756/ 1625], loss: 0.860, per_step_time: 1470ms, lr: 1.0709378e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:48,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.43875 samples/s/p 2:20:48 } +2024-07-25 22:50:51,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 758/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 1.07035e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:51,270 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.42885 samples/s/p 2:21:01 } +2024-07-25 22:50:54,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 760/ 1625], loss: 1.199, per_step_time: 1469ms, lr: 1.069762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:54,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.44248 samples/s/p 2:20:37 } +2024-07-25 22:50:57,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 762/ 1625], loss: 1.022, per_step_time: 1473ms, lr: 1.0691743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:57,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.42961 samples/s/p 2:20:54 } +2024-07-25 22:51:00,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 764/ 1625], loss: 1.092, per_step_time: 1473ms, lr: 1.0685868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:00,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.42971 samples/s/p 2:20:51 } +2024-07-25 22:51:03,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 766/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 1.067999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:03,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.43221 samples/s/p 2:20:44 } +2024-07-25 22:51:06,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 768/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 1.0674116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:06,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% 
|████████████████████████████████ | 5.42917 samples/s/p 2:20:46 } +2024-07-25 22:51:08,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 770/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 1.0668243e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:08,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.43199 samples/s/p 2:20:38 } +2024-07-25 22:51:11,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 772/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 1.0662368e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:11,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43712 samples/s/p 2:20:27 } +2024-07-25 22:51:14,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 774/ 1625], loss: 1.005, per_step_time: 1472ms, lr: 1.0656497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:14,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43296 samples/s/p 2:20:31 } +2024-07-25 22:51:17,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 776/ 1625], loss: 1.045, per_step_time: 1473ms, lr: 1.0650628e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:17,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43096 samples/s/p 2:20:31 } +2024-07-25 22:51:20,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 778/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.0644755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:20,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43721 samples/s/p 2:20:19 } +2024-07-25 
22:51:23,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 780/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 1.0638886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:23,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43007 samples/s/p 2:20:27 } +2024-07-25 22:51:26,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 782/ 1625], loss: 0.979, per_step_time: 1471ms, lr: 1.0633018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:26,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43580 samples/s/p 2:20:15 } +2024-07-25 22:51:29,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 784/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 1.062715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:29,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43120 samples/s/p 2:20:19 } +2024-07-25 22:51:32,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 786/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 1.0621283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:32,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43119 samples/s/p 2:20:16 } +2024-07-25 22:51:35,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 788/ 1625], loss: 1.092, per_step_time: 1473ms, lr: 1.0615418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:35,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.42990 samples/s/p 2:20:15 } +2024-07-25 22:51:38,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 790/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 1.0609552e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:38,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43507 samples/s/p 2:20:04 } +2024-07-25 22:51:41,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 792/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 1.0603689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:41,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43725 samples/s/p 2:19:58 } +2024-07-25 22:51:44,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 794/ 1625], loss: 1.330, per_step_time: 1473ms, lr: 1.0597825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:44,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43072 samples/s/p 2:20:05 } +2024-07-25 22:51:47,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 796/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.0591963e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:47,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43216 samples/s/p 2:20:00 } +2024-07-25 22:51:50,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 798/ 1625], loss: 1.408, per_step_time: 1471ms, lr: 1.0586102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:50,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43482 samples/s/p 2:19:53 } +2024-07-25 22:51:53,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 800/ 1625], loss: 0.949, per_step_time: 1471ms, lr: 
1.0580241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:53,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43682 samples/s/p 2:19:47 } +2024-07-25 22:51:56,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 802/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 1.0574383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:56,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43327 samples/s/p 2:19:49 } +2024-07-25 22:51:59,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 804/ 1625], loss: 1.417, per_step_time: 1471ms, lr: 1.0568523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:59,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43772 samples/s/p 2:19:39 } +2024-07-25 22:52:02,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 806/ 1625], loss: 1.361, per_step_time: 1473ms, lr: 1.0562667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:02,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43107 samples/s/p 2:19:47 } +2024-07-25 22:52:05,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 808/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.055681e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:05,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43456 samples/s/p 2:19:38 } +2024-07-25 22:52:08,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 810/ 1625], loss: 0.900, per_step_time: 1470ms, lr: 1.05509525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:08,012 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43970 samples/s/p 2:19:28 } +2024-07-25 22:52:10,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 812/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 1.0545098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:10,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43523 samples/s/p 2:19:32 } +2024-07-25 22:52:13,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 814/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 1.0539245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:13,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43314 samples/s/p 2:19:32 } +2024-07-25 22:52:16,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 816/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 1.0533389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:16,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43725 samples/s/p 2:19:23 } +2024-07-25 22:52:19,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 818/ 1625], loss: 1.343, per_step_time: 1472ms, lr: 1.05275385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:19,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43401 samples/s/p 2:19:25 } +2024-07-25 22:52:22,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 820/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 1.0521689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:22,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% 
|████████████████████████████████ | 5.43826 samples/s/p 2:19:15 } +2024-07-25 22:52:25,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 822/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.0515838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:25,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43492 samples/s/p 2:19:17 } +2024-07-25 22:52:28,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 824/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 1.0509987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:28,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43475 samples/s/p 2:19:15 } +2024-07-25 22:52:31,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 826/ 1625], loss: 1.294, per_step_time: 1474ms, lr: 1.0504141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:31,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.42538 samples/s/p 2:19:26 } +2024-07-25 22:52:34,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 828/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 1.0498291e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:34,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43249 samples/s/p 2:19:12 } +2024-07-25 22:52:37,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 830/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 1.0492444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:37,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43585 samples/s/p 2:19:04 } +2024-07-25 
22:52:40,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 832/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.0486599e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:40,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43433 samples/s/p 2:19:03 } +2024-07-25 22:52:43,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 834/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 1.0480753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:43,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43694 samples/s/p 2:18:57 } +2024-07-25 22:52:46,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 836/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.04749115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:46,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43946 samples/s/p 2:18:50 } +2024-07-25 22:52:49,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 838/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 1.0469068e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:49,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43538 samples/s/p 2:18:53 } +2024-07-25 22:52:52,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 840/ 1625], loss: 1.130, per_step_time: 1470ms, lr: 1.04632245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:52,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43861 samples/s/p 2:18:45 } +2024-07-25 22:52:55,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 7/ 10], step:[ 842/ 1625], loss: 1.301, per_step_time: 1470ms, lr: 1.0457384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:55,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43966 samples/s/p 2:18:41 } +2024-07-25 22:52:58,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 844/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 1.0451544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:58,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.44073 samples/s/p 2:18:36 } +2024-07-25 22:53:01,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 846/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 1.0445704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:01,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43598 samples/s/p 2:18:40 } +2024-07-25 22:53:04,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 848/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.0439867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:04,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43813 samples/s/p 2:18:34 } +2024-07-25 22:53:07,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 850/ 1625], loss: 1.063, per_step_time: 1469ms, lr: 1.043403e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:07,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.44373 samples/s/p 2:18:23 } +2024-07-25 22:53:09,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 852/ 1625], loss: 1.396, per_step_time: 1472ms, lr: 
1.0428194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:09,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43139 samples/s/p 2:18:39 } +2024-07-25 22:53:12,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 854/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.0422356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:12,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43476 samples/s/p 2:18:30 } +2024-07-25 22:53:15,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 856/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 1.0416523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:15,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43888 samples/s/p 2:18:21 } +2024-07-25 22:53:18,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 858/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 1.0410689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:18,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43445 samples/s/p 2:18:25 } +2024-07-25 22:53:21,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 860/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 1.0404857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:21,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43560 samples/s/p 2:18:20 } +2024-07-25 22:53:24,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 862/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 1.0399025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:24,720 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43959 samples/s/p 2:18:11 } +2024-07-25 22:53:27,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 864/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.0393195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:27,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43789 samples/s/p 2:18:11 } +2024-07-25 22:53:30,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 866/ 1625], loss: 1.066, per_step_time: 1472ms, lr: 1.03873645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:30,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43158 samples/s/p 2:18:18 } +2024-07-25 22:53:33,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 868/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.0381535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:33,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43601 samples/s/p 2:18:08 } +2024-07-25 22:53:36,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 870/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.03757075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:36,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.43434 samples/s/p 2:18:08 } +2024-07-25 22:53:39,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 872/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 1.036988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:39,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% 
|████████████████████████████████ | 5.43742 samples/s/p 2:18:00 } +2024-07-25 22:53:42,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 874/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 1.0364055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:42,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.43831 samples/s/p 2:17:56 } +2024-07-25 22:53:45,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 876/ 1625], loss: 1.165, per_step_time: 1469ms, lr: 1.035823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:45,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.44327 samples/s/p 2:17:45 } +2024-07-25 22:53:48,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 878/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 1.03524035e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:48,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.43686 samples/s/p 2:17:52 } +2024-07-25 22:53:51,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 880/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 1.0346582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:51,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.44110 samples/s/p 2:17:43 } +2024-07-25 22:53:54,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 882/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 1.0340759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:54,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.44162 samples/s/p 2:17:39 } +2024-07-25 
22:53:57,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 884/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 1.0334936e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:57,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.43313 samples/s/p 2:17:49 } +2024-07-25 22:54:00,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 886/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 1.0329118e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:00,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43342 samples/s/p 2:17:45 } +2024-07-25 22:54:03,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 888/ 1625], loss: 1.220, per_step_time: 1473ms, lr: 1.03233e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:03,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43009 samples/s/p 2:17:47 } +2024-07-25 22:54:06,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 890/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 1.031748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:06,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43295 samples/s/p 2:17:40 } +2024-07-25 22:54:08,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 892/ 1625], loss: 0.970, per_step_time: 1472ms, lr: 1.0311662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:08,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43182 samples/s/p 2:17:39 } +2024-07-25 22:54:11,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 894/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 1.0305846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:11,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43145 samples/s/p 2:17:37 } +2024-07-25 22:54:14,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 896/ 1625], loss: 1.133, per_step_time: 1469ms, lr: 1.0300029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:14,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.44250 samples/s/p 2:17:17 } +2024-07-25 22:54:17,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 898/ 1625], loss: 1.080, per_step_time: 1473ms, lr: 1.0294214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:17,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43090 samples/s/p 2:17:32 } +2024-07-25 22:54:20,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 900/ 1625], loss: 1.331, per_step_time: 1473ms, lr: 1.0288402e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:20,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.42762 samples/s/p 2:17:34 } +2024-07-25 22:54:23,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 902/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 1.0282591e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:23,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43760 samples/s/p 2:17:15 } +2024-07-25 22:54:26,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 904/ 1625], loss: 1.455, per_step_time: 1470ms, lr: 
1.0276777e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:26,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.44123 samples/s/p 2:17:07 } +2024-07-25 22:54:29,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 906/ 1625], loss: 1.311, per_step_time: 1471ms, lr: 1.0270966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:29,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43600 samples/s/p 2:17:12 } +2024-07-25 22:54:32,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 908/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 1.0265158e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:32,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.44003 samples/s/p 2:17:03 } +2024-07-25 22:54:35,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 910/ 1625], loss: 1.239, per_step_time: 1473ms, lr: 1.0259348e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:35,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43071 samples/s/p 2:17:14 } +2024-07-25 22:54:38,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 912/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 1.025354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:38,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43494 samples/s/p 2:17:05 } +2024-07-25 22:54:41,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 914/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 1.0247734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:41,436 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43456 samples/s/p 2:17:02 } +2024-07-25 22:54:44,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 916/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 1.0241926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:44,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.44026 samples/s/p 2:16:51 } +2024-07-25 22:54:47,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 918/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 1.0236123e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:47,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.44207 samples/s/p 2:16:45 } +2024-07-25 22:54:50,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 920/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 1.0230318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:50,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43434 samples/s/p 2:16:54 } +2024-07-25 22:54:53,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 922/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 1.0224514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:53,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43996 samples/s/p 2:16:43 } +2024-07-25 22:54:56,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 924/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 1.0218713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:56,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% 
|████████████████████████████████ | 5.43103 samples/s/p 2:16:53 } +2024-07-25 22:54:59,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 926/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 1.0212912e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:59,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43575 samples/s/p 2:16:43 } +2024-07-25 22:55:02,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 928/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.020711e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:02,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43660 samples/s/p 2:16:39 } +2024-07-25 22:55:05,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 930/ 1625], loss: 1.301, per_step_time: 1471ms, lr: 1.0201312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:05,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43685 samples/s/p 2:16:35 } +2024-07-25 22:55:07,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 932/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 1.0195516e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:07,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43571 samples/s/p 2:16:34 } +2024-07-25 22:55:10,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 934/ 1625], loss: 1.258, per_step_time: 1475ms, lr: 1.0189717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:10,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.42356 samples/s/p 2:16:50 } +2024-07-25 
22:55:13,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 936/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 1.01839205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:13,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43072 samples/s/p 2:16:36 } +2024-07-25 22:55:16,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 938/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 1.0178127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:16,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43419 samples/s/p 2:16:28 } +2024-07-25 22:55:19,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 940/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 1.017233e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:19,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43294 samples/s/p 2:16:27 } +2024-07-25 22:55:22,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 942/ 1625], loss: 1.010, per_step_time: 1471ms, lr: 1.0166537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:22,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43577 samples/s/p 2:16:19 } +2024-07-25 22:55:25,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 944/ 1625], loss: 1.362, per_step_time: 1473ms, lr: 1.0160747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:25,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.42963 samples/s/p 2:16:26 } +2024-07-25 22:55:28,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 7/ 10], step:[ 946/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 1.0154953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:28,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43978 samples/s/p 2:16:07 } +2024-07-25 22:55:31,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 948/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 1.0149164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:31,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43327 samples/s/p 2:16:14 } +2024-07-25 22:55:34,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 950/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 1.0143374e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:34,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43835 samples/s/p 2:16:04 } +2024-07-25 22:55:37,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 952/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.0137587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:37,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43476 samples/s/p 2:16:06 } +2024-07-25 22:55:40,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 954/ 1625], loss: 1.328, per_step_time: 1469ms, lr: 1.0131798e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:40,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.44234 samples/s/p 2:15:52 } +2024-07-25 22:55:43,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 956/ 1625], loss: 1.227, per_step_time: 1473ms, lr: 
1.0126013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:43,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43058 samples/s/p 2:16:07 } +2024-07-25 22:55:46,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 958/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 1.0120229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:46,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43831 samples/s/p 2:15:52 } +2024-07-25 22:55:49,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 960/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 1.0114442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:49,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43477 samples/s/p 2:15:54 } +2024-07-25 22:55:52,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 962/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.0108661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:52,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43473 samples/s/p 2:15:52 } +2024-07-25 22:55:55,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 964/ 1625], loss: 1.234, per_step_time: 1469ms, lr: 1.0102878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:55,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.44251 samples/s/p 2:15:37 } +2024-07-25 22:55:58,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 966/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 1.0097095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:58,151 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43596 samples/s/p 2:15:44 } +2024-07-25 22:56:01,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 968/ 1625], loss: 1.263, per_step_time: 1470ms, lr: 1.0091317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:01,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.44198 samples/s/p 2:15:32 } +2024-07-25 22:56:04,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 970/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 1.0085536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:04,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.43302 samples/s/p 2:15:42 } +2024-07-25 22:56:07,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 972/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.0079756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:07,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.43513 samples/s/p 2:15:36 } +2024-07-25 22:56:09,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 974/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.0073981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:09,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.43795 samples/s/p 2:15:29 } +2024-07-25 22:56:12,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 976/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 1.00682055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:12,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% 
|█████████████████████████████████ | 5.43479 samples/s/p 2:15:31 } +2024-07-25 22:56:15,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 978/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 1.0062429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:15,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.43699 samples/s/p 2:15:25 } +2024-07-25 22:56:18,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 980/ 1625], loss: 0.984, per_step_time: 1472ms, lr: 1.0056654e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:18,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.43440 samples/s/p 2:15:26 } +2024-07-25 22:56:21,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 982/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 1.0050881e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:21,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.43193 samples/s/p 2:15:26 } +2024-07-25 22:56:24,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 984/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 1.0045107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:24,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43523 samples/s/p 2:15:18 } +2024-07-25 22:56:27,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 986/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 1.0039336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:27,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43506 samples/s/p 2:15:16 } 
+2024-07-25 22:56:30,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 988/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 1.0033567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:30,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43340 samples/s/p 2:15:15 } +2024-07-25 22:56:33,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 990/ 1625], loss: 1.237, per_step_time: 1473ms, lr: 1.0027797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:33,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43022 samples/s/p 2:15:17 } +2024-07-25 22:56:36,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 992/ 1625], loss: 1.053, per_step_time: 1473ms, lr: 1.00220295e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:36,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43090 samples/s/p 2:15:13 } +2024-07-25 22:56:39,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 994/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 1.00162615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:39,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43117 samples/s/p 2:15:10 } +2024-07-25 22:56:42,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 996/ 1625], loss: 1.059, per_step_time: 1471ms, lr: 1.00104935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:42,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43768 samples/s/p 2:14:57 } +2024-07-25 22:56:45,370 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 998/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 1.0004731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:45,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43525 samples/s/p 2:14:58 } +2024-07-25 22:56:48,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1000/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 9.998966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:48,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43785 samples/s/p 2:14:51 } +2024-07-25 22:56:51,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1002/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 9.993204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:51,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.44088 samples/s/p 2:14:43 } +2024-07-25 22:56:54,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1004/ 1625], loss: 1.277, per_step_time: 1471ms, lr: 9.9874405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:54,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43746 samples/s/p 2:14:46 } +2024-07-25 22:56:57,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1006/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 9.981681e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:57,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43666 samples/s/p 2:14:44 } +2024-07-25 22:57:00,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
7/ 10], step:[ 1008/ 1625], loss: 1.092, per_step_time: 1473ms, lr: 9.975919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:00,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.42984 samples/s/p 2:14:51 } +2024-07-25 22:57:03,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1010/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 9.970159e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:03,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43484 samples/s/p 2:14:41 } +2024-07-25 22:57:06,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1012/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 9.964402e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:06,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43984 samples/s/p 2:14:30 } +2024-07-25 22:57:08,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1014/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 9.958644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:08,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43468 samples/s/p 2:14:35 } +2024-07-25 22:57:11,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1016/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 9.952889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:11,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43763 samples/s/p 2:14:28 } +2024-07-25 22:57:14,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1018/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 
9.9471345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:14,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43673 samples/s/p 2:14:26 } +2024-07-25 22:57:17,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1020/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 9.941381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:17,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43592 samples/s/p 2:14:24 } +2024-07-25 22:57:20,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1022/ 1625], loss: 1.217, per_step_time: 1470ms, lr: 9.935626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:20,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43927 samples/s/p 2:14:16 } +2024-07-25 22:57:23,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1024/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 9.929874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:23,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43276 samples/s/p 2:14:23 } +2024-07-25 22:57:26,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1026/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 9.924124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:26,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43392 samples/s/p 2:14:19 } +2024-07-25 22:57:29,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1028/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 9.918373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:57:29,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43293 samples/s/p 2:14:17 } +2024-07-25 22:57:32,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1030/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 9.9126255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:32,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43747 samples/s/p 2:14:07 } +2024-07-25 22:57:35,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1032/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 9.906877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:35,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43096 samples/s/p 2:14:14 } +2024-07-25 22:57:38,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1034/ 1625], loss: 1.413, per_step_time: 1471ms, lr: 9.901129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:38,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43579 samples/s/p 2:14:04 } +2024-07-25 22:57:41,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1036/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 9.895383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:41,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43824 samples/s/p 2:13:57 } +2024-07-25 22:57:44,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1038/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 9.88964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:44,379 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 66.4% |█████████████████████████████████ | 5.43455 samples/s/p 2:14:00 } +2024-07-25 22:57:47,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1040/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 9.883894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:47,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43413 samples/s/p 2:13:58 } +2024-07-25 22:57:50,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1042/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 9.878152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:50,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43712 samples/s/p 2:13:50 } +2024-07-25 22:57:53,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1044/ 1625], loss: 1.017, per_step_time: 1472ms, lr: 9.872412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:53,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43260 samples/s/p 2:13:54 } +2024-07-25 22:57:56,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1046/ 1625], loss: 1.119, per_step_time: 1473ms, lr: 9.866669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:56,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.42843 samples/s/p 2:13:57 } +2024-07-25 22:57:59,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1048/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 9.860931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:59,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43272 samples/s/p 
2:13:48 } +2024-07-25 22:58:02,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1050/ 1625], loss: 0.856, per_step_time: 1471ms, lr: 9.855194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:02,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43831 samples/s/p 2:13:37 } +2024-07-25 22:58:05,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1052/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 9.849455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:05,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43783 samples/s/p 2:13:34 } +2024-07-25 22:58:07,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1054/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 9.843717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:07,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43320 samples/s/p 2:13:38 } +2024-07-25 22:58:10,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1056/ 1625], loss: 1.144, per_step_time: 1469ms, lr: 9.837982e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:10,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.44247 samples/s/p 2:13:22 } +2024-07-25 22:58:13,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1058/ 1625], loss: 1.321, per_step_time: 1472ms, lr: 9.83225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:13,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43233 samples/s/p 2:13:34 } +2024-07-25 22:58:16,839 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1060/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 9.826515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:16,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43418 samples/s/p 2:13:28 } +2024-07-25 22:58:19,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1062/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 9.820782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:19,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43311 samples/s/p 2:13:27 } +2024-07-25 22:58:22,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1064/ 1625], loss: 1.202, per_step_time: 1472ms, lr: 9.815052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:22,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43196 samples/s/p 2:13:25 } +2024-07-25 22:58:25,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1066/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 9.8093205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:25,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.44114 samples/s/p 2:13:09 } +2024-07-25 22:58:28,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1068/ 1625], loss: 1.151, per_step_time: 1475ms, lr: 9.803592e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:28,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.42301 samples/s/p 2:13:33 } +2024-07-25 22:58:31,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
7/ 10], step:[ 1070/ 1625], loss: 1.212, per_step_time: 1472ms, lr: 9.797865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:31,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43342 samples/s/p 2:13:14 } +2024-07-25 22:58:34,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1072/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 9.792137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:34,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43793 samples/s/p 2:13:05 } +2024-07-25 22:58:37,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1074/ 1625], loss: 1.028, per_step_time: 1471ms, lr: 9.786411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:37,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43643 samples/s/p 2:13:04 } +2024-07-25 22:58:40,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1076/ 1625], loss: 1.238, per_step_time: 1476ms, lr: 9.780687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:40,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.41863 samples/s/p 2:13:27 } +2024-07-25 22:58:43,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1078/ 1625], loss: 0.977, per_step_time: 1471ms, lr: 9.774961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:43,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43669 samples/s/p 2:12:58 } +2024-07-25 22:58:46,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1080/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 
9.769238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:46,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43674 samples/s/p 2:12:55 } +2024-07-25 22:58:49,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1082/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 9.7635175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:49,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.43583 samples/s/p 2:12:53 } +2024-07-25 22:58:52,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1084/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 9.757795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:52,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.43755 samples/s/p 2:12:48 } +2024-07-25 22:58:55,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1086/ 1625], loss: 1.128, per_step_time: 1470ms, lr: 9.752076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:55,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.44043 samples/s/p 2:12:41 } +2024-07-25 22:58:58,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1088/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 9.74636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:58,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.43811 samples/s/p 2:12:41 } +2024-07-25 22:59:01,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1090/ 1625], loss: 1.035, per_step_time: 1470ms, lr: 9.74064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:59:01,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.44159 samples/s/p 2:12:33 } +2024-07-25 22:59:04,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1092/ 1625], loss: 0.914, per_step_time: 1470ms, lr: 9.734924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:04,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.44117 samples/s/p 2:12:31 } +2024-07-25 22:59:07,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1094/ 1625], loss: 1.004, per_step_time: 1471ms, lr: 9.72921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:07,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.43816 samples/s/p 2:12:32 } +2024-07-25 22:59:09,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1096/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 9.723492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:09,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.43463 samples/s/p 2:12:34 } +2024-07-25 22:59:12,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1098/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 9.71778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:12,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.43114 samples/s/p 2:12:37 } +2024-07-25 22:59:15,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1100/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 9.712069e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:15,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 66.8% |█████████████████████████████████ | 5.43417 samples/s/p 2:12:29 } +2024-07-25 22:59:18,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1102/ 1625], loss: 1.088, per_step_time: 1473ms, lr: 9.706359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:18,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.43024 samples/s/p 2:12:32 } +2024-07-25 22:59:21,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1104/ 1625], loss: 1.245, per_step_time: 1474ms, lr: 9.700648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:21,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.42607 samples/s/p 2:12:35 } +2024-07-25 22:59:24,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1106/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 9.694939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:24,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.42971 samples/s/p 2:12:27 } +2024-07-25 22:59:27,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1108/ 1625], loss: 1.100, per_step_time: 1475ms, lr: 9.689233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:27,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.42211 samples/s/p 2:12:35 } +2024-07-25 22:59:30,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1110/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 9.683524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:30,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.43450 samples/s/p 2:12:14 } 
+2024-07-25 22:59:33,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1112/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 9.677818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:33,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.43428 samples/s/p 2:12:11 } +2024-07-25 22:59:36,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1114/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 9.672114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:36,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43757 samples/s/p 2:12:04 } +2024-07-25 22:59:39,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1116/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 9.66641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:39,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43654 samples/s/p 2:12:02 } +2024-07-25 22:59:42,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1118/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 9.660708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:42,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43567 samples/s/p 2:12:01 } +2024-07-25 22:59:45,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1120/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 9.655007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:45,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43738 samples/s/p 2:11:55 } +2024-07-25 22:59:48,331 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1122/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 9.649304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:48,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43574 samples/s/p 2:11:55 } +2024-07-25 22:59:51,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1124/ 1625], loss: 1.076, per_step_time: 1470ms, lr: 9.643607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:51,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43892 samples/s/p 2:11:47 } +2024-07-25 22:59:54,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1126/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 9.637908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:54,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.42868 samples/s/p 2:11:59 } +2024-07-25 22:59:57,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1128/ 1625], loss: 1.062, per_step_time: 1474ms, lr: 9.632209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:57,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.42659 samples/s/p 2:11:59 } +2024-07-25 23:00:00,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1130/ 1625], loss: 1.277, per_step_time: 1472ms, lr: 9.626515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:00,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43116 samples/s/p 2:11:49 } +2024-07-25 23:00:03,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
7/ 10], step:[ 1132/ 1625], loss: 1.204, per_step_time: 1470ms, lr: 9.620821e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:03,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43924 samples/s/p 2:11:35 } +2024-07-25 23:00:06,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1134/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 9.615126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:06,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43184 samples/s/p 2:11:43 } +2024-07-25 23:00:08,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1136/ 1625], loss: 1.150, per_step_time: 1474ms, lr: 9.609432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:09,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.42698 samples/s/p 2:11:47 } +2024-07-25 23:00:11,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1138/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 9.603742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:11,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43791 samples/s/p 2:11:28 } +2024-07-25 23:00:14,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1140/ 1625], loss: 0.999, per_step_time: 1471ms, lr: 9.5980495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:14,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43674 samples/s/p 2:11:27 } +2024-07-25 23:00:17,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1142/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 
9.592361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:17,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43588 samples/s/p 2:11:25 } +2024-07-25 23:00:20,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1144/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 9.586673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:20,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43126 samples/s/p 2:11:29 } +2024-07-25 23:00:23,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1146/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 9.580984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:23,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.42983 samples/s/p 2:11:28 } +2024-07-25 23:00:26,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1148/ 1625], loss: 1.032, per_step_time: 1471ms, lr: 9.5752985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:26,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.43782 samples/s/p 2:11:13 } +2024-07-25 23:00:29,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1150/ 1625], loss: 1.355, per_step_time: 1470ms, lr: 9.569613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:29,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.43886 samples/s/p 2:11:09 } +2024-07-25 23:00:32,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1152/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 9.563931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:00:32,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.43036 samples/s/p 2:11:18 } +2024-07-25 23:00:35,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1154/ 1625], loss: 1.064, per_step_time: 1470ms, lr: 9.558246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:35,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.44212 samples/s/p 2:10:58 } +2024-07-25 23:00:38,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1156/ 1625], loss: 0.959, per_step_time: 1473ms, lr: 9.552564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:38,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.42920 samples/s/p 2:11:14 } +2024-07-25 23:00:41,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1158/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 9.546885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:41,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.43234 samples/s/p 2:11:06 } +2024-07-25 23:00:44,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1160/ 1625], loss: 1.109, per_step_time: 1473ms, lr: 9.541203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:44,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.42824 samples/s/p 2:11:09 } +2024-07-25 23:00:47,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1162/ 1625], loss: 1.097, per_step_time: 1470ms, lr: 9.535527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:47,364 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 67.2% |█████████████████████████████████ | 5.43945 samples/s/p 2:10:50 } +2024-07-25 23:00:50,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1164/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 9.529848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:50,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43386 samples/s/p 2:10:55 } +2024-07-25 23:00:53,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1166/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 9.52417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:53,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43157 samples/s/p 2:10:56 } +2024-07-25 23:00:56,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1168/ 1625], loss: 1.204, per_step_time: 1473ms, lr: 9.518497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:56,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.42816 samples/s/p 2:10:58 } +2024-07-25 23:00:59,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1170/ 1625], loss: 1.179, per_step_time: 1469ms, lr: 9.5128225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:59,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.44222 samples/s/p 2:10:35 } +2024-07-25 23:01:02,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1172/ 1625], loss: 1.204, per_step_time: 1470ms, lr: 9.507149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:02,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43869 samples/s/p 
2:10:37 } +2024-07-25 23:01:05,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1174/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 9.5014775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:05,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43566 samples/s/p 2:10:38 } +2024-07-25 23:01:08,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1176/ 1625], loss: 0.935, per_step_time: 1468ms, lr: 9.495808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:08,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.44634 samples/s/p 2:10:20 } +2024-07-25 23:01:10,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1178/ 1625], loss: 1.361, per_step_time: 1472ms, lr: 9.490135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:10,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43418 samples/s/p 2:10:34 } +2024-07-25 23:01:13,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1180/ 1625], loss: 1.244, per_step_time: 1471ms, lr: 9.484467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:13,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43530 samples/s/p 2:10:30 } +2024-07-25 23:01:16,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1182/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 9.478801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:16,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43513 samples/s/p 2:10:27 } +2024-07-25 23:01:19,821 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1184/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 9.473134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:19,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43033 samples/s/p 2:10:31 } +2024-07-25 23:01:22,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1186/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 9.46747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:22,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43566 samples/s/p 2:10:20 } +2024-07-25 23:01:25,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1188/ 1625], loss: 1.081, per_step_time: 1470ms, lr: 9.461806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:25,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43920 samples/s/p 2:10:12 } +2024-07-25 23:01:28,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1190/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 9.45614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:28,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43267 samples/s/p 2:10:19 } +2024-07-25 23:01:31,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1192/ 1625], loss: 1.165, per_step_time: 1475ms, lr: 9.450478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:31,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.42320 samples/s/p 2:10:30 } +2024-07-25 23:01:34,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 
10], step:[ 1194/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 9.4448205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:34,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.42866 samples/s/p 2:10:19 } +2024-07-25 23:01:37,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1196/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 9.439157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:37,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43654 samples/s/p 2:10:04 } +2024-07-25 23:01:40,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1198/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 9.433498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:40,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43606 samples/s/p 2:10:02 } +2024-07-25 23:01:43,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1200/ 1625], loss: 1.250, per_step_time: 1475ms, lr: 9.427843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:43,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.42235 samples/s/p 2:10:19 } +2024-07-25 23:01:46,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1202/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 9.422187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:46,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43510 samples/s/p 2:09:58 } +2024-07-25 23:01:49,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1204/ 1625], loss: 1.308, per_step_time: 1471ms, lr: 
9.416531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:49,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43646 samples/s/p 2:09:53 } +2024-07-25 23:01:52,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1206/ 1625], loss: 1.291, per_step_time: 1473ms, lr: 9.410877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:52,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.42919 samples/s/p 2:10:00 } +2024-07-25 23:01:55,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1208/ 1625], loss: 0.939, per_step_time: 1472ms, lr: 9.405225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:55,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43315 samples/s/p 2:09:52 } +2024-07-25 23:01:58,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1210/ 1625], loss: 0.981, per_step_time: 1471ms, lr: 9.399572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:58,200 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43576 samples/s/p 2:09:45 } +2024-07-25 23:02:01,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1212/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 9.393922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:01,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43536 samples/s/p 2:09:43 } +2024-07-25 23:02:04,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1214/ 1625], loss: 1.097, per_step_time: 1470ms, lr: 9.388271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:02:04,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.44164 samples/s/p 2:09:31 } +2024-07-25 23:02:07,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1216/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 9.382622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:07,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43453 samples/s/p 2:09:38 } +2024-07-25 23:02:09,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1218/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 9.376975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:09,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.44184 samples/s/p 2:09:25 } +2024-07-25 23:02:12,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1220/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 9.371329e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:12,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43803 samples/s/p 2:09:27 } +2024-07-25 23:02:15,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1222/ 1625], loss: 1.106, per_step_time: 1470ms, lr: 9.365684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:15,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43933 samples/s/p 2:09:22 } +2024-07-25 23:02:18,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1224/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 9.36004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:18,845 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 67.5% |█████████████████████████████████ | 5.43606 samples/s/p 2:09:24 } +2024-07-25 23:02:21,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1226/ 1625], loss: 0.925, per_step_time: 1471ms, lr: 9.354397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:21,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43670 samples/s/p 2:09:20 } +2024-07-25 23:02:24,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1228/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 9.348755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:24,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43955 samples/s/p 2:09:13 } +2024-07-25 23:02:27,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1230/ 1625], loss: 0.979, per_step_time: 1469ms, lr: 9.3431145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:27,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.44333 samples/s/p 2:09:05 } +2024-07-25 23:02:30,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1232/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 9.337477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:30,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43983 samples/s/p 2:09:07 } +2024-07-25 23:02:33,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1234/ 1625], loss: 1.056, per_step_time: 1472ms, lr: 9.331837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:33,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43137 samples/s/p 
2:09:16 } +2024-07-25 23:02:36,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1236/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 9.326199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:36,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43207 samples/s/p 2:09:12 } +2024-07-25 23:02:39,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1238/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 9.320565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:39,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43186 samples/s/p 2:09:09 } +2024-07-25 23:02:42,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1240/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 9.314927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:42,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43538 samples/s/p 2:09:01 } +2024-07-25 23:02:45,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1242/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 9.309294e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:45,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43205 samples/s/p 2:09:03 } +2024-07-25 23:02:48,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1244/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 9.303664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:48,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43617 samples/s/p 2:08:54 } +2024-07-25 23:02:51,301 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1246/ 1625], loss: 1.291, per_step_time: 1472ms, lr: 9.29803e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:51,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43236 samples/s/p 2:08:57 } +2024-07-25 23:02:54,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1248/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 9.292402e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:54,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43743 samples/s/p 2:08:47 } +2024-07-25 23:02:57,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1250/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 9.286772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:57,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43644 samples/s/p 2:08:45 } +2024-07-25 23:03:00,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1252/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 9.281144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:00,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43054 samples/s/p 2:08:51 } +2024-07-25 23:03:03,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1254/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 9.275517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:03,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43906 samples/s/p 2:08:36 } +2024-07-25 23:03:06,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
7/ 10], step:[ 1256/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 9.269891e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:06,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.44018 samples/s/p 2:08:31 } +2024-07-25 23:03:09,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1258/ 1625], loss: 1.270, per_step_time: 1473ms, lr: 9.264267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:09,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.42914 samples/s/p 2:08:44 } +2024-07-25 23:03:11,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1260/ 1625], loss: 1.134, per_step_time: 1470ms, lr: 9.258643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:11,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.44013 samples/s/p 2:08:25 } +2024-07-25 23:03:14,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1262/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 9.25302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:14,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43234 samples/s/p 2:08:33 } +2024-07-25 23:03:17,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1264/ 1625], loss: 1.306, per_step_time: 1470ms, lr: 9.247399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:17,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43880 samples/s/p 2:08:21 } +2024-07-25 23:03:20,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1266/ 1625], loss: 1.116, per_step_time: 1470ms, lr: 
9.2417795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:20,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.44025 samples/s/p 2:08:16 } +2024-07-25 23:03:23,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1268/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 9.236161e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:23,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43399 samples/s/p 2:08:22 } +2024-07-25 23:03:26,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1270/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 9.230546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:26,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43450 samples/s/p 2:08:18 } +2024-07-25 23:03:29,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1272/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 9.2249265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:29,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43774 samples/s/p 2:08:11 } +2024-07-25 23:03:32,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1274/ 1625], loss: 1.331, per_step_time: 1470ms, lr: 9.21931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:32,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43860 samples/s/p 2:08:07 } +2024-07-25 23:03:35,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1276/ 1625], loss: 1.114, per_step_time: 1473ms, lr: 9.2137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:03:35,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.42819 samples/s/p 2:08:19 } +2024-07-25 23:03:38,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1278/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 9.208084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:38,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43440 samples/s/p 2:08:07 } +2024-07-25 23:03:41,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1280/ 1625], loss: 1.120, per_step_time: 1470ms, lr: 9.202471e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:41,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43970 samples/s/p 2:07:56 } +2024-07-25 23:03:44,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1282/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 9.196864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:44,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43567 samples/s/p 2:07:59 } +2024-07-25 23:03:47,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1284/ 1625], loss: 1.076, per_step_time: 1472ms, lr: 9.191251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:47,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43419 samples/s/p 2:07:58 } +2024-07-25 23:03:50,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1286/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 9.1856455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:50,311 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 67.9% |█████████████████████████████████ | 5.43417 samples/s/p 2:07:55 } +2024-07-25 23:03:53,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1288/ 1625], loss: 1.146, per_step_time: 1475ms, lr: 9.180038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:53,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.42172 samples/s/p 2:08:10 } +2024-07-25 23:03:56,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1290/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 9.174429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:56,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43169 samples/s/p 2:07:53 } +2024-07-25 23:03:59,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1292/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 9.168827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:59,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.43209 samples/s/p 2:07:49 } +2024-07-25 23:04:02,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1294/ 1625], loss: 1.087, per_step_time: 1473ms, lr: 9.163223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:02,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.42877 samples/s/p 2:07:51 } +2024-07-25 23:04:05,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1296/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 9.157618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:05,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.43626 samples/s/p 
2:07:38 } +2024-07-25 23:04:08,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1298/ 1625], loss: 1.007, per_step_time: 1470ms, lr: 9.152019e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:08,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.43888 samples/s/p 2:07:31 } +2024-07-25 23:04:10,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1300/ 1625], loss: 1.401, per_step_time: 1471ms, lr: 9.146418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:10,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43738 samples/s/p 2:07:30 } +2024-07-25 23:04:13,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1302/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 9.140819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:13,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43611 samples/s/p 2:07:29 } +2024-07-25 23:04:16,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1304/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 9.13522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:16,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43489 samples/s/p 2:07:28 } +2024-07-25 23:04:19,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1306/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 9.129623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:19,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43430 samples/s/p 2:07:26 } +2024-07-25 23:04:22,783 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1308/ 1625], loss: 0.967, per_step_time: 1472ms, lr: 9.124028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:22,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43119 samples/s/p 2:07:27 } +2024-07-25 23:04:25,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1310/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 9.118434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:25,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.44013 samples/s/p 2:07:12 } +2024-07-25 23:04:28,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1312/ 1625], loss: 1.311, per_step_time: 1472ms, lr: 9.112841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:28,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43316 samples/s/p 2:07:19 } +2024-07-25 23:04:31,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1314/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 9.107252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:31,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43780 samples/s/p 2:07:09 } +2024-07-25 23:04:34,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1316/ 1625], loss: 1.073, per_step_time: 1472ms, lr: 9.101657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:34,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43284 samples/s/p 2:07:13 } +2024-07-25 23:04:37,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 1318/ 1625], loss: 1.202, per_step_time: 1470ms, lr: 9.0960675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:37,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43905 samples/s/p 2:07:01 } +2024-07-25 23:04:40,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1320/ 1625], loss: 1.109, per_step_time: 1474ms, lr: 9.090482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:40,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.42403 samples/s/p 2:07:20 } +2024-07-25 23:04:43,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1322/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 9.084893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:43,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43510 samples/s/p 2:07:01 } +2024-07-25 23:04:46,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1324/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 9.079306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:46,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43154 samples/s/p 2:07:03 } +2024-07-25 23:04:49,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1326/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 9.073725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:49,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43550 samples/s/p 2:06:55 } +2024-07-25 23:04:52,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1328/ 1625], loss: 1.125, per_step_time: 
1472ms, lr: 9.068137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:52,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43233 samples/s/p 2:06:56 } +2024-07-25 23:04:55,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1330/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 9.062558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:55,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43600 samples/s/p 2:06:48 } +2024-07-25 23:04:58,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1332/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 9.056976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:58,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.44061 samples/s/p 2:06:39 } +2024-07-25 23:05:01,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1334/ 1625], loss: 1.368, per_step_time: 1471ms, lr: 9.051393e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:01,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43538 samples/s/p 2:06:43 } +2024-07-25 23:05:04,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1336/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 9.045816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:04,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43736 samples/s/p 2:06:37 } +2024-07-25 23:05:07,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1338/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 9.040239e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:05:07,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43101 samples/s/p 2:06:43 } +2024-07-25 23:05:10,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1340/ 1625], loss: 0.975, per_step_time: 1472ms, lr: 9.034659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:10,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43456 samples/s/p 2:06:35 } +2024-07-25 23:05:12,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1342/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 9.029087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:12,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43648 samples/s/p 2:06:30 } +2024-07-25 23:05:15,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1344/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 9.023513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:15,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43378 samples/s/p 2:06:31 } +2024-07-25 23:05:18,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1346/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 9.017939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:18,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43828 samples/s/p 2:06:21 } +2024-07-25 23:05:21,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1348/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 9.012367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:21,802 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43539 samples/s/p 2:06:22 } +2024-07-25 23:05:24,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1350/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 9.006797e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:24,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43787 samples/s/p 2:06:16 } +2024-07-25 23:05:27,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1352/ 1625], loss: 1.252, per_step_time: 1470ms, lr: 9.001227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:27,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.44002 samples/s/p 2:06:10 } +2024-07-25 23:05:30,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1354/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 8.995658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:30,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.42932 samples/s/p 2:06:22 } +2024-07-25 23:05:33,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1356/ 1625], loss: 1.074, per_step_time: 1474ms, lr: 8.990091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:33,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.42553 samples/s/p 2:06:24 } +2024-07-25 23:05:36,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1358/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 8.984529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:36,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% 
|██████████████████████████████████ | 5.43157 samples/s/p 2:06:13 } +2024-07-25 23:05:39,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1360/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 8.978961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:39,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.44063 samples/s/p 2:05:57 } +2024-07-25 23:05:42,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1362/ 1625], loss: 1.137, per_step_time: 1470ms, lr: 8.973397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:42,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.43851 samples/s/p 2:05:57 } +2024-07-25 23:05:45,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1364/ 1625], loss: 0.968, per_step_time: 1474ms, lr: 8.967838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:45,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.42696 samples/s/p 2:06:11 } +2024-07-25 23:05:48,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1366/ 1625], loss: 1.122, per_step_time: 1473ms, lr: 8.962274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:48,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.43041 samples/s/p 2:06:03 } +2024-07-25 23:05:51,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1368/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 8.956715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:51,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.43526 samples/s/p 2:05:53 } 
+2024-07-25 23:05:54,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1370/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 8.951159e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:54,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.43882 samples/s/p 2:05:45 } +2024-07-25 23:05:57,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1372/ 1625], loss: 1.034, per_step_time: 1468ms, lr: 8.945599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:57,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.44802 samples/s/p 2:05:30 } +2024-07-25 23:06:00,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1374/ 1625], loss: 0.906, per_step_time: 1471ms, lr: 8.940045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:00,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43753 samples/s/p 2:05:41 } +2024-07-25 23:06:03,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1376/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 8.93449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:03,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43633 samples/s/p 2:05:40 } +2024-07-25 23:06:06,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1378/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 8.928933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:06,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43189 samples/s/p 2:05:43 } +2024-07-25 23:06:09,017 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1380/ 1625], loss: 1.162, per_step_time: 1473ms, lr: 8.923384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:09,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.42995 samples/s/p 2:05:43 } +2024-07-25 23:06:11,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1382/ 1625], loss: 1.143, per_step_time: 1474ms, lr: 8.917832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:11,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.42687 samples/s/p 2:05:44 } +2024-07-25 23:06:14,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1384/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 8.912279e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:14,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43165 samples/s/p 2:05:35 } +2024-07-25 23:06:17,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1386/ 1625], loss: 1.258, per_step_time: 1473ms, lr: 8.906733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:17,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43032 samples/s/p 2:05:33 } +2024-07-25 23:06:20,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1388/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 8.9011855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:20,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43816 samples/s/p 2:05:20 } +2024-07-25 23:06:23,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 1390/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 8.8956385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:23,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43960 samples/s/p 2:05:15 } +2024-07-25 23:06:26,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1392/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 8.890093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:26,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43682 samples/s/p 2:05:16 } +2024-07-25 23:06:29,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1394/ 1625], loss: 1.212, per_step_time: 1472ms, lr: 8.884548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:29,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43397 samples/s/p 2:05:17 } +2024-07-25 23:06:32,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1396/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 8.879007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:32,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43700 samples/s/p 2:05:10 } +2024-07-25 23:06:35,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1398/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 8.873465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:35,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.42926 samples/s/p 2:05:17 } +2024-07-25 23:06:38,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1400/ 1625], loss: 1.202, per_step_time: 
1470ms, lr: 8.8679235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:38,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.44007 samples/s/p 2:04:59 } +2024-07-25 23:06:41,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1402/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 8.862388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:41,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.42897 samples/s/p 2:05:12 } +2024-07-25 23:06:44,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1404/ 1625], loss: 1.314, per_step_time: 1472ms, lr: 8.856847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:44,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43132 samples/s/p 2:05:06 } +2024-07-25 23:06:47,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1406/ 1625], loss: 0.921, per_step_time: 1470ms, lr: 8.851311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:47,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.44075 samples/s/p 2:04:50 } +2024-07-25 23:06:50,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1408/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 8.845777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:50,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.43897 samples/s/p 2:04:49 } +2024-07-25 23:06:53,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1410/ 1625], loss: 1.035, per_step_time: 1473ms, lr: 8.840241e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:06:53,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.42750 samples/s/p 2:05:02 } +2024-07-25 23:06:56,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1412/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 8.834708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:56,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.43793 samples/s/p 2:04:45 } +2024-07-25 23:06:59,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1414/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 8.829178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:59,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.42946 samples/s/p 2:04:53 } +2024-07-25 23:07:02,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1416/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 8.823646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:02,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.43693 samples/s/p 2:04:40 } +2024-07-25 23:07:05,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1418/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 8.81812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:05,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.43740 samples/s/p 2:04:37 } +2024-07-25 23:07:08,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1420/ 1625], loss: 1.044, per_step_time: 1470ms, lr: 8.81259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:08,039 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.44058 samples/s/p 2:04:29 } +2024-07-25 23:07:10,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1422/ 1625], loss: 1.141, per_step_time: 1469ms, lr: 8.80706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:10,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.44302 samples/s/p 2:04:23 } +2024-07-25 23:07:13,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1424/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 8.801538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:13,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43182 samples/s/p 2:04:35 } +2024-07-25 23:07:16,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1426/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 8.796013e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:16,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.44171 samples/s/p 2:04:19 } +2024-07-25 23:07:19,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1428/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 8.79049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:19,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43958 samples/s/p 2:04:19 } +2024-07-25 23:07:22,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1430/ 1625], loss: 1.459, per_step_time: 1470ms, lr: 8.7849685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:22,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% 
|██████████████████████████████████ | 5.43961 samples/s/p 2:04:16 } +2024-07-25 23:07:25,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1432/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 8.779447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:25,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43766 samples/s/p 2:04:16 } +2024-07-25 23:07:28,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1434/ 1625], loss: 1.256, per_step_time: 1473ms, lr: 8.773927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:28,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43019 samples/s/p 2:04:23 } +2024-07-25 23:07:31,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1436/ 1625], loss: 1.156, per_step_time: 1473ms, lr: 8.76841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:31,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43043 samples/s/p 2:04:20 } +2024-07-25 23:07:34,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1438/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 8.762892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:34,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43380 samples/s/p 2:04:12 } +2024-07-25 23:07:37,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1440/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 8.757377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:37,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43380 samples/s/p 2:04:09 } 
+2024-07-25 23:07:40,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1442/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 8.751863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:40,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43126 samples/s/p 2:04:10 } +2024-07-25 23:07:43,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1444/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 8.746349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:43,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43297 samples/s/p 2:04:04 } +2024-07-25 23:07:46,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1446/ 1625], loss: 1.224, per_step_time: 1471ms, lr: 8.740837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:46,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43764 samples/s/p 2:03:55 } +2024-07-25 23:07:49,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1448/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 8.7353255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:49,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43021 samples/s/p 2:04:02 } +2024-07-25 23:07:52,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1450/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 8.729817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:52,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43692 samples/s/p 2:03:50 } +2024-07-25 23:07:52,300 - 
mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-25 23:08:28,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1452/ 1625], loss: 1.025, per_step_time: 1578ms, lr: 8.724312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:28,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.06854 samples/s/p 2:12:47 } +2024-07-25 23:08:31,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1454/ 1625], loss: 1.010, per_step_time: 1471ms, lr: 8.718801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:31,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43528 samples/s/p 2:03:47 } +2024-07-25 23:08:34,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1456/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 8.713299e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:34,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.42793 samples/s/p 2:03:54 } +2024-07-25 23:08:37,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1458/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 8.707794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:37,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.44165 samples/s/p 2:03:32 } +2024-07-25 23:08:40,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1460/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 8.702288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:40,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.44010 
samples/s/p 2:03:31 } +2024-07-25 23:08:43,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1462/ 1625], loss: 0.991, per_step_time: 1471ms, lr: 8.696789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:43,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.43793 samples/s/p 2:03:31 } +2024-07-25 23:08:46,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1464/ 1625], loss: 1.277, per_step_time: 1477ms, lr: 8.691288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:46,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.41288 samples/s/p 2:04:02 } +2024-07-25 23:08:49,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1466/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 8.685786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:49,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.43545 samples/s/p 2:03:29 } +2024-07-25 23:08:52,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1468/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 8.680291e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:52,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.43568 samples/s/p 2:03:25 } +2024-07-25 23:08:55,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1470/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 8.674794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:55,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.43589 samples/s/p 2:03:22 } +2024-07-25 23:08:58,300 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1472/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 8.669298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:58,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43599 samples/s/p 2:03:19 } +2024-07-25 23:09:01,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1474/ 1625], loss: 1.186, per_step_time: 1473ms, lr: 8.663804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:01,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.42914 samples/s/p 2:03:25 } +2024-07-25 23:09:04,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1476/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 8.658311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:04,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43472 samples/s/p 2:03:15 } +2024-07-25 23:09:07,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1478/ 1625], loss: 1.037, per_step_time: 1472ms, lr: 8.652818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:07,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43437 samples/s/p 2:03:12 } +2024-07-25 23:09:10,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1480/ 1625], loss: 1.177, per_step_time: 1474ms, lr: 8.647328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:10,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.42696 samples/s/p 2:03:20 } +2024-07-25 23:09:13,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 1482/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 8.641839e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:13,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.42862 samples/s/p 2:03:14 } +2024-07-25 23:09:16,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1484/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 8.63635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:16,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43259 samples/s/p 2:03:06 } +2024-07-25 23:09:18,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1486/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 8.630864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:18,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43667 samples/s/p 2:02:58 } +2024-07-25 23:09:21,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1488/ 1625], loss: 0.997, per_step_time: 1471ms, lr: 8.625377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:21,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43563 samples/s/p 2:02:56 } +2024-07-25 23:09:24,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1490/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 8.619893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:24,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43112 samples/s/p 2:02:59 } +2024-07-25 23:09:27,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1492/ 1625], loss: 1.212, per_step_time: 
1471ms, lr: 8.614409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:27,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43825 samples/s/p 2:02:47 } +2024-07-25 23:09:30,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1494/ 1625], loss: 0.945, per_step_time: 1474ms, lr: 8.6089285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:30,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.42585 samples/s/p 2:03:00 } +2024-07-25 23:09:33,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1496/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 8.603447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:33,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43586 samples/s/p 2:02:44 } +2024-07-25 23:09:36,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1498/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 8.597967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:36,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43445 samples/s/p 2:02:43 } +2024-07-25 23:09:39,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1500/ 1625], loss: 1.192, per_step_time: 1469ms, lr: 8.592493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:39,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.44304 samples/s/p 2:02:28 } +2024-07-25 23:09:42,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1502/ 1625], loss: 1.362, per_step_time: 1471ms, lr: 8.587017e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:09:42,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43520 samples/s/p 2:02:36 } +2024-07-25 23:09:45,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1504/ 1625], loss: 1.001, per_step_time: 1470ms, lr: 8.581538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:45,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.43850 samples/s/p 2:02:29 } +2024-07-25 23:09:48,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1506/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 8.576068e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:48,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.43659 samples/s/p 2:02:28 } +2024-07-25 23:09:51,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1508/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 8.570594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:51,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.43091 samples/s/p 2:02:33 } +2024-07-25 23:09:54,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1510/ 1625], loss: 1.236, per_step_time: 1474ms, lr: 8.565119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:54,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.42581 samples/s/p 2:02:37 } +2024-07-25 23:09:57,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1512/ 1625], loss: 1.259, per_step_time: 1473ms, lr: 8.559652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:57,342 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.42851 samples/s/p 2:02:30 } +2024-07-25 23:10:00,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1514/ 1625], loss: 0.986, per_step_time: 1469ms, lr: 8.554183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:00,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.44424 samples/s/p 2:02:06 } +2024-07-25 23:10:03,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1516/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 8.548715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:03,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.43871 samples/s/p 2:02:11 } +2024-07-25 23:10:06,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1518/ 1625], loss: 1.097, per_step_time: 1470ms, lr: 8.543249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:06,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.43870 samples/s/p 2:02:08 } +2024-07-25 23:10:09,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1520/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 8.537784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:09,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.44105 samples/s/p 2:02:02 } +2024-07-25 23:10:12,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1522/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 8.532321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:12,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% 
|██████████████████████████████████ | 5.43105 samples/s/p 2:02:12 } +2024-07-25 23:10:15,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1524/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 8.5268575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:15,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43359 samples/s/p 2:02:06 } +2024-07-25 23:10:17,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1526/ 1625], loss: 1.011, per_step_time: 1471ms, lr: 8.521397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:17,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43829 samples/s/p 2:01:56 } +2024-07-25 23:10:20,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1528/ 1625], loss: 0.987, per_step_time: 1472ms, lr: 8.515936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:20,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43387 samples/s/p 2:02:00 } +2024-07-25 23:10:23,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1530/ 1625], loss: 1.117, per_step_time: 1470ms, lr: 8.5104775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:23,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43878 samples/s/p 2:01:50 } +2024-07-25 23:10:26,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1532/ 1625], loss: 1.210, per_step_time: 1471ms, lr: 8.505021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:26,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43581 samples/s/p 2:01:51 } 
+2024-07-25 23:10:29,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1534/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 8.499564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:29,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43796 samples/s/p 2:01:45 } +2024-07-25 23:10:32,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1536/ 1625], loss: 1.032, per_step_time: 1471ms, lr: 8.494109e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:32,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.43836 samples/s/p 2:01:42 } +2024-07-25 23:10:35,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1538/ 1625], loss: 1.328, per_step_time: 1473ms, lr: 8.488656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:35,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.42959 samples/s/p 2:01:51 } +2024-07-25 23:10:38,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1540/ 1625], loss: 1.013, per_step_time: 1470ms, lr: 8.483204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:38,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.44030 samples/s/p 2:01:33 } +2024-07-25 23:10:41,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1542/ 1625], loss: 1.068, per_step_time: 1473ms, lr: 8.477753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:41,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.42979 samples/s/p 2:01:44 } +2024-07-25 23:10:44,544 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1544/ 1625], loss: 0.986, per_step_time: 1471ms, lr: 8.472306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:44,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.43673 samples/s/p 2:01:32 } +2024-07-25 23:10:47,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1546/ 1625], loss: 1.187, per_step_time: 1474ms, lr: 8.4668545e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:47,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.42667 samples/s/p 2:01:43 } +2024-07-25 23:10:50,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1548/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 8.461408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:50,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.43167 samples/s/p 2:01:33 } +2024-07-25 23:10:53,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1550/ 1625], loss: 1.124, per_step_time: 1482ms, lr: 8.455965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:53,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.39681 samples/s/p 2:02:17 } +2024-07-25 23:10:56,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1552/ 1625], loss: 1.251, per_step_time: 1473ms, lr: 8.45052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:56,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.42954 samples/s/p 2:01:30 } +2024-07-25 23:10:59,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 1554/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 8.445074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:59,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43412 samples/s/p 2:01:21 } +2024-07-25 23:11:02,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1556/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 8.439636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:02,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43846 samples/s/p 2:01:12 } +2024-07-25 23:11:05,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1558/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 8.434195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:05,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43700 samples/s/p 2:01:11 } +2024-07-25 23:11:08,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1560/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 8.428756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:08,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43797 samples/s/p 2:01:07 } +2024-07-25 23:11:11,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1562/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 8.423317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:11,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43687 samples/s/p 2:01:05 } +2024-07-25 23:11:14,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1564/ 1625], loss: 1.206, per_step_time: 
1471ms, lr: 8.41788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:14,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43641 samples/s/p 2:01:03 } +2024-07-25 23:11:17,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1566/ 1625], loss: 1.008, per_step_time: 1472ms, lr: 8.412446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:17,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43250 samples/s/p 2:01:05 } +2024-07-25 23:11:19,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1568/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 8.407012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:19,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43786 samples/s/p 2:00:55 } +2024-07-25 23:11:22,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1570/ 1625], loss: 1.127, per_step_time: 1474ms, lr: 8.401578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:22,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.42719 samples/s/p 2:01:07 } +2024-07-25 23:11:25,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1572/ 1625], loss: 1.227, per_step_time: 1469ms, lr: 8.396148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:25,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.44249 samples/s/p 2:00:43 } +2024-07-25 23:11:28,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1574/ 1625], loss: 1.042, per_step_time: 1470ms, lr: 8.390716e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:11:28,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43906 samples/s/p 2:00:45 } +2024-07-25 23:11:31,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1576/ 1625], loss: 1.220, per_step_time: 1470ms, lr: 8.385287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:31,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43897 samples/s/p 2:00:42 } +2024-07-25 23:11:34,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1578/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 8.37986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:34,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43715 samples/s/p 2:00:42 } +2024-07-25 23:11:37,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1580/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 8.3744335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:37,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43741 samples/s/p 2:00:38 } +2024-07-25 23:11:40,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1582/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 8.369009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:40,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43691 samples/s/p 2:00:36 } +2024-07-25 23:11:43,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1584/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 8.363585e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:43,580 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43497 samples/s/p 2:00:36 } +2024-07-25 23:11:46,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1586/ 1625], loss: 1.240, per_step_time: 1476ms, lr: 8.358163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:46,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.41976 samples/s/p 2:00:53 } +2024-07-25 23:11:49,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1588/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 8.352746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:49,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43629 samples/s/p 2:00:28 } +2024-07-25 23:11:52,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1590/ 1625], loss: 1.150, per_step_time: 1472ms, lr: 8.347323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:52,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43401 samples/s/p 2:00:28 } +2024-07-25 23:11:55,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1592/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 8.3419045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:55,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43162 samples/s/p 2:00:28 } +2024-07-25 23:11:58,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1594/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 8.33649e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:58,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% 
|██████████████████████████████████ | 5.43046 samples/s/p 2:00:27 } +2024-07-25 23:12:01,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1596/ 1625], loss: 1.240, per_step_time: 1470ms, lr: 8.3310715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:01,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43980 samples/s/p 2:00:12 } +2024-07-25 23:12:04,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1598/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 8.325661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:04,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43479 samples/s/p 2:00:15 } +2024-07-25 23:12:07,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1600/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 8.320248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:07,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43547 samples/s/p 2:00:11 } +2024-07-25 23:12:10,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1602/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 8.314836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:10,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43732 samples/s/p 2:00:06 } +2024-07-25 23:12:13,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1604/ 1625], loss: 1.067, per_step_time: 1470ms, lr: 8.3094255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:13,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43919 samples/s/p 2:00:01 } 
+2024-07-25 23:12:16,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1606/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 8.304017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:16,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43365 samples/s/p 2:00:05 } +2024-07-25 23:12:19,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1608/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 8.298609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:19,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43043 samples/s/p 2:00:06 } +2024-07-25 23:12:21,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1610/ 1625], loss: 0.941, per_step_time: 1471ms, lr: 8.293203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:21,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43493 samples/s/p 1:59:57 } +2024-07-25 23:12:24,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1612/ 1625], loss: 1.206, per_step_time: 1470ms, lr: 8.287798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:24,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43978 samples/s/p 1:59:48 } +2024-07-25 23:12:27,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1614/ 1625], loss: 1.266, per_step_time: 1476ms, lr: 8.282394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:27,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.41695 samples/s/p 2:00:15 } +2024-07-25 23:12:30,813 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1616/ 1625], loss: 1.116, per_step_time: 1473ms, lr: 8.276991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:30,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43099 samples/s/p 1:59:54 } +2024-07-25 23:12:33,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1618/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 8.271591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:33,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.43608 samples/s/p 1:59:44 } +2024-07-25 23:12:36,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1620/ 1625], loss: 1.401, per_step_time: 1471ms, lr: 8.266191e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:36,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.43624 samples/s/p 1:59:41 } +2024-07-25 23:12:39,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1622/ 1625], loss: 1.037, per_step_time: 1470ms, lr: 8.260793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:39,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.43945 samples/s/p 1:59:34 } +2024-07-25 23:12:42,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1624/ 1625], loss: 1.285, per_step_time: 1475ms, lr: 8.255394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:42,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.42355 samples/s/p 1:59:52 } +2024-07-25 23:12:45,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 1/ 1625], loss: 1.079, per_step_time: 1471ms, lr: 8.250003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:45,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.43781 samples/s/p 1:59:30 } +2024-07-25 23:12:48,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 3/ 1625], loss: 1.046, per_step_time: 1472ms, lr: 8.244605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:48,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.43446 samples/s/p 1:59:32 } +2024-07-25 23:12:51,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 5/ 1625], loss: 1.005, per_step_time: 1472ms, lr: 8.239212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:51,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.43409 samples/s/p 1:59:29 } +2024-07-25 23:12:54,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 7/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 8.233824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:54,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.44037 samples/s/p 1:59:18 } +2024-07-25 23:12:57,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 9/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 8.2284305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:57,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43598 samples/s/p 1:59:21 } +2024-07-25 23:13:00,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 11/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 
8.223042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:00,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43775 samples/s/p 1:59:15 } +2024-07-25 23:13:03,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 13/ 1625], loss: 1.318, per_step_time: 1471ms, lr: 8.217657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:03,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43832 samples/s/p 1:59:12 } +2024-07-25 23:13:06,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 15/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 8.212267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:06,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43521 samples/s/p 1:59:13 } +2024-07-25 23:13:09,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 17/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 8.2068855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:09,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43406 samples/s/p 1:59:11 } +2024-07-25 23:13:12,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 19/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 8.201501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:12,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43712 samples/s/p 1:59:04 } +2024-07-25 23:13:15,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 21/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 8.196116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:13:15,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.44077 samples/s/p 1:58:57 } +2024-07-25 23:13:18,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 23/ 1625], loss: 1.287, per_step_time: 1474ms, lr: 8.190739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:18,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.42410 samples/s/p 1:59:16 } +2024-07-25 23:13:20,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 25/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 8.185359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:20,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43434 samples/s/p 1:58:59 } +2024-07-25 23:13:23,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 27/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 8.179981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:23,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43845 samples/s/p 1:58:51 } +2024-07-25 23:13:26,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 29/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 8.174604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:26,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43754 samples/s/p 1:58:49 } +2024-07-25 23:13:29,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 31/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 8.169228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:29,829 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 70.2% |███████████████████████████████████ | 5.43219 samples/s/p 1:58:53 } +2024-07-25 23:13:32,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 33/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 8.163854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:32,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43676 samples/s/p 1:58:44 } +2024-07-25 23:13:35,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 35/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 8.158482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:35,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43489 samples/s/p 1:58:44 } +2024-07-25 23:13:38,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 37/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 8.153111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:38,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43501 samples/s/p 1:58:41 } +2024-07-25 23:13:41,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 39/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 8.14774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:41,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43501 samples/s/p 1:58:38 } +2024-07-25 23:13:44,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 41/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 8.1423705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:44,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43653 samples/s/p 
1:58:33 } +2024-07-25 23:13:47,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 43/ 1625], loss: 1.228, per_step_time: 1470ms, lr: 8.1370035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:47,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43878 samples/s/p 1:58:27 } +2024-07-25 23:13:50,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 45/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 8.13164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:50,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43703 samples/s/p 1:58:26 } +2024-07-25 23:13:53,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 47/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 8.126273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:53,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43458 samples/s/p 1:58:27 } +2024-07-25 23:13:56,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 49/ 1625], loss: 1.120, per_step_time: 1475ms, lr: 8.120909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:56,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.42343 samples/s/p 1:58:38 } +2024-07-25 23:13:59,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 51/ 1625], loss: 1.296, per_step_time: 1472ms, lr: 8.11555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:59,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43231 samples/s/p 1:58:24 } +2024-07-25 23:14:02,298 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 53/ 1625], loss: 1.118, per_step_time: 1475ms, lr: 8.110187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:02,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.42067 samples/s/p 1:58:36 } +2024-07-25 23:14:05,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 55/ 1625], loss: 1.382, per_step_time: 1471ms, lr: 8.104828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:05,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43739 samples/s/p 1:58:11 } +2024-07-25 23:14:08,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 57/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 8.099473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:08,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43330 samples/s/p 1:58:14 } +2024-07-25 23:14:11,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 59/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 8.094114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:11,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43677 samples/s/p 1:58:06 } +2024-07-25 23:14:14,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 61/ 1625], loss: 1.079, per_step_time: 1470ms, lr: 8.088761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:14,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43968 samples/s/p 1:57:59 } +2024-07-25 23:14:17,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
8/ 10], step:[ 63/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 8.083408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:17,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43847 samples/s/p 1:57:58 } +2024-07-25 23:14:19,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 65/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 8.078052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:19,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43458 samples/s/p 1:58:00 } +2024-07-25 23:14:22,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 67/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 8.072704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:22,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43804 samples/s/p 1:57:53 } +2024-07-25 23:14:25,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 69/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 8.067355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:25,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43311 samples/s/p 1:57:56 } +2024-07-25 23:14:28,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 71/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 8.062004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:28,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43940 samples/s/p 1:57:45 } +2024-07-25 23:14:31,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 73/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 
8.05666e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:31,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43235 samples/s/p 1:57:51 } +2024-07-25 23:14:34,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 75/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 8.051315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:34,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.43288 samples/s/p 1:57:48 } +2024-07-25 23:14:37,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 77/ 1625], loss: 0.892, per_step_time: 1470ms, lr: 8.0459695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:37,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.44108 samples/s/p 1:57:34 } +2024-07-25 23:14:40,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 79/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 8.040627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:40,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.42886 samples/s/p 1:57:47 } +2024-07-25 23:14:43,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 81/ 1625], loss: 1.188, per_step_time: 1475ms, lr: 8.035286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:43,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.42116 samples/s/p 1:57:54 } +2024-07-25 23:14:46,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 83/ 1625], loss: 0.976, per_step_time: 1473ms, lr: 8.029945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:14:46,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.42950 samples/s/p 1:57:40 } +2024-07-25 23:14:49,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 85/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 8.024606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:49,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.43227 samples/s/p 1:57:34 } +2024-07-25 23:14:52,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 87/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 8.019269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:52,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.43658 samples/s/p 1:57:25 } +2024-07-25 23:14:55,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 89/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 8.013937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:55,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.43538 samples/s/p 1:57:24 } +2024-07-25 23:14:58,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 91/ 1625], loss: 0.993, per_step_time: 1472ms, lr: 8.008599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:58,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43149 samples/s/p 1:57:26 } +2024-07-25 23:15:01,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 93/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 8.003266e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:01,325 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 70.6% |███████████████████████████████████ | 5.43513 samples/s/p 1:57:18 } +2024-07-25 23:15:04,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 95/ 1625], loss: 1.204, per_step_time: 1468ms, lr: 7.997937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:04,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.44688 samples/s/p 1:57:00 } +2024-07-25 23:15:07,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 97/ 1625], loss: 1.009, per_step_time: 1471ms, lr: 7.992605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:07,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43505 samples/s/p 1:57:12 } +2024-07-25 23:15:10,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 99/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 7.987275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:10,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43309 samples/s/p 1:57:12 } +2024-07-25 23:15:13,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 101/ 1625], loss: 0.903, per_step_time: 1473ms, lr: 7.981951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:13,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.42988 samples/s/p 1:57:13 } +2024-07-25 23:15:16,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 103/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 7.976621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:16,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43682 samples/s/p 
1:57:01 } +2024-07-25 23:15:19,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 105/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 7.9713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:19,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43459 samples/s/p 1:57:01 } +2024-07-25 23:15:21,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 107/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 7.965976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:21,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43767 samples/s/p 1:56:54 } +2024-07-25 23:15:24,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 109/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 7.960652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:24,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.42987 samples/s/p 1:57:01 } +2024-07-25 23:15:27,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 111/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 7.955334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:27,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.44111 samples/s/p 1:56:44 } +2024-07-25 23:15:30,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 113/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 7.950014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:30,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43751 samples/s/p 1:56:46 } +2024-07-25 23:15:33,776 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 115/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 7.944696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:33,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43926 samples/s/p 1:56:40 } +2024-07-25 23:15:36,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 117/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 7.93938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:36,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43438 samples/s/p 1:56:44 } +2024-07-25 23:15:39,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 119/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 7.934065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:39,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43616 samples/s/p 1:56:39 } +2024-07-25 23:15:42,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 121/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 7.928752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:42,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.42757 samples/s/p 1:56:47 } +2024-07-25 23:15:45,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 123/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 7.923439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:45,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.44142 samples/s/p 1:56:26 } +2024-07-25 23:15:48,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 125/ 1625], loss: 1.249, per_step_time: 1470ms, lr: 7.918128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:48,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.44053 samples/s/p 1:56:24 } +2024-07-25 23:15:51,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 127/ 1625], loss: 1.352, per_step_time: 1472ms, lr: 7.912819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:51,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43279 samples/s/p 1:56:31 } +2024-07-25 23:15:54,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 129/ 1625], loss: 1.101, per_step_time: 1473ms, lr: 7.907511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:54,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43034 samples/s/p 1:56:31 } +2024-07-25 23:15:57,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 131/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 7.902204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:57,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43170 samples/s/p 1:56:27 } +2024-07-25 23:16:00,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 133/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 7.8969015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:00,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43882 samples/s/p 1:56:15 } +2024-07-25 23:16:03,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 135/ 1625], loss: 1.298, per_step_time: 
1471ms, lr: 7.8915955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:03,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43781 samples/s/p 1:56:13 } +2024-07-25 23:16:06,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 137/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 7.886293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:06,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43811 samples/s/p 1:56:10 } +2024-07-25 23:16:09,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 139/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 7.880994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:09,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43626 samples/s/p 1:56:09 } +2024-07-25 23:16:12,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 141/ 1625], loss: 0.940, per_step_time: 1471ms, lr: 7.875692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:12,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43511 samples/s/p 1:56:08 } +2024-07-25 23:16:15,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 143/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 7.870396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:15,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.44038 samples/s/p 1:55:58 } +2024-07-25 23:16:18,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 145/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 7.8651e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:16:18,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.44070 samples/s/p 1:55:54 } +2024-07-25 23:16:20,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 147/ 1625], loss: 1.226, per_step_time: 1473ms, lr: 7.859801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:20,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.42803 samples/s/p 1:56:08 } +2024-07-25 23:16:23,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 149/ 1625], loss: 0.906, per_step_time: 1470ms, lr: 7.85451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:23,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43937 samples/s/p 1:55:50 } +2024-07-25 23:16:26,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 151/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 7.8492185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:26,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43628 samples/s/p 1:55:51 } +2024-07-25 23:16:29,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 153/ 1625], loss: 1.019, per_step_time: 1472ms, lr: 7.843923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:29,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43470 samples/s/p 1:55:50 } +2024-07-25 23:16:32,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 155/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 7.838637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:32,785 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43930 samples/s/p 1:55:42 } +2024-07-25 23:16:35,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 157/ 1625], loss: 1.018, per_step_time: 1472ms, lr: 7.833349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:35,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43410 samples/s/p 1:55:45 } +2024-07-25 23:16:38,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 159/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 7.828062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:38,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43819 samples/s/p 1:55:37 } +2024-07-25 23:16:41,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 161/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 7.822776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:41,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43780 samples/s/p 1:55:35 } +2024-07-25 23:16:44,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 163/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 7.817492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:44,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43373 samples/s/p 1:55:37 } +2024-07-25 23:16:47,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 165/ 1625], loss: 1.167, per_step_time: 1469ms, lr: 7.812209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:47,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% 
|███████████████████████████████████ | 5.44567 samples/s/p 1:55:19 } +2024-07-25 23:16:50,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 167/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 7.806928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:50,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43723 samples/s/p 1:55:27 } +2024-07-25 23:16:53,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 169/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 7.801648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:53,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43045 samples/s/p 1:55:32 } +2024-07-25 23:16:56,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 171/ 1625], loss: 1.289, per_step_time: 1471ms, lr: 7.7963705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:56,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.43640 samples/s/p 1:55:22 } +2024-07-25 23:16:59,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 173/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 7.791093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:59,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.42996 samples/s/p 1:55:27 } +2024-07-25 23:17:02,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 175/ 1625], loss: 1.149, per_step_time: 1469ms, lr: 7.785818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:02,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.44232 samples/s/p 1:55:08 } 
+2024-07-25 23:17:05,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 177/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 7.780546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:05,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.44153 samples/s/p 1:55:06 } +2024-07-25 23:17:08,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 179/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 7.77527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:08,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.43969 samples/s/p 1:55:06 } +2024-07-25 23:17:11,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 181/ 1625], loss: 1.099, per_step_time: 1470ms, lr: 7.77e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:11,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.44206 samples/s/p 1:55:00 } +2024-07-25 23:17:14,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 183/ 1625], loss: 1.064, per_step_time: 1470ms, lr: 7.764732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:14,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.44007 samples/s/p 1:54:59 } +2024-07-25 23:17:17,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 185/ 1625], loss: 1.031, per_step_time: 1470ms, lr: 7.7594605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:17,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.44027 samples/s/p 1:54:56 } +2024-07-25 23:17:19,972 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 187/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 7.754196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:19,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43990 samples/s/p 1:54:54 } +2024-07-25 23:17:22,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 189/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 7.748931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:22,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43135 samples/s/p 1:55:02 } +2024-07-25 23:17:25,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 191/ 1625], loss: 1.170, per_step_time: 1469ms, lr: 7.743663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:25,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.44415 samples/s/p 1:54:42 } +2024-07-25 23:17:28,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 193/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 7.738405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:28,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43189 samples/s/p 1:54:55 } +2024-07-25 23:17:31,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 195/ 1625], loss: 1.033, per_step_time: 1473ms, lr: 7.733143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:31,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43090 samples/s/p 1:54:53 } +2024-07-25 23:17:34,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 197/ 1625], loss: 1.219, per_step_time: 1473ms, lr: 7.72788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:34,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43064 samples/s/p 1:54:51 } +2024-07-25 23:17:37,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 199/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 7.722625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:37,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43864 samples/s/p 1:54:38 } +2024-07-25 23:17:40,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 201/ 1625], loss: 1.314, per_step_time: 1472ms, lr: 7.717367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:40,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43186 samples/s/p 1:54:43 } +2024-07-25 23:17:43,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 203/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 7.712112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:43,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43555 samples/s/p 1:54:36 } +2024-07-25 23:17:46,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 205/ 1625], loss: 0.943, per_step_time: 1471ms, lr: 7.706858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:46,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43632 samples/s/p 1:54:32 } +2024-07-25 23:17:49,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 207/ 1625], loss: 1.187, per_step_time: 1472ms, 
lr: 7.701605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:49,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43240 samples/s/p 1:54:34 } +2024-07-25 23:17:52,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 209/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 7.696354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:52,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.42971 samples/s/p 1:54:34 } +2024-07-25 23:17:55,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 211/ 1625], loss: 1.014, per_step_time: 1477ms, lr: 7.691104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:55,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.41279 samples/s/p 1:54:53 } +2024-07-25 23:17:58,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 213/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 7.685856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:58,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43393 samples/s/p 1:54:23 } +2024-07-25 23:18:01,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 215/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 7.680609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:01,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.44168 samples/s/p 1:54:10 } +2024-07-25 23:18:04,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 217/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 7.675363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:18:04,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43493 samples/s/p 1:54:16 } +2024-07-25 23:18:07,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 219/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 7.67012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:07,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43430 samples/s/p 1:54:14 } +2024-07-25 23:18:10,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 221/ 1625], loss: 1.104, per_step_time: 1470ms, lr: 7.664877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:10,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.43901 samples/s/p 1:54:05 } +2024-07-25 23:18:13,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 223/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 7.659636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:13,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.42885 samples/s/p 1:54:15 } +2024-07-25 23:18:16,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 225/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 7.654396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:16,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.43986 samples/s/p 1:53:58 } +2024-07-25 23:18:19,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 227/ 1625], loss: 0.939, per_step_time: 1471ms, lr: 7.649158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:19,005 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 71.4% |███████████████████████████████████ | 5.43733 samples/s/p 1:53:58 } +2024-07-25 23:18:21,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 229/ 1625], loss: 0.986, per_step_time: 1482ms, lr: 7.643921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:21,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.39528 samples/s/p 1:54:48 } +2024-07-25 23:18:24,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 231/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 7.638689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:24,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.44041 samples/s/p 1:53:48 } +2024-07-25 23:18:27,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 233/ 1625], loss: 1.245, per_step_time: 1470ms, lr: 7.6334545e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:27,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.44142 samples/s/p 1:53:44 } +2024-07-25 23:18:30,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 235/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 7.628219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:30,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.43176 samples/s/p 1:53:53 } +2024-07-25 23:18:33,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 237/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 7.6229917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:33,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43594 
samples/s/p 1:53:45 } +2024-07-25 23:18:36,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 239/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 7.617762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:36,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43454 samples/s/p 1:53:44 } +2024-07-25 23:18:39,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 241/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 7.6125307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:39,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43195 samples/s/p 1:53:44 } +2024-07-25 23:18:42,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 243/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 7.607307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:42,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43277 samples/s/p 1:53:40 } +2024-07-25 23:18:45,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 245/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 7.602082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:45,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43318 samples/s/p 1:53:37 } +2024-07-25 23:18:48,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 247/ 1625], loss: 1.175, per_step_time: 1470ms, lr: 7.5968583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:48,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43927 samples/s/p 1:53:26 } +2024-07-25 23:18:51,479 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 249/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 7.5916355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:51,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.44054 samples/s/p 1:53:22 } +2024-07-25 23:18:54,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 251/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 7.586415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:54,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43698 samples/s/p 1:53:23 } +2024-07-25 23:18:57,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 253/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 7.581196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:57,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43716 samples/s/p 1:53:20 } +2024-07-25 23:19:00,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 255/ 1625], loss: 1.045, per_step_time: 1470ms, lr: 7.575978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:00,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.44078 samples/s/p 1:53:13 } +2024-07-25 23:19:03,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 257/ 1625], loss: 0.994, per_step_time: 1470ms, lr: 7.5707617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:03,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.44123 samples/s/p 1:53:09 } +2024-07-25 23:19:06,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 259/ 1625], loss: 1.027, per_step_time: 1473ms, lr: 7.5655466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:06,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43038 samples/s/p 1:53:20 } +2024-07-25 23:19:09,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 261/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 7.5603334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:09,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43685 samples/s/p 1:53:09 } +2024-07-25 23:19:12,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 263/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 7.555121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:12,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43766 samples/s/p 1:53:05 } +2024-07-25 23:19:15,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 265/ 1625], loss: 1.027, per_step_time: 1470ms, lr: 7.54991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:15,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.44046 samples/s/p 1:52:58 } +2024-07-25 23:19:18,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 267/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 7.5447015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:18,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43462 samples/s/p 1:53:03 } +2024-07-25 23:19:20,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 269/ 1625], loss: 1.185, per_step_time: 
1472ms, lr: 7.5394933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:20,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43241 samples/s/p 1:53:02 } +2024-07-25 23:19:23,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 271/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 7.5342878e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:23,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43623 samples/s/p 1:52:55 } +2024-07-25 23:19:26,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 273/ 1625], loss: 1.193, per_step_time: 1471ms, lr: 7.529083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:26,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43609 samples/s/p 1:52:52 } +2024-07-25 23:19:29,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 275/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 7.5238827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:29,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43877 samples/s/p 1:52:46 } +2024-07-25 23:19:32,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 277/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 7.518678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:32,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43722 samples/s/p 1:52:45 } +2024-07-25 23:19:35,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 279/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 7.513478e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:19:35,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43550 samples/s/p 1:52:44 } +2024-07-25 23:19:38,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 281/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 7.508282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:38,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43370 samples/s/p 1:52:43 } +2024-07-25 23:19:41,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 283/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 7.5030853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:41,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43793 samples/s/p 1:52:35 } +2024-07-25 23:19:44,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 285/ 1625], loss: 1.018, per_step_time: 1470ms, lr: 7.4978893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:44,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.44012 samples/s/p 1:52:29 } +2024-07-25 23:19:47,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 287/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 7.492694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:47,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.43971 samples/s/p 1:52:27 } +2024-07-25 23:19:50,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 289/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 7.4875015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:50,478 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.43325 samples/s/p 1:52:32 } +2024-07-25 23:19:53,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 291/ 1625], loss: 1.135, per_step_time: 1475ms, lr: 7.4823097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:53,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.42094 samples/s/p 1:52:44 } +2024-07-25 23:19:56,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 293/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 7.4771206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:56,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.43211 samples/s/p 1:52:28 } +2024-07-25 23:19:59,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 295/ 1625], loss: 1.119, per_step_time: 1470ms, lr: 7.471932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:59,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.44156 samples/s/p 1:52:13 } +2024-07-25 23:20:02,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 297/ 1625], loss: 1.064, per_step_time: 1473ms, lr: 7.4667446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:02,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.42803 samples/s/p 1:52:27 } +2024-07-25 23:20:05,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 299/ 1625], loss: 1.055, per_step_time: 1471ms, lr: 7.4615587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:05,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
71.8% |███████████████████████████████████ | 5.43829 samples/s/p 1:52:11 } +2024-07-25 23:20:08,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 301/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 7.456376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:08,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43589 samples/s/p 1:52:11 } +2024-07-25 23:20:11,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 303/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 7.4511927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:11,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43411 samples/s/p 1:52:10 } +2024-07-25 23:20:14,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 305/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 7.446012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:14,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43572 samples/s/p 1:52:05 } +2024-07-25 23:20:17,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 307/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 7.4408326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:17,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.42771 samples/s/p 1:52:12 } +2024-07-25 23:20:20,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 309/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 7.435654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:20,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.42852 samples/s/p 
1:52:08 } +2024-07-25 23:20:22,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 311/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 7.430478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:22,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43719 samples/s/p 1:51:55 } +2024-07-25 23:20:25,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 313/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 7.4253053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:25,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43802 samples/s/p 1:51:51 } +2024-07-25 23:20:28,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 315/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 7.4201294e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:28,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43914 samples/s/p 1:51:46 } +2024-07-25 23:20:31,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 317/ 1625], loss: 1.017, per_step_time: 1472ms, lr: 7.4149575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:31,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.43412 samples/s/p 1:51:50 } +2024-07-25 23:20:34,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 319/ 1625], loss: 0.999, per_step_time: 1469ms, lr: 7.4097893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:34,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.44280 samples/s/p 1:51:36 } +2024-07-25 23:20:37,700 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 321/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 7.4046175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:37,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.43078 samples/s/p 1:51:48 } +2024-07-25 23:20:40,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 323/ 1625], loss: 1.174, per_step_time: 1474ms, lr: 7.39945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:40,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.42554 samples/s/p 1:51:51 } +2024-07-25 23:20:43,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 325/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 7.394287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:43,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43474 samples/s/p 1:51:37 } +2024-07-25 23:20:46,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 327/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 7.389119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:46,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43674 samples/s/p 1:51:32 } +2024-07-25 23:20:49,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 329/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 7.3839587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:49,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43344 samples/s/p 1:51:33 } +2024-07-25 23:20:52,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 331/ 1625], loss: 0.983, per_step_time: 1472ms, lr: 7.3787974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:52,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43377 samples/s/p 1:51:30 } +2024-07-25 23:20:55,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 333/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 7.373637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:55,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43376 samples/s/p 1:51:27 } +2024-07-25 23:20:58,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 335/ 1625], loss: 1.035, per_step_time: 1472ms, lr: 7.368479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:58,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43407 samples/s/p 1:51:23 } +2024-07-25 23:21:01,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 337/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 7.363322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:01,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.44013 samples/s/p 1:51:13 } +2024-07-25 23:21:04,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 339/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 7.3581655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:04,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43846 samples/s/p 1:51:12 } +2024-07-25 23:21:07,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 341/ 1625], loss: 1.095, per_step_time: 
1470ms, lr: 7.353012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:07,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43949 samples/s/p 1:51:08 } +2024-07-25 23:21:10,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 343/ 1625], loss: 1.290, per_step_time: 1473ms, lr: 7.347859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:10,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.42782 samples/s/p 1:51:19 } +2024-07-25 23:21:13,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 345/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 7.342708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:13,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43388 samples/s/p 1:51:09 } +2024-07-25 23:21:16,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 347/ 1625], loss: 1.077, per_step_time: 1469ms, lr: 7.337559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:16,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.44263 samples/s/p 1:50:55 } +2024-07-25 23:21:19,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 349/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 7.3324104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:19,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43184 samples/s/p 1:51:05 } +2024-07-25 23:21:21,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 351/ 1625], loss: 1.164, per_step_time: 1469ms, lr: 7.3272636e-06, overflow cond: False, loss_scale: 
1.0 +2024-07-25 23:21:21,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.44405 samples/s/p 1:50:47 } +2024-07-25 23:21:24,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 353/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 7.3221186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:24,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.43237 samples/s/p 1:50:59 } +2024-07-25 23:21:27,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 355/ 1625], loss: 1.153, per_step_time: 1470ms, lr: 7.3169754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:27,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.44183 samples/s/p 1:50:44 } +2024-07-25 23:21:30,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 357/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 7.311836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:30,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.43472 samples/s/p 1:50:50 } +2024-07-25 23:21:33,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 359/ 1625], loss: 1.053, per_step_time: 1476ms, lr: 7.3066926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:33,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.42002 samples/s/p 1:51:05 } +2024-07-25 23:21:36,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 361/ 1625], loss: 1.032, per_step_time: 1470ms, lr: 7.3015535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:36,719 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.44056 samples/s/p 1:50:37 } +2024-07-25 23:21:39,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 363/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 7.296419e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:39,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.43677 samples/s/p 1:50:39 } +2024-07-25 23:21:42,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 365/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 7.29128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:42,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.43607 samples/s/p 1:50:37 } +2024-07-25 23:21:45,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 367/ 1625], loss: 1.058, per_step_time: 1471ms, lr: 7.2861453e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:45,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43845 samples/s/p 1:50:31 } +2024-07-25 23:21:48,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 369/ 1625], loss: 1.043, per_step_time: 1470ms, lr: 7.2810158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:48,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.44007 samples/s/p 1:50:26 } +2024-07-25 23:21:51,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 371/ 1625], loss: 1.237, per_step_time: 1469ms, lr: 7.275881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:51,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
72.3% |████████████████████████████████████ | 5.44402 samples/s/p 1:50:18 } +2024-07-25 23:21:54,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 373/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 7.2707544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:54,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43516 samples/s/p 1:50:26 } +2024-07-25 23:21:57,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 375/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 7.2656258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:57,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43318 samples/s/p 1:50:25 } +2024-07-25 23:22:00,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 377/ 1625], loss: 1.169, per_step_time: 1469ms, lr: 7.2604957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:00,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.44246 samples/s/p 1:50:11 } +2024-07-25 23:22:03,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 379/ 1625], loss: 1.279, per_step_time: 1472ms, lr: 7.255374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:03,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43420 samples/s/p 1:50:18 } +2024-07-25 23:22:06,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 381/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 7.25025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:06,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43303 
samples/s/p 1:50:17 } +2024-07-25 23:22:09,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 383/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 7.245127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:09,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43673 samples/s/p 1:50:09 } +2024-07-25 23:22:12,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 385/ 1625], loss: 1.039, per_step_time: 1472ms, lr: 7.2400067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:12,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43320 samples/s/p 1:50:11 } +2024-07-25 23:22:15,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 387/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 7.2348876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:15,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43238 samples/s/p 1:50:09 } +2024-07-25 23:22:18,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 389/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 7.2297703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:18,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43999 samples/s/p 1:49:57 } +2024-07-25 23:22:20,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 391/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 7.2246526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:20,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43791 samples/s/p 1:49:56 } +2024-07-25 23:22:23,922 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 393/ 1625], loss: 1.149, per_step_time: 1473ms, lr: 7.219539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:23,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.42777 samples/s/p 1:50:06 } +2024-07-25 23:22:26,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 395/ 1625], loss: 0.985, per_step_time: 1471ms, lr: 7.214425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:26,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43509 samples/s/p 1:49:54 } +2024-07-25 23:22:29,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 397/ 1625], loss: 1.323, per_step_time: 1471ms, lr: 7.209314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:29,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43667 samples/s/p 1:49:49 } +2024-07-25 23:22:32,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 399/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 7.2042035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:32,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43339 samples/s/p 1:49:50 } +2024-07-25 23:22:35,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 401/ 1625], loss: 1.206, per_step_time: 1474ms, lr: 7.199098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:35,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.42396 samples/s/p 1:49:58 } +2024-07-25 23:22:38,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 8/ 10], step:[ 403/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 7.1939876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:38,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43153 samples/s/p 1:49:46 } +2024-07-25 23:22:41,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 405/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 7.1888826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:41,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43826 samples/s/p 1:49:35 } +2024-07-25 23:22:44,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 407/ 1625], loss: 1.280, per_step_time: 1471ms, lr: 7.183781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:44,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43668 samples/s/p 1:49:34 } +2024-07-25 23:22:47,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 409/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 7.1786762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:47,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43164 samples/s/p 1:49:37 } +2024-07-25 23:22:50,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 411/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 7.1735753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:50,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43632 samples/s/p 1:49:29 } +2024-07-25 23:22:53,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 413/ 1625], loss: 1.243, 
per_step_time: 1470ms, lr: 7.168479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:53,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43950 samples/s/p 1:49:22 } +2024-07-25 23:22:56,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 415/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 7.163378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:56,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43692 samples/s/p 1:49:22 } +2024-07-25 23:22:59,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 417/ 1625], loss: 1.249, per_step_time: 1470ms, lr: 7.158285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:59,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43980 samples/s/p 1:49:16 } +2024-07-25 23:23:02,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 419/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 7.15319e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:02,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43340 samples/s/p 1:49:20 } +2024-07-25 23:23:05,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 421/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 7.148094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:05,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43498 samples/s/p 1:49:16 } +2024-07-25 23:23:08,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 423/ 1625], loss: 1.299, per_step_time: 1470ms, lr: 7.1430045e-06, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 23:23:08,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43951 samples/s/p 1:49:07 } +2024-07-25 23:23:11,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 425/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 7.137915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:11,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.44013 samples/s/p 1:49:03 } +2024-07-25 23:23:14,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 427/ 1625], loss: 1.171, per_step_time: 1470ms, lr: 7.1328236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:14,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43856 samples/s/p 1:49:02 } +2024-07-25 23:23:17,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 429/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 7.127739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:17,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43797 samples/s/p 1:49:00 } +2024-07-25 23:23:19,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 431/ 1625], loss: 1.294, per_step_time: 1473ms, lr: 7.1226536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:19,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.42915 samples/s/p 1:49:08 } +2024-07-25 23:23:22,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 433/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 7.117569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:22,934 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.43663 samples/s/p 1:48:56 } +2024-07-25 23:23:25,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 435/ 1625], loss: 1.017, per_step_time: 1471ms, lr: 7.1124873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:25,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.43802 samples/s/p 1:48:51 } +2024-07-25 23:23:28,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 437/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 7.1074064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:28,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.43751 samples/s/p 1:48:49 } +2024-07-25 23:23:31,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 439/ 1625], loss: 1.191, per_step_time: 1469ms, lr: 7.102327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:31,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.44241 samples/s/p 1:48:40 } +2024-07-25 23:23:34,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 441/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 7.097249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:34,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.43609 samples/s/p 1:48:45 } +2024-07-25 23:23:37,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 443/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 7.092173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:37,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 72.7% |████████████████████████████████████ | 5.43582 samples/s/p 1:48:42 } +2024-07-25 23:23:40,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 445/ 1625], loss: 1.092, per_step_time: 1473ms, lr: 7.087101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:40,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.42909 samples/s/p 1:48:47 } +2024-07-25 23:23:43,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 447/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 7.082025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:43,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43775 samples/s/p 1:48:34 } +2024-07-25 23:23:46,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 449/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 7.076954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:46,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43855 samples/s/p 1:48:30 } +2024-07-25 23:23:49,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 451/ 1625], loss: 1.398, per_step_time: 1472ms, lr: 7.0718866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:49,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43303 samples/s/p 1:48:34 } +2024-07-25 23:23:52,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 453/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 7.066815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:52,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43517 
samples/s/p 1:48:28 } +2024-07-25 23:23:55,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 455/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 7.061751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:55,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43556 samples/s/p 1:48:25 } +2024-07-25 23:23:58,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 457/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 7.0566857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:58,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43781 samples/s/p 1:48:19 } +2024-07-25 23:24:01,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 459/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 7.0516194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:01,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43148 samples/s/p 1:48:24 } +2024-07-25 23:24:04,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 461/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 7.0465603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:04,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43437 samples/s/p 1:48:17 } +2024-07-25 23:24:07,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 463/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 7.0415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:07,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43850 samples/s/p 1:48:10 } +2024-07-25 23:24:10,137 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 465/ 1625], loss: 1.064, per_step_time: 1470ms, lr: 7.0364367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:10,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.44057 samples/s/p 1:48:04 } +2024-07-25 23:24:13,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 467/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 7.0313827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:13,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43514 samples/s/p 1:48:08 } +2024-07-25 23:24:16,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 469/ 1625], loss: 1.008, per_step_time: 1473ms, lr: 7.026327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:16,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43090 samples/s/p 1:48:10 } +2024-07-25 23:24:18,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 471/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 7.0212723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:18,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43479 samples/s/p 1:48:02 } +2024-07-25 23:24:21,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 473/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 7.016219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:21,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43704 samples/s/p 1:47:57 } +2024-07-25 23:24:24,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 8/ 10], step:[ 475/ 1625], loss: 1.131, per_step_time: 1470ms, lr: 7.0111682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:24,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43902 samples/s/p 1:47:51 } +2024-07-25 23:24:27,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 477/ 1625], loss: 1.088, per_step_time: 1472ms, lr: 7.0061183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:27,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43155 samples/s/p 1:47:57 } +2024-07-25 23:24:30,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 479/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 7.00107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:30,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43336 samples/s/p 1:47:52 } +2024-07-25 23:24:33,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 481/ 1625], loss: 1.001, per_step_time: 1472ms, lr: 6.996024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:33,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43206 samples/s/p 1:47:51 } +2024-07-25 23:24:36,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 483/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 6.9909815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:36,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43077 samples/s/p 1:47:49 } +2024-07-25 23:24:39,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 485/ 1625], loss: 1.283, 
per_step_time: 1473ms, lr: 6.985936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:39,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.42809 samples/s/p 1:47:50 } +2024-07-25 23:24:42,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 487/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 6.980893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:42,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43393 samples/s/p 1:47:40 } +2024-07-25 23:24:45,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 489/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 6.975856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:45,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43562 samples/s/p 1:47:35 } +2024-07-25 23:24:48,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 491/ 1625], loss: 1.066, per_step_time: 1473ms, lr: 6.970814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:48,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.42831 samples/s/p 1:47:40 } +2024-07-25 23:24:51,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 493/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 6.965778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:51,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43420 samples/s/p 1:47:30 } +2024-07-25 23:24:54,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 495/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 6.9607454e-06, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 23:24:54,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.42997 samples/s/p 1:47:33 } +2024-07-25 23:24:57,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 497/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 6.955708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:57,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43302 samples/s/p 1:47:26 } +2024-07-25 23:25:00,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 499/ 1625], loss: 1.284, per_step_time: 1470ms, lr: 6.950678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:00,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43925 samples/s/p 1:47:16 } +2024-07-25 23:25:03,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 501/ 1625], loss: 0.971, per_step_time: 1472ms, lr: 6.9456473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:03,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43184 samples/s/p 1:47:22 } +2024-07-25 23:25:06,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 503/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 6.9406155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:06,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.42986 samples/s/p 1:47:21 } +2024-07-25 23:25:09,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 505/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 6.9355906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:09,175 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43928 samples/s/p 1:47:07 } +2024-07-25 23:25:12,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 507/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 6.9305643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:12,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43252 samples/s/p 1:47:12 } +2024-07-25 23:25:15,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 509/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 6.9255375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:15,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43964 samples/s/p 1:47:01 } +2024-07-25 23:25:18,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 511/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 6.920517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:18,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43549 samples/s/p 1:47:02 } +2024-07-25 23:25:20,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 513/ 1625], loss: 1.141, per_step_time: 1477ms, lr: 6.9154958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:20,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.41534 samples/s/p 1:47:23 } +2024-07-25 23:25:23,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 515/ 1625], loss: 1.279, per_step_time: 1473ms, lr: 6.910476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:23,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 73.2% |████████████████████████████████████ | 5.43090 samples/s/p 1:47:02 } +2024-07-25 23:25:26,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 517/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 6.905458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:26,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43087 samples/s/p 1:46:59 } +2024-07-25 23:25:29,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 519/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 6.900441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:29,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43721 samples/s/p 1:46:49 } +2024-07-25 23:25:32,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 521/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 6.8954255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:32,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.44150 samples/s/p 1:46:41 } +2024-07-25 23:25:35,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 523/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 6.890413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:35,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.42967 samples/s/p 1:46:52 } +2024-07-25 23:25:38,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 525/ 1625], loss: 1.388, per_step_time: 1472ms, lr: 6.885401e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:38,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43277 
samples/s/p 1:46:45 } +2024-07-25 23:25:41,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 527/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 6.880391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:41,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43165 samples/s/p 1:46:43 } +2024-07-25 23:25:44,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 529/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 6.8753825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:44,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43454 samples/s/p 1:46:37 } +2024-07-25 23:25:47,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 531/ 1625], loss: 1.274, per_step_time: 1473ms, lr: 6.870375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:47,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43069 samples/s/p 1:46:39 } +2024-07-25 23:25:50,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 533/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 6.8653726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:50,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43515 samples/s/p 1:46:30 } +2024-07-25 23:25:53,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 535/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 6.860366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:53,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43549 samples/s/p 1:46:27 } +2024-07-25 23:25:56,406 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 537/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 6.8553636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:56,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43599 samples/s/p 1:46:24 } +2024-07-25 23:25:59,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 539/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 6.8503664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:59,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43245 samples/s/p 1:46:25 } +2024-07-25 23:26:02,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 541/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 6.8453637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:02,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43947 samples/s/p 1:46:14 } +2024-07-25 23:26:05,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 543/ 1625], loss: 1.019, per_step_time: 1470ms, lr: 6.840369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:05,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43873 samples/s/p 1:46:12 } +2024-07-25 23:26:08,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 545/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 6.835374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:08,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43536 samples/s/p 1:46:13 } +2024-07-25 23:26:11,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 8/ 10], step:[ 547/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 6.8303757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:11,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43180 samples/s/p 1:46:14 } +2024-07-25 23:26:14,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 549/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 6.825386e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:14,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43766 samples/s/p 1:46:04 } +2024-07-25 23:26:17,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 551/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 6.8203954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:17,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43486 samples/s/p 1:46:04 } +2024-07-25 23:26:20,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 553/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 6.815403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:20,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43326 samples/s/p 1:46:03 } +2024-07-25 23:26:22,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 555/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 6.810418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:22,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43667 samples/s/p 1:45:56 } +2024-07-25 23:26:25,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 557/ 1625], loss: 1.147, 
per_step_time: 1471ms, lr: 6.8054314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:25,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43763 samples/s/p 1:45:52 } +2024-07-25 23:26:28,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 559/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 6.800447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:28,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43287 samples/s/p 1:45:55 } +2024-07-25 23:26:31,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 561/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 6.795464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:31,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.42931 samples/s/p 1:45:56 } +2024-07-25 23:26:34,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 563/ 1625], loss: 1.001, per_step_time: 1472ms, lr: 6.790483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:34,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43474 samples/s/p 1:45:47 } +2024-07-25 23:26:37,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 565/ 1625], loss: 1.010, per_step_time: 1472ms, lr: 6.785503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:37,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43390 samples/s/p 1:45:45 } +2024-07-25 23:26:40,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 567/ 1625], loss: 1.275, per_step_time: 1473ms, lr: 6.780525e-06, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 23:26:40,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43066 samples/s/p 1:45:46 } +2024-07-25 23:26:43,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 569/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 6.7755473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:43,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43306 samples/s/p 1:45:40 } +2024-07-25 23:26:46,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 571/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 6.770573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:46,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43262 samples/s/p 1:45:38 } +2024-07-25 23:26:49,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 573/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 6.7655997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:49,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43487 samples/s/p 1:45:32 } +2024-07-25 23:26:52,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 575/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 6.7606275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:52,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43552 samples/s/p 1:45:28 } +2024-07-25 23:26:55,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 577/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 6.755657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:55,430 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43473 samples/s/p 1:45:26 } +2024-07-25 23:26:58,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 579/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 6.7506894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:58,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43498 samples/s/p 1:45:23 } +2024-07-25 23:27:01,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 581/ 1625], loss: 1.042, per_step_time: 1473ms, lr: 6.7457217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:01,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43064 samples/s/p 1:45:25 } +2024-07-25 23:27:04,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 583/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 6.74076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:04,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.42908 samples/s/p 1:45:24 } +2024-07-25 23:27:07,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 585/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 6.735793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:07,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43428 samples/s/p 1:45:15 } +2024-07-25 23:27:10,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 587/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 6.730834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:10,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
73.6% |████████████████████████████████████ | 5.43579 samples/s/p 1:45:10 } +2024-07-25 23:27:13,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 589/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 6.725873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:13,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43203 samples/s/p 1:45:12 } +2024-07-25 23:27:16,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 591/ 1625], loss: 1.129, per_step_time: 1482ms, lr: 6.720911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:16,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.39663 samples/s/p 1:45:50 } +2024-07-25 23:27:19,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 593/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 6.715957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:19,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43557 samples/s/p 1:45:02 } +2024-07-25 23:27:22,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 595/ 1625], loss: 0.980, per_step_time: 1472ms, lr: 6.7110013e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:22,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43458 samples/s/p 1:45:00 } +2024-07-25 23:27:24,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 597/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 6.7060473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:24,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43418 
samples/s/p 1:44:57 } +2024-07-25 23:27:27,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 599/ 1625], loss: 1.117, per_step_time: 1470ms, lr: 6.701095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:27,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43924 samples/s/p 1:44:49 } +2024-07-25 23:27:30,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 601/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 6.6961447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:30,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43770 samples/s/p 1:44:47 } +2024-07-25 23:27:33,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 603/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 6.691195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:33,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43920 samples/s/p 1:44:43 } +2024-07-25 23:27:36,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 605/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 6.686248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:36,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43657 samples/s/p 1:44:43 } +2024-07-25 23:27:39,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 607/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 6.681302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:39,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43659 samples/s/p 1:44:40 } +2024-07-25 23:27:42,669 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 609/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 6.6763573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:42,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.42765 samples/s/p 1:44:47 } +2024-07-25 23:27:45,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 611/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 6.6714156e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:45,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.44044 samples/s/p 1:44:30 } +2024-07-25 23:27:48,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 613/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 6.6664743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:48,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43579 samples/s/p 1:44:32 } +2024-07-25 23:27:51,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 615/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 6.661535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:51,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43722 samples/s/p 1:44:27 } +2024-07-25 23:27:54,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 617/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 6.6565976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:54,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43493 samples/s/p 1:44:27 } +2024-07-25 23:27:57,421 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 8/ 10], step:[ 619/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 6.651661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:57,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43134 samples/s/p 1:44:28 } +2024-07-25 23:28:00,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 621/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 6.646727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:00,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43535 samples/s/p 1:44:21 } +2024-07-25 23:28:03,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 623/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 6.6417933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:03,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43422 samples/s/p 1:44:19 } +2024-07-25 23:28:06,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 625/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 6.6368652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:06,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43836 samples/s/p 1:44:11 } +2024-07-25 23:28:09,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 627/ 1625], loss: 1.269, per_step_time: 1475ms, lr: 6.631933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:09,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.42274 samples/s/p 1:44:26 } +2024-07-25 23:28:12,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 629/ 1625], loss: 1.024, 
per_step_time: 1471ms, lr: 6.627005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:12,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43756 samples/s/p 1:44:06 } +2024-07-25 23:28:15,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 631/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 6.6220814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:15,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43622 samples/s/p 1:44:05 } +2024-07-25 23:28:18,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 633/ 1625], loss: 1.245, per_step_time: 1473ms, lr: 6.6171565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:18,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43050 samples/s/p 1:44:09 } +2024-07-25 23:28:21,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 635/ 1625], loss: 1.020, per_step_time: 1472ms, lr: 6.612231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:21,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43326 samples/s/p 1:44:03 } +2024-07-25 23:28:23,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 637/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 6.6073126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:23,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43540 samples/s/p 1:43:57 } +2024-07-25 23:28:26,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 639/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 6.602392e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 23:28:26,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43604 samples/s/p 1:43:53 } +2024-07-25 23:28:29,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 641/ 1625], loss: 1.117, per_step_time: 1473ms, lr: 6.5974746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:29,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.42926 samples/s/p 1:43:58 } +2024-07-25 23:28:32,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 643/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 6.592558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:32,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.42933 samples/s/p 1:43:55 } +2024-07-25 23:28:35,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 645/ 1625], loss: 0.951, per_step_time: 1472ms, lr: 6.587644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:35,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.43127 samples/s/p 1:43:50 } +2024-07-25 23:28:38,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 647/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 6.5827303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:38,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.43492 samples/s/p 1:43:43 } +2024-07-25 23:28:41,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 649/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 6.5778186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:41,702 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.42976 samples/s/p 1:43:46 } +2024-07-25 23:28:44,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 651/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 6.5729087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:44,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.43583 samples/s/p 1:43:36 } +2024-07-25 23:28:47,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 653/ 1625], loss: 1.045, per_step_time: 1471ms, lr: 6.5680006e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:47,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.43719 samples/s/p 1:43:32 } +2024-07-25 23:28:50,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 655/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 6.5630943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:50,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.43887 samples/s/p 1:43:27 } +2024-07-25 23:28:53,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 657/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 6.5581894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:53,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.43678 samples/s/p 1:43:26 } +2024-07-25 23:28:56,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 659/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 6.5532854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:56,451 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 74.1% |█████████████████████████████████████ | 5.43619 samples/s/p 1:43:24 } +2024-07-25 23:28:59,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 661/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 6.548384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:59,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43218 samples/s/p 1:43:25 } +2024-07-25 23:29:02,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 663/ 1625], loss: 1.387, per_step_time: 1473ms, lr: 6.543484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:02,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.42969 samples/s/p 1:43:25 } +2024-07-25 23:29:05,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 665/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 6.538586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:05,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43424 samples/s/p 1:43:17 } +2024-07-25 23:29:08,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 667/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 6.533689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:08,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43166 samples/s/p 1:43:17 } +2024-07-25 23:29:11,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 669/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 6.5287973e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:11,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 
5.43629 samples/s/p 1:43:09 } +2024-07-25 23:29:14,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 671/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 6.5239014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:14,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43426 samples/s/p 1:43:08 } +2024-07-25 23:29:17,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 673/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 6.5190097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:17,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43182 samples/s/p 1:43:08 } +2024-07-25 23:29:20,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 675/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 6.514122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:20,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43497 samples/s/p 1:43:02 } +2024-07-25 23:29:23,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 677/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 6.5092313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:23,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43692 samples/s/p 1:42:57 } +2024-07-25 23:29:25,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 679/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 6.5043446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:25,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43665 samples/s/p 1:42:54 } +2024-07-25 23:29:28,918 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 681/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 6.4994624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:28,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43361 samples/s/p 1:42:54 } +2024-07-25 23:29:31,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 683/ 1625], loss: 1.231, per_step_time: 1470ms, lr: 6.4945793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:31,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.44187 samples/s/p 1:42:42 } +2024-07-25 23:29:34,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 685/ 1625], loss: 1.049, per_step_time: 1472ms, lr: 6.489697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:34,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43136 samples/s/p 1:42:51 } +2024-07-25 23:29:37,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 687/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 6.4848173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:37,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43265 samples/s/p 1:42:47 } +2024-07-25 23:29:40,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 689/ 1625], loss: 1.051, per_step_time: 1470ms, lr: 6.4799387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:40,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.44106 samples/s/p 1:42:34 } +2024-07-25 23:29:43,665 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 691/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 6.4750616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:43,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.44028 samples/s/p 1:42:32 } +2024-07-25 23:29:46,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 693/ 1625], loss: 1.130, per_step_time: 1470ms, lr: 6.470187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:46,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.44199 samples/s/p 1:42:27 } +2024-07-25 23:29:49,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 695/ 1625], loss: 1.346, per_step_time: 1472ms, lr: 6.4653136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:49,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.43446 samples/s/p 1:42:33 } +2024-07-25 23:29:52,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 697/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 6.4604415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:52,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.42762 samples/s/p 1:42:38 } +2024-07-25 23:29:55,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 699/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 6.4555716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:55,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.43499 samples/s/p 1:42:26 } +2024-07-25 23:29:58,421 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 8/ 10], step:[ 701/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 6.450704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:58,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.43501 samples/s/p 1:42:23 } +2024-07-25 23:30:01,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 703/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 6.4458363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:01,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.42905 samples/s/p 1:42:27 } +2024-07-25 23:30:04,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 705/ 1625], loss: 1.295, per_step_time: 1473ms, lr: 6.4409714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:04,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.42786 samples/s/p 1:42:26 } +2024-07-25 23:30:07,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 707/ 1625], loss: 1.114, per_step_time: 1473ms, lr: 6.4361084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:07,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.42841 samples/s/p 1:42:22 } +2024-07-25 23:30:10,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 709/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 6.4312467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:10,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43728 samples/s/p 1:42:09 } +2024-07-25 23:30:13,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 711/ 1625], loss: 
1.177, per_step_time: 1470ms, lr: 6.426387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:13,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.44091 samples/s/p 1:42:02 } +2024-07-25 23:30:16,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 713/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 6.4215315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:16,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43631 samples/s/p 1:42:04 } +2024-07-25 23:30:19,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 715/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 6.4166716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:19,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43402 samples/s/p 1:42:04 } +2024-07-25 23:30:22,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 717/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 6.4118162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:22,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43528 samples/s/p 1:42:00 } +2024-07-25 23:30:24,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 719/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 6.406966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:24,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43372 samples/s/p 1:41:58 } +2024-07-25 23:30:27,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 721/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 6.4021115e-06, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:27,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43001 samples/s/p 1:42:00 } +2024-07-25 23:30:30,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 723/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 6.397261e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:30,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43439 samples/s/p 1:41:52 } +2024-07-25 23:30:33,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 725/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 6.3924163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:33,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43528 samples/s/p 1:41:48 } +2024-07-25 23:30:36,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 727/ 1625], loss: 1.198, per_step_time: 1473ms, lr: 6.387567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:36,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43104 samples/s/p 1:41:50 } +2024-07-25 23:30:39,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 729/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 6.382725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:39,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43351 samples/s/p 1:41:44 } +2024-07-25 23:30:42,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 731/ 1625], loss: 1.114, per_step_time: 1473ms, lr: 6.3778816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:30:42,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43106 samples/s/p 1:41:44 } +2024-07-25 23:30:45,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 733/ 1625], loss: 1.059, per_step_time: 1469ms, lr: 6.373039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:45,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.44373 samples/s/p 1:41:26 } +2024-07-25 23:30:48,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 735/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 6.3682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:48,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43647 samples/s/p 1:41:32 } +2024-07-25 23:30:51,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 737/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 6.363362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:51,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43672 samples/s/p 1:41:28 } +2024-07-25 23:30:54,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 739/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 6.358525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:54,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43683 samples/s/p 1:41:25 } +2024-07-25 23:30:57,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 741/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 6.353691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:57,445 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43800 samples/s/p 1:41:21 } +2024-07-25 23:31:00,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 743/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 6.348857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:00,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43517 samples/s/p 1:41:21 } +2024-07-25 23:31:03,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 745/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 6.3440257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:03,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43692 samples/s/p 1:41:16 } +2024-07-25 23:31:06,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 747/ 1625], loss: 1.055, per_step_time: 1470ms, lr: 6.3391963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:06,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43886 samples/s/p 1:41:11 } +2024-07-25 23:31:09,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 749/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 6.334368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:09,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43805 samples/s/p 1:41:09 } +2024-07-25 23:31:12,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 751/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 6.3295415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:12,194 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 74.6% |█████████████████████████████████████ | 5.43716 samples/s/p 1:41:07 } +2024-07-25 23:31:15,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 753/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 6.324717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:15,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43492 samples/s/p 1:41:07 } +2024-07-25 23:31:18,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 755/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 6.3198936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:18,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43426 samples/s/p 1:41:05 } +2024-07-25 23:31:21,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 757/ 1625], loss: 1.036, per_step_time: 1470ms, lr: 6.3150756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:21,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43939 samples/s/p 1:40:56 } +2024-07-25 23:31:23,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 759/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 6.3102534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:23,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43598 samples/s/p 1:40:57 } +2024-07-25 23:31:26,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 761/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 6.3054354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:26,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 
5.43874 samples/s/p 1:40:51 } +2024-07-25 23:31:29,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 763/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 6.3006214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:29,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43361 samples/s/p 1:40:54 } +2024-07-25 23:31:32,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 765/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 6.295804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:32,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43300 samples/s/p 1:40:51 } +2024-07-25 23:31:35,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 767/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 6.2909953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:35,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43736 samples/s/p 1:40:44 } +2024-07-25 23:31:38,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 769/ 1625], loss: 1.059, per_step_time: 1475ms, lr: 6.2861827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:38,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.42232 samples/s/p 1:40:57 } +2024-07-25 23:31:41,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 771/ 1625], loss: 1.341, per_step_time: 1471ms, lr: 6.2813715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:41,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43558 samples/s/p 1:40:40 } +2024-07-25 23:31:44,656 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 773/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 6.276566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:44,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43619 samples/s/p 1:40:36 } +2024-07-25 23:31:47,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 775/ 1625], loss: 0.939, per_step_time: 1470ms, lr: 6.27176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:47,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.44027 samples/s/p 1:40:29 } +2024-07-25 23:31:50,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 777/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 6.2669537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:50,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43497 samples/s/p 1:40:32 } +2024-07-25 23:31:53,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 779/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 6.262154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:53,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43241 samples/s/p 1:40:31 } +2024-07-25 23:31:56,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 781/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 6.2573527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:56,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43431 samples/s/p 1:40:26 } +2024-07-25 23:31:59,403 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 8/ 10], step:[ 783/ 1625], loss: 1.039, per_step_time: 1468ms, lr: 6.2525532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:59,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.44670 samples/s/p 1:40:10 } +2024-07-25 23:32:02,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 785/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 6.2477557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:02,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43642 samples/s/p 1:40:18 } +2024-07-25 23:32:05,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 787/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 6.24296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:05,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43446 samples/s/p 1:40:17 } +2024-07-25 23:32:08,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 789/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 6.238167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:08,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43529 samples/s/p 1:40:14 } +2024-07-25 23:32:11,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 791/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 6.2333734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:11,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43707 samples/s/p 1:40:09 } +2024-07-25 23:32:14,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 793/ 1625], loss: 1.232, 
per_step_time: 1472ms, lr: 6.228583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:14,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43312 samples/s/p 1:40:10 } +2024-07-25 23:32:17,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 795/ 1625], loss: 0.987, per_step_time: 1470ms, lr: 6.2237973e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:17,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43925 samples/s/p 1:40:00 } +2024-07-25 23:32:20,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 797/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 6.219008e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:20,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.42996 samples/s/p 1:40:08 } +2024-07-25 23:32:23,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 799/ 1625], loss: 1.374, per_step_time: 1471ms, lr: 6.214222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:23,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43819 samples/s/p 1:39:56 } +2024-07-25 23:32:25,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 801/ 1625], loss: 1.252, per_step_time: 1470ms, lr: 6.2094405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:25,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.44011 samples/s/p 1:39:51 } +2024-07-25 23:32:28,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 803/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 6.2046556e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 23:32:28,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.42844 samples/s/p 1:40:00 } +2024-07-25 23:32:31,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 805/ 1625], loss: 1.395, per_step_time: 1471ms, lr: 6.1998753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:31,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43777 samples/s/p 1:39:47 } +2024-07-25 23:32:34,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 807/ 1625], loss: 1.243, per_step_time: 1474ms, lr: 6.1950996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:34,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.42672 samples/s/p 1:39:56 } +2024-07-25 23:32:37,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 809/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 6.19032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:37,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43889 samples/s/p 1:39:40 } +2024-07-25 23:32:40,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 811/ 1625], loss: 0.945, per_step_time: 1472ms, lr: 6.1855476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:40,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43247 samples/s/p 1:39:44 } +2024-07-25 23:32:43,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 813/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 6.180774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:43,667 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43680 samples/s/p 1:39:37 } +2024-07-25 23:32:46,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 815/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 6.1759993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:46,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43315 samples/s/p 1:39:38 } +2024-07-25 23:32:49,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 817/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 6.1712317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:49,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43549 samples/s/p 1:39:32 } +2024-07-25 23:32:52,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 819/ 1625], loss: 1.368, per_step_time: 1471ms, lr: 6.1664637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:52,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43814 samples/s/p 1:39:26 } +2024-07-25 23:32:55,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 821/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 6.1616947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:55,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.43856 samples/s/p 1:39:23 } +2024-07-25 23:32:58,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 823/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 6.1569326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:58,418 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 75.1% |█████████████████████████████████████ | 5.43711 samples/s/p 1:39:21 } +2024-07-25 23:33:01,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 825/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 6.1521696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:01,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.43824 samples/s/p 1:39:17 } +2024-07-25 23:33:04,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 827/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 6.1474075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:04,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.43402 samples/s/p 1:39:19 } +2024-07-25 23:33:07,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 829/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 6.142649e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:07,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.43227 samples/s/p 1:39:18 } +2024-07-25 23:33:10,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 831/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 6.13789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:10,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.43745 samples/s/p 1:39:09 } +2024-07-25 23:33:13,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 833/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 6.1331343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:13,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 
5.43092 samples/s/p 1:39:14 } +2024-07-25 23:33:16,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 835/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 6.128379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:16,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.44114 samples/s/p 1:38:59 } +2024-07-25 23:33:19,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 837/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 6.1236265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:19,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43556 samples/s/p 1:39:03 } +2024-07-25 23:33:22,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 839/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 6.118878e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:22,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43555 samples/s/p 1:39:00 } +2024-07-25 23:33:24,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 841/ 1625], loss: 1.097, per_step_time: 1473ms, lr: 6.1141263e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:24,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43033 samples/s/p 1:39:02 } +2024-07-25 23:33:27,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 843/ 1625], loss: 0.900, per_step_time: 1471ms, lr: 6.109379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:27,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43564 samples/s/p 1:38:54 } +2024-07-25 23:33:30,877 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 845/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 6.1046358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:30,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43461 samples/s/p 1:38:52 } +2024-07-25 23:33:33,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 847/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 6.099888e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:33,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43160 samples/s/p 1:38:52 } +2024-07-25 23:33:36,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 849/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 6.095147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:36,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43130 samples/s/p 1:38:50 } +2024-07-25 23:33:39,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 851/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 6.090408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:39,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43522 samples/s/p 1:38:42 } +2024-07-25 23:33:42,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 853/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 6.085667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:42,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.44181 samples/s/p 1:38:32 } +2024-07-25 23:33:45,629 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 8/ 10], step:[ 855/ 1625], loss: 1.099, per_step_time: 1470ms, lr: 6.0809325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:45,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.44046 samples/s/p 1:38:31 } +2024-07-25 23:33:48,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 857/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 6.076197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:48,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43623 samples/s/p 1:38:32 } +2024-07-25 23:33:51,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 859/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 6.071461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:51,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43847 samples/s/p 1:38:27 } +2024-07-25 23:33:54,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 861/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 6.0667317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:54,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43389 samples/s/p 1:38:29 } +2024-07-25 23:33:57,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 863/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 6.0620005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:57,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43416 samples/s/p 1:38:26 } +2024-07-25 23:34:00,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 865/ 1625], loss: 1.108, 
per_step_time: 1471ms, lr: 6.0572706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:00,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43626 samples/s/p 1:38:21 } +2024-07-25 23:34:03,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 867/ 1625], loss: 1.016, per_step_time: 1470ms, lr: 6.0525454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:03,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.44193 samples/s/p 1:38:12 } +2024-07-25 23:34:06,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 869/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 6.0478205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:06,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43812 samples/s/p 1:38:13 } +2024-07-25 23:34:09,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 871/ 1625], loss: 1.103, per_step_time: 1470ms, lr: 6.0430975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:09,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43894 samples/s/p 1:38:09 } +2024-07-25 23:34:12,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 873/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 6.038376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:12,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43641 samples/s/p 1:38:09 } +2024-07-25 23:34:15,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 875/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 6.033657e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 23:34:15,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43361 samples/s/p 1:38:09 } +2024-07-25 23:34:18,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 877/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 6.028938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:18,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43531 samples/s/p 1:38:04 } +2024-07-25 23:34:21,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 879/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 6.024223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:21,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43367 samples/s/p 1:38:03 } +2024-07-25 23:34:23,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 881/ 1625], loss: 0.951, per_step_time: 1471ms, lr: 6.019508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:23,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43617 samples/s/p 1:37:57 } +2024-07-25 23:34:26,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 883/ 1625], loss: 0.990, per_step_time: 1469ms, lr: 6.0147977e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:26,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.44237 samples/s/p 1:37:48 } +2024-07-25 23:34:29,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 885/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 6.0100842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:29,882 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.42834 samples/s/p 1:38:00 } +2024-07-25 23:34:32,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 887/ 1625], loss: 1.263, per_step_time: 1473ms, lr: 6.005375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:32,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.42765 samples/s/p 1:37:58 } +2024-07-25 23:34:35,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 889/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 6.0006705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:35,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43773 samples/s/p 1:37:44 } +2024-07-25 23:34:38,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 891/ 1625], loss: 1.047, per_step_time: 1473ms, lr: 5.995962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:38,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43013 samples/s/p 1:37:49 } +2024-07-25 23:34:41,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 893/ 1625], loss: 1.084, per_step_time: 1472ms, lr: 5.9912577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:41,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43112 samples/s/p 1:37:45 } +2024-07-25 23:34:44,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 895/ 1625], loss: 1.151, per_step_time: 1473ms, lr: 5.986558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:44,647 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 75.5% |█████████████████████████████████████ | 5.43021 samples/s/p 1:37:43 } +2024-07-25 23:34:47,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 897/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 5.9818544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:47,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43593 samples/s/p 1:37:34 } +2024-07-25 23:34:50,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 899/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 5.9771587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:50,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43289 samples/s/p 1:37:34 } +2024-07-25 23:34:53,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 901/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 5.9724625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:53,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43131 samples/s/p 1:37:33 } +2024-07-25 23:34:56,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 903/ 1625], loss: 1.016, per_step_time: 1471ms, lr: 5.9677636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:56,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43671 samples/s/p 1:37:24 } +2024-07-25 23:34:59,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 905/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 5.963073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:59,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 
5.43451 samples/s/p 1:37:24 } +2024-07-25 23:35:02,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 907/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 5.958381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:02,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43154 samples/s/p 1:37:24 } +2024-07-25 23:35:05,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 909/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 5.9536887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:05,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43575 samples/s/p 1:37:16 } +2024-07-25 23:35:08,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 911/ 1625], loss: 0.999, per_step_time: 1473ms, lr: 5.9490035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:08,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43008 samples/s/p 1:37:20 } +2024-07-25 23:35:11,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 913/ 1625], loss: 1.011, per_step_time: 1474ms, lr: 5.944317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:11,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.42660 samples/s/p 1:37:20 } +2024-07-25 23:35:14,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 915/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 5.9396325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:14,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43417 samples/s/p 1:37:09 } +2024-07-25 23:35:17,113 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 917/ 1625], loss: 1.195, per_step_time: 1469ms, lr: 5.93495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:17,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.44475 samples/s/p 1:36:55 } +2024-07-25 23:35:20,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 919/ 1625], loss: 1.008, per_step_time: 1470ms, lr: 5.930269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:20,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43961 samples/s/p 1:36:58 } +2024-07-25 23:35:23,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 921/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 5.92559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:23,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43375 samples/s/p 1:37:01 } +2024-07-25 23:35:25,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 923/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 5.9209115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:25,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43204 samples/s/p 1:37:00 } +2024-07-25 23:35:28,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 925/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 5.9162358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:28,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43434 samples/s/p 1:36:54 } +2024-07-25 23:35:31,866 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 8/ 10], step:[ 927/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 5.911562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:31,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43654 samples/s/p 1:36:49 } +2024-07-25 23:35:34,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 929/ 1625], loss: 1.176, per_step_time: 1472ms, lr: 5.90689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:34,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43361 samples/s/p 1:36:49 } +2024-07-25 23:35:37,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 931/ 1625], loss: 0.982, per_step_time: 1473ms, lr: 5.902219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:37,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43106 samples/s/p 1:36:49 } +2024-07-25 23:35:40,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 933/ 1625], loss: 1.223, per_step_time: 1474ms, lr: 5.897553e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:40,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.42730 samples/s/p 1:36:50 } +2024-07-25 23:35:43,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 935/ 1625], loss: 1.269, per_step_time: 1470ms, lr: 5.8928836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:43,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43910 samples/s/p 1:36:35 } +2024-07-25 23:35:46,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 937/ 1625], loss: 1.066, 
per_step_time: 1471ms, lr: 5.8882206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:46,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43731 samples/s/p 1:36:34 } +2024-07-25 23:35:49,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 939/ 1625], loss: 1.164, per_step_time: 1473ms, lr: 5.883558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:49,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43014 samples/s/p 1:36:38 } +2024-07-25 23:35:52,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 941/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 5.8788933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:52,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43161 samples/s/p 1:36:34 } +2024-07-25 23:35:55,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 943/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 5.8742357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:55,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43690 samples/s/p 1:36:25 } +2024-07-25 23:35:58,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 945/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 5.8695773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:58,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43246 samples/s/p 1:36:27 } +2024-07-25 23:36:01,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 947/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 5.8649184e-06, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 23:36:01,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43598 samples/s/p 1:36:20 } +2024-07-25 23:36:04,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 949/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 5.8602677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:04,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43419 samples/s/p 1:36:19 } +2024-07-25 23:36:07,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 951/ 1625], loss: 1.111, per_step_time: 1471ms, lr: 5.8556143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:07,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43518 samples/s/p 1:36:15 } +2024-07-25 23:36:10,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 953/ 1625], loss: 1.239, per_step_time: 1470ms, lr: 5.8509636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:10,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43857 samples/s/p 1:36:09 } +2024-07-25 23:36:13,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 955/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 5.8463143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:13,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43805 samples/s/p 1:36:06 } +2024-07-25 23:36:16,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 957/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 5.8416667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:16,137 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43207 samples/s/p 1:36:10 } +2024-07-25 23:36:19,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 959/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 5.8370215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:19,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43234 samples/s/p 1:36:06 } +2024-07-25 23:36:22,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 961/ 1625], loss: 1.304, per_step_time: 1472ms, lr: 5.8323767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:22,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43183 samples/s/p 1:36:04 } +2024-07-25 23:36:24,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 963/ 1625], loss: 1.170, per_step_time: 1474ms, lr: 5.8277355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:24,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.42606 samples/s/p 1:36:07 } +2024-07-25 23:36:27,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 965/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 5.8230953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:27,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43054 samples/s/p 1:36:00 } +2024-07-25 23:36:30,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 967/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 5.818457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:30,903 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.43335 samples/s/p 1:35:54 } +2024-07-25 23:36:33,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 969/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 5.8138203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:33,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.43952 samples/s/p 1:35:44 } +2024-07-25 23:36:36,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 971/ 1625], loss: 1.117, per_step_time: 1470ms, lr: 5.809185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:36,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.44028 samples/s/p 1:35:40 } +2024-07-25 23:36:39,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 973/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 5.8045516e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:39,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.43719 samples/s/p 1:35:41 } +2024-07-25 23:36:42,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 975/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 5.799921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:42,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.43271 samples/s/p 1:35:42 } +2024-07-25 23:36:45,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 977/ 1625], loss: 1.011, per_step_time: 1472ms, lr: 5.795291e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:45,653 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 76.0% |██████████████████████████████████████ | 5.43444 samples/s/p 1:35:38 } +2024-07-25 23:36:48,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 979/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 5.790663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:48,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.43552 samples/s/p 1:35:34 } +2024-07-25 23:36:51,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 981/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 5.78604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:51,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.43543 samples/s/p 1:35:31 } +2024-07-25 23:36:54,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 983/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 5.7814163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:54,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.43611 samples/s/p 1:35:27 } +2024-07-25 23:36:57,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 985/ 1625], loss: 1.071, per_step_time: 1470ms, lr: 5.7767907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:57,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.44190 samples/s/p 1:35:18 } +2024-07-25 23:37:00,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 987/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 5.7721727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:00,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ 
| 5.43647 samples/s/p 1:35:21 } +2024-07-25 23:37:03,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 989/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 5.7675543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:03,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.43645 samples/s/p 1:35:18 } +2024-07-25 23:37:06,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 991/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 5.7629345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:06,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.43648 samples/s/p 1:35:15 } +2024-07-25 23:37:09,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 993/ 1625], loss: 1.059, per_step_time: 1472ms, lr: 5.758322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:09,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.43315 samples/s/p 1:35:16 } +2024-07-25 23:37:12,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 995/ 1625], loss: 1.058, per_step_time: 1469ms, lr: 5.7537086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:12,200 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.44326 samples/s/p 1:35:02 } +2024-07-25 23:37:15,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 997/ 1625], loss: 1.046, per_step_time: 1473ms, lr: 5.749097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:15,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.42797 samples/s/p 1:35:15 } +2024-07-25 
23:37:18,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 999/ 1625], loss: 1.326, per_step_time: 1472ms, lr: 5.7444868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:18,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.43425 samples/s/p 1:35:06 } +2024-07-25 23:37:21,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1001/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 5.7398797e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:21,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.43968 samples/s/p 1:34:57 } +2024-07-25 23:37:24,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1003/ 1625], loss: 0.999, per_step_time: 1470ms, lr: 5.735274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:24,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.44102 samples/s/p 1:34:53 } +2024-07-25 23:37:26,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1005/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 5.730669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:26,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.43806 samples/s/p 1:34:53 } +2024-07-25 23:37:29,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1007/ 1625], loss: 1.062, per_step_time: 1472ms, lr: 5.726067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:29,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.43302 samples/s/p 1:34:55 } +2024-07-25 23:37:32,857 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1009/ 1625], loss: 1.149, per_step_time: 1473ms, lr: 5.7214656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:32,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.42992 samples/s/p 1:34:55 } +2024-07-25 23:37:35,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1011/ 1625], loss: 1.017, per_step_time: 1469ms, lr: 5.716867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:35,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.44259 samples/s/p 1:34:39 } +2024-07-25 23:37:38,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1013/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 5.7122697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:38,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.43588 samples/s/p 1:34:43 } +2024-07-25 23:37:41,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1015/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 5.7076745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:41,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.43536 samples/s/p 1:34:41 } +2024-07-25 23:37:44,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1017/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 5.7030807e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:44,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43399 samples/s/p 1:34:39 } +2024-07-25 23:37:47,609 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1019/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 5.698489e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:47,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43054 samples/s/p 1:34:40 } +2024-07-25 23:37:50,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1021/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 5.693899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:50,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43680 samples/s/p 1:34:30 } +2024-07-25 23:37:53,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1023/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 5.6893105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:53,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43622 samples/s/p 1:34:28 } +2024-07-25 23:37:56,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1025/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 5.684727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:56,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43445 samples/s/p 1:34:27 } +2024-07-25 23:37:59,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1027/ 1625], loss: 0.913, per_step_time: 1475ms, lr: 5.6801396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:59,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.42369 samples/s/p 1:34:35 } +2024-07-25 23:38:02,372 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1029/ 1625], loss: 1.008, per_step_time: 1473ms, lr: 5.675557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:02,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.42832 samples/s/p 1:34:28 } +2024-07-25 23:38:05,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1031/ 1625], loss: 1.226, per_step_time: 1474ms, lr: 5.670979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:05,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.42656 samples/s/p 1:34:26 } +2024-07-25 23:38:08,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1033/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 5.6663994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:08,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43788 samples/s/p 1:34:12 } +2024-07-25 23:38:11,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1035/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 5.6618196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:11,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43633 samples/s/p 1:34:10 } +2024-07-25 23:38:14,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1037/ 1625], loss: 1.022, per_step_time: 1470ms, lr: 5.6572476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:14,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.44071 samples/s/p 1:34:03 } +2024-07-25 23:38:17,128 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1039/ 1625], loss: 1.094, per_step_time: 1473ms, lr: 5.652674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:17,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43002 samples/s/p 1:34:11 } +2024-07-25 23:38:20,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1041/ 1625], loss: 1.030, per_step_time: 1470ms, lr: 5.648102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:20,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43880 samples/s/p 1:33:59 } +2024-07-25 23:38:23,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1043/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 5.643532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:23,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43704 samples/s/p 1:33:58 } +2024-07-25 23:38:25,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1045/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 5.6389636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:25,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43619 samples/s/p 1:33:56 } +2024-07-25 23:38:28,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1047/ 1625], loss: 0.976, per_step_time: 1471ms, lr: 5.6343974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:28,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43564 samples/s/p 1:33:53 } +2024-07-25 23:38:31,879 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1049/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 5.629833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:31,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43481 samples/s/p 1:33:51 } +2024-07-25 23:38:34,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1051/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 5.6252698e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:34,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43345 samples/s/p 1:33:50 } +2024-07-25 23:38:37,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1053/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 5.620709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:37,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43560 samples/s/p 1:33:45 } +2024-07-25 23:38:40,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1055/ 1625], loss: 1.000, per_step_time: 1471ms, lr: 5.616151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:40,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43774 samples/s/p 1:33:39 } +2024-07-25 23:38:43,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1057/ 1625], loss: 0.878, per_step_time: 1473ms, lr: 5.6115937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:43,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43085 samples/s/p 1:33:44 } +2024-07-25 23:38:46,635 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1059/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 5.607038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:46,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43591 samples/s/p 1:33:35 } +2024-07-25 23:38:49,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1061/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 5.602484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:49,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43611 samples/s/p 1:33:32 } +2024-07-25 23:38:52,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1063/ 1625], loss: 1.260, per_step_time: 1470ms, lr: 5.597932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:52,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.44057 samples/s/p 1:33:25 } +2024-07-25 23:38:55,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1065/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 5.593383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:55,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.44004 samples/s/p 1:33:22 } +2024-07-25 23:38:58,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1067/ 1625], loss: 1.397, per_step_time: 1472ms, lr: 5.588834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:58,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.43283 samples/s/p 1:33:27 } +2024-07-25 23:39:01,395 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1069/ 1625], loss: 1.022, per_step_time: 1476ms, lr: 5.5842916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:01,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.41770 samples/s/p 1:33:40 } +2024-07-25 23:39:04,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1071/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 5.5797436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:04,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.43682 samples/s/p 1:33:17 } +2024-07-25 23:39:07,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1073/ 1625], loss: 1.202, per_step_time: 1473ms, lr: 5.575201e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:07,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.43058 samples/s/p 1:33:20 } +2024-07-25 23:39:10,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1075/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 5.570663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:10,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.43538 samples/s/p 1:33:12 } +2024-07-25 23:39:13,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1077/ 1625], loss: 1.080, per_step_time: 1470ms, lr: 5.566121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:13,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.43969 samples/s/p 1:33:05 } +2024-07-25 23:39:16,150 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1079/ 1625], loss: 1.103, per_step_time: 1473ms, lr: 5.5615847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:16,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.42998 samples/s/p 1:33:12 } +2024-07-25 23:39:19,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1081/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 5.5570517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:19,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.44002 samples/s/p 1:32:59 } +2024-07-25 23:39:22,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1083/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 5.5525184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:22,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43466 samples/s/p 1:33:01 } +2024-07-25 23:39:24,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1085/ 1625], loss: 0.930, per_step_time: 1469ms, lr: 5.5479873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:24,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.44224 samples/s/p 1:32:51 } +2024-07-25 23:39:27,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1087/ 1625], loss: 0.904, per_step_time: 1471ms, lr: 5.5434575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:27,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43676 samples/s/p 1:32:53 } +2024-07-25 23:39:30,896 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1089/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 5.5389296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:30,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43795 samples/s/p 1:32:49 } +2024-07-25 23:39:33,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1091/ 1625], loss: 1.421, per_step_time: 1471ms, lr: 5.5344026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:33,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43763 samples/s/p 1:32:47 } +2024-07-25 23:39:36,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1093/ 1625], loss: 1.225, per_step_time: 1473ms, lr: 5.5298788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:36,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43087 samples/s/p 1:32:51 } +2024-07-25 23:39:39,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1095/ 1625], loss: 1.285, per_step_time: 1471ms, lr: 5.5253563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:39,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43696 samples/s/p 1:32:41 } +2024-07-25 23:39:42,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1097/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 5.520836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:42,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43742 samples/s/p 1:32:38 } +2024-07-25 23:39:45,650 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1099/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 5.516317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:45,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43364 samples/s/p 1:32:39 } +2024-07-25 23:39:48,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1101/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 5.5118003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:48,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43064 samples/s/p 1:32:39 } +2024-07-25 23:39:51,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1103/ 1625], loss: 1.177, per_step_time: 1474ms, lr: 5.507285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:51,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.42674 samples/s/p 1:32:40 } +2024-07-25 23:39:54,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1105/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 5.502772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:54,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43506 samples/s/p 1:32:29 } +2024-07-25 23:39:57,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1107/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 5.4982634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:57,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43241 samples/s/p 1:32:28 } +2024-07-25 23:40:00,413 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1109/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 5.493752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:00,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43347 samples/s/p 1:32:24 } +2024-07-25 23:40:03,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1111/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 5.489244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:03,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43823 samples/s/p 1:32:17 } +2024-07-25 23:40:06,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1113/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 5.484741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:06,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43317 samples/s/p 1:32:19 } +2024-07-25 23:40:09,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1115/ 1625], loss: 1.126, per_step_time: 1470ms, lr: 5.4802344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:09,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.44129 samples/s/p 1:32:08 } +2024-07-25 23:40:12,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1117/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 5.475732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:12,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43824 samples/s/p 1:32:08 } +2024-07-25 23:40:15,162 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1119/ 1625], loss: 1.333, per_step_time: 1471ms, lr: 5.471234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:15,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43488 samples/s/p 1:32:08 } +2024-07-25 23:40:18,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1121/ 1625], loss: 0.987, per_step_time: 1472ms, lr: 5.466733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:18,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43349 samples/s/p 1:32:07 } +2024-07-25 23:40:21,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1123/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 5.4622396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:21,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43510 samples/s/p 1:32:02 } +2024-07-25 23:40:24,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1125/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 5.4577445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:24,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.44018 samples/s/p 1:31:54 } +2024-07-25 23:40:26,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1127/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 5.4532497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:26,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43720 samples/s/p 1:31:54 } +2024-07-25 23:40:29,913 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1129/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 5.4487605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:29,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43389 samples/s/p 1:31:55 } +2024-07-25 23:40:32,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1131/ 1625], loss: 1.124, per_step_time: 1473ms, lr: 5.4442717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:32,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43047 samples/s/p 1:31:55 } +2024-07-25 23:40:35,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1133/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 5.439784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:35,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43335 samples/s/p 1:31:49 } +2024-07-25 23:40:38,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1135/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 5.4352986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:38,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43335 samples/s/p 1:31:46 } +2024-07-25 23:40:41,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1137/ 1625], loss: 1.360, per_step_time: 1470ms, lr: 5.430815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:41,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43932 samples/s/p 1:31:37 } +2024-07-25 23:40:44,672 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1139/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 5.4263337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:44,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43089 samples/s/p 1:31:43 } +2024-07-25 23:40:47,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1141/ 1625], loss: 1.304, per_step_time: 1469ms, lr: 5.4218544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:47,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.44303 samples/s/p 1:31:28 } +2024-07-25 23:40:50,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1143/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 5.4173765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:50,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43810 samples/s/p 1:31:30 } +2024-07-25 23:40:53,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1145/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 5.4129005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:53,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43635 samples/s/p 1:31:28 } +2024-07-25 23:40:56,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1147/ 1625], loss: 1.098, per_step_time: 1476ms, lr: 5.4084253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:56,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.41852 samples/s/p 1:31:44 } +2024-07-25 23:40:59,429 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1149/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 5.4039533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:59,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43461 samples/s/p 1:31:24 } +2024-07-25 23:41:02,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1151/ 1625], loss: 1.111, per_step_time: 1473ms, lr: 5.3994845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:02,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43085 samples/s/p 1:31:25 } +2024-07-25 23:41:05,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1153/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 5.3950143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:05,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43680 samples/s/p 1:31:16 } +2024-07-25 23:41:08,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1155/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 5.390547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:08,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.42905 samples/s/p 1:31:21 } +2024-07-25 23:41:11,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1157/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 5.386085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:11,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43450 samples/s/p 1:31:13 } +2024-07-25 23:41:14,187 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1159/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 5.3816193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:14,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43915 samples/s/p 1:31:05 } +2024-07-25 23:41:17,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1161/ 1625], loss: 1.161, per_step_time: 1470ms, lr: 5.377158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:17,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43935 samples/s/p 1:31:02 } +2024-07-25 23:41:20,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1163/ 1625], loss: 1.136, per_step_time: 1470ms, lr: 5.372701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:20,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43916 samples/s/p 1:30:59 } +2024-07-25 23:41:23,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1165/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 5.368241e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:23,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43350 samples/s/p 1:31:02 } +2024-07-25 23:41:25,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1167/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 5.363788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:25,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43493 samples/s/p 1:30:58 } +2024-07-25 23:41:28,936 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1169/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 5.359334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:28,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43751 samples/s/p 1:30:52 } +2024-07-25 23:41:31,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1171/ 1625], loss: 1.167, per_step_time: 1470ms, lr: 5.3548797e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:31,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43956 samples/s/p 1:30:47 } +2024-07-25 23:41:34,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1173/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 5.350432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:34,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43205 samples/s/p 1:30:52 } +2024-07-25 23:41:37,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1175/ 1625], loss: 1.012, per_step_time: 1471ms, lr: 5.3459844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:37,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43496 samples/s/p 1:30:46 } +2024-07-25 23:41:40,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1177/ 1625], loss: 1.123, per_step_time: 1473ms, lr: 5.341535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:40,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43093 samples/s/p 1:30:47 } +2024-07-25 23:41:43,691 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1179/ 1625], loss: 1.292, per_step_time: 1471ms, lr: 5.3370936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:43,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43670 samples/s/p 1:30:38 } +2024-07-25 23:41:46,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1181/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 5.3326517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:46,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43081 samples/s/p 1:30:41 } +2024-07-25 23:41:49,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1183/ 1625], loss: 1.112, per_step_time: 1474ms, lr: 5.328211e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:49,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.42466 samples/s/p 1:30:44 } +2024-07-25 23:41:52,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1185/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 5.323772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:52,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43822 samples/s/p 1:30:28 } +2024-07-25 23:41:55,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1187/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 5.319335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:55,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43583 samples/s/p 1:30:27 } +2024-07-25 23:41:58,452 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1189/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 5.3149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:58,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43488 samples/s/p 1:30:25 } +2024-07-25 23:42:01,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1191/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 5.3104673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:01,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43173 samples/s/p 1:30:25 } +2024-07-25 23:42:04,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1193/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 5.306036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:04,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43218 samples/s/p 1:30:22 } +2024-07-25 23:42:07,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1195/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 5.301609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:07,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43488 samples/s/p 1:30:16 } +2024-07-25 23:42:10,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1197/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 5.2971795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:10,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43698 samples/s/p 1:30:11 } +2024-07-25 23:42:13,207 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1199/ 1625], loss: 1.058, per_step_time: 1471ms, lr: 5.2927535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:13,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43764 samples/s/p 1:30:08 } +2024-07-25 23:42:16,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1201/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 5.288333e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:16,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43946 samples/s/p 1:30:03 } +2024-07-25 23:42:19,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1203/ 1625], loss: 1.358, per_step_time: 1473ms, lr: 5.2839086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:19,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.42998 samples/s/p 1:30:09 } +2024-07-25 23:42:22,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1205/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 5.2794885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:22,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43598 samples/s/p 1:30:01 } +2024-07-25 23:42:25,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1207/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 5.275073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:25,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43464 samples/s/p 1:29:59 } +2024-07-25 23:42:27,961 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1209/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 5.270654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:27,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43545 samples/s/p 1:29:55 } +2024-07-25 23:42:30,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1211/ 1625], loss: 0.974, per_step_time: 1474ms, lr: 5.266243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:30,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.42387 samples/s/p 1:30:04 } +2024-07-25 23:42:33,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1213/ 1625], loss: 1.045, per_step_time: 1471ms, lr: 5.2618298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:33,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43739 samples/s/p 1:29:47 } +2024-07-25 23:42:36,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1215/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 5.257417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43534 samples/s/p 1:29:46 } +2024-07-25 23:42:39,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1217/ 1625], loss: 0.947, per_step_time: 1471ms, lr: 5.253011e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:39,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43528 samples/s/p 1:29:44 } +2024-07-25 23:42:42,722 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1219/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 5.248604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:42,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43197 samples/s/p 1:29:44 } +2024-07-25 23:42:45,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1221/ 1625], loss: 1.082, per_step_time: 1473ms, lr: 5.244197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:45,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.42832 samples/s/p 1:29:45 } +2024-07-25 23:42:48,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1223/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 5.2397972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:48,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43056 samples/s/p 1:29:39 } +2024-07-25 23:42:51,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1225/ 1625], loss: 1.260, per_step_time: 1473ms, lr: 5.2353953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:51,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.42968 samples/s/p 1:29:37 } +2024-07-25 23:42:51,585 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 23:43:27,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1227/ 1625], loss: 0.972, per_step_time: 1948ms, lr: 5.230997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:27,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 4.10672 samples/s/p 1:58:26 } +2024-07-25 23:43:30,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1229/ 1625], loss: 1.169, per_step_time: 1473ms, lr: 5.226599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:30,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.42943 samples/s/p 1:29:32 } +2024-07-25 23:43:33,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1231/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 5.222204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:33,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43431 samples/s/p 1:29:24 } +2024-07-25 23:43:36,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1233/ 1625], loss: 1.239, per_step_time: 1473ms, lr: 5.21781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:36,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.42945 samples/s/p 1:29:26 } +2024-07-25 23:43:39,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1235/ 1625], loss: 0.976, per_step_time: 1472ms, lr: 5.2134196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:39,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43259 samples/s/p 1:29:20 } +2024-07-25 23:43:41,997 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1237/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 5.20903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:41,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43301 samples/s/p 1:29:16 } +2024-07-25 23:43:44,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1239/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 5.204644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:44,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43729 samples/s/p 1:29:09 } +2024-07-25 23:43:47,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1241/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 5.200256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:47,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43652 samples/s/p 1:29:07 } +2024-07-25 23:43:50,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1243/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 5.1958723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:50,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.42994 samples/s/p 1:29:11 } +2024-07-25 23:43:53,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1245/ 1625], loss: 0.898, per_step_time: 1471ms, lr: 5.1914926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:53,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43655 samples/s/p 1:29:01 } +2024-07-25 23:43:56,751 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1247/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 5.1871107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:56,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43580 samples/s/p 1:28:59 } +2024-07-25 23:43:59,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1249/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 5.1827324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:59,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43604 samples/s/p 1:28:56 } +2024-07-25 23:44:02,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1251/ 1625], loss: 1.108, per_step_time: 1476ms, lr: 5.178358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:02,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.41796 samples/s/p 1:29:11 } +2024-07-25 23:44:05,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1253/ 1625], loss: 1.395, per_step_time: 1473ms, lr: 5.1739808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:05,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43019 samples/s/p 1:28:56 } +2024-07-25 23:44:08,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1255/ 1625], loss: 1.357, per_step_time: 1470ms, lr: 5.169611e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:08,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43879 samples/s/p 1:28:44 } +2024-07-25 23:44:11,515 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1257/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 5.1652405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:11,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43535 samples/s/p 1:28:45 } +2024-07-25 23:44:14,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1259/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 5.1608695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:14,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43931 samples/s/p 1:28:38 } +2024-07-25 23:44:17,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1261/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 5.1565053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:17,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43551 samples/s/p 1:28:39 } +2024-07-25 23:44:20,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1263/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 5.1521397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:20,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43531 samples/s/p 1:28:36 } +2024-07-25 23:44:23,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1265/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 5.147777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:23,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.44098 samples/s/p 1:28:27 } +2024-07-25 23:44:26,267 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1267/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 5.143416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:26,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.42871 samples/s/p 1:28:36 } +2024-07-25 23:44:29,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1269/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 5.1390575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:29,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.44144 samples/s/p 1:28:21 } +2024-07-25 23:44:32,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1271/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 5.1346997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:32,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43737 samples/s/p 1:28:22 } +2024-07-25 23:44:35,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1273/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 5.1303446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:35,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43576 samples/s/p 1:28:21 } +2024-07-25 23:44:38,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1275/ 1625], loss: 1.031, per_step_time: 1471ms, lr: 5.1259904e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:38,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43674 samples/s/p 1:28:17 } +2024-07-25 23:44:41,019 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1277/ 1625], loss: 1.221, per_step_time: 1473ms, lr: 5.12164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:41,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.42845 samples/s/p 1:28:22 } +2024-07-25 23:44:43,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1279/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 5.1172897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:43,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.43394 samples/s/p 1:28:14 } +2024-07-25 23:44:46,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1281/ 1625], loss: 1.144, per_step_time: 1472ms, lr: 5.1129427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:46,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.43122 samples/s/p 1:28:13 } +2024-07-25 23:44:49,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1283/ 1625], loss: 0.895, per_step_time: 1471ms, lr: 5.108599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:49,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.43840 samples/s/p 1:28:03 } +2024-07-25 23:44:52,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1285/ 1625], loss: 1.070, per_step_time: 1470ms, lr: 5.1042534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:53,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.43978 samples/s/p 1:27:59 } +2024-07-25 23:44:56,468 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1287/ 1625], loss: 1.298, per_step_time: 1475ms, lr: 5.099911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:56,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.42368 samples/s/p 1:28:12 } +2024-07-25 23:44:59,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1289/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 5.095573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:59,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.43362 samples/s/p 1:27:59 } +2024-07-25 23:45:02,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1291/ 1625], loss: 1.193, per_step_time: 1475ms, lr: 5.091233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:02,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.42110 samples/s/p 1:28:08 } +2024-07-25 23:45:05,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1293/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 5.086899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:05,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.43120 samples/s/p 1:27:56 } +2024-07-25 23:45:08,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1295/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 5.082565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:08,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.44150 samples/s/p 1:27:43 } +2024-07-25 23:45:11,232 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1297/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 5.07823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:11,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.43223 samples/s/p 1:27:49 } +2024-07-25 23:45:14,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1299/ 1625], loss: 1.252, per_step_time: 1475ms, lr: 5.073902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:14,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.42267 samples/s/p 1:27:55 } +2024-07-25 23:45:17,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1301/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 5.0695744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:17,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.43578 samples/s/p 1:27:39 } +2024-07-25 23:45:20,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1303/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 5.0652447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:20,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.43365 samples/s/p 1:27:39 } +2024-07-25 23:45:23,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1305/ 1625], loss: 1.104, per_step_time: 1470ms, lr: 5.0609233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:23,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.43851 samples/s/p 1:27:31 } +2024-07-25 23:45:25,997 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1307/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 5.0566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:25,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.44033 samples/s/p 1:27:26 } +2024-07-25 23:45:28,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1309/ 1625], loss: 1.139, per_step_time: 1477ms, lr: 5.05228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:28,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.41409 samples/s/p 1:27:49 } +2024-07-25 23:45:31,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1311/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 5.0479603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:31,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43462 samples/s/p 1:27:26 } +2024-07-25 23:45:34,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1313/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 5.043644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:34,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43133 samples/s/p 1:27:26 } +2024-07-25 23:45:37,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1315/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 5.0393287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:37,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.42971 samples/s/p 1:27:25 } +2024-07-25 23:45:40,770 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1317/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 5.035016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:40,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43289 samples/s/p 1:27:19 } +2024-07-25 23:45:43,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1319/ 1625], loss: 1.213, per_step_time: 1473ms, lr: 5.030705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:43,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.42815 samples/s/p 1:27:20 } +2024-07-25 23:45:46,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1321/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 5.0263957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:46,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43014 samples/s/p 1:27:15 } +2024-07-25 23:45:49,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1323/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 5.0220883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:49,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43793 samples/s/p 1:27:05 } +2024-07-25 23:45:52,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1325/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 5.017783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:52,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.43261 samples/s/p 1:27:07 } +2024-07-25 23:45:55,534 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1327/ 1625], loss: 1.387, per_step_time: 1473ms, lr: 5.01348e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:55,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.42753 samples/s/p 1:27:09 } +2024-07-25 23:45:58,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1329/ 1625], loss: 1.257, per_step_time: 1473ms, lr: 5.0091776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:58,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.42802 samples/s/p 1:27:06 } +2024-07-25 23:46:01,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1331/ 1625], loss: 1.132, per_step_time: 1473ms, lr: 5.004879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:01,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.42844 samples/s/p 1:27:02 } +2024-07-25 23:46:04,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1333/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 5.000584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:04,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.43303 samples/s/p 1:26:55 } +2024-07-25 23:46:07,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1335/ 1625], loss: 1.113, per_step_time: 1474ms, lr: 4.9962855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:07,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.42514 samples/s/p 1:27:00 } +2024-07-25 23:46:10,304 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1337/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 4.9919945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:10,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.43539 samples/s/p 1:26:47 } +2024-07-25 23:46:13,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1339/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 4.9877026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:13,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.43354 samples/s/p 1:26:46 } +2024-07-25 23:46:16,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1341/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 4.9834107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:16,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43784 samples/s/p 1:26:39 } +2024-07-25 23:46:19,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1343/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 4.9791247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:19,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.42934 samples/s/p 1:26:44 } +2024-07-25 23:46:22,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1345/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 4.9748396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:22,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43668 samples/s/p 1:26:34 } +2024-07-25 23:46:25,061 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1347/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 4.9705527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:25,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43544 samples/s/p 1:26:32 } +2024-07-25 23:46:28,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1349/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 4.966273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:28,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43304 samples/s/p 1:26:31 } +2024-07-25 23:46:30,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1351/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 4.961993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:30,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43290 samples/s/p 1:26:29 } +2024-07-25 23:46:33,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1353/ 1625], loss: 1.288, per_step_time: 1471ms, lr: 4.957715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:33,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43791 samples/s/p 1:26:21 } +2024-07-25 23:46:36,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1355/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 4.9534397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:36,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43665 samples/s/p 1:26:19 } +2024-07-25 23:46:39,818 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1357/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 4.949165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:39,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43096 samples/s/p 1:26:22 } +2024-07-25 23:46:42,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1359/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 4.9448927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:42,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43889 samples/s/p 1:26:11 } +2024-07-25 23:46:45,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1361/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 4.9406226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:45,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43802 samples/s/p 1:26:09 } +2024-07-25 23:46:48,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1363/ 1625], loss: 1.276, per_step_time: 1472ms, lr: 4.936354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:48,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43463 samples/s/p 1:26:09 } +2024-07-25 23:46:51,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1365/ 1625], loss: 1.171, per_step_time: 1470ms, lr: 4.932088e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:51,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43986 samples/s/p 1:26:01 } +2024-07-25 23:46:54,569 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1367/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 4.9278233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:54,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43188 samples/s/p 1:26:06 } +2024-07-25 23:46:57,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1369/ 1625], loss: 1.018, per_step_time: 1471ms, lr: 4.92356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:57,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43555 samples/s/p 1:26:00 } +2024-07-25 23:47:00,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1371/ 1625], loss: 1.051, per_step_time: 1473ms, lr: 4.919299e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:00,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43071 samples/s/p 1:26:01 } +2024-07-25 23:47:03,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1373/ 1625], loss: 1.125, per_step_time: 1483ms, lr: 4.915041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:03,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.39403 samples/s/p 1:26:33 } +2024-07-25 23:47:06,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1375/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 4.9107844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:06,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43896 samples/s/p 1:25:48 } +2024-07-25 23:47:09,348 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1377/ 1625], loss: 1.025, per_step_time: 1472ms, lr: 4.9065297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:09,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43158 samples/s/p 1:25:52 } +2024-07-25 23:47:12,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1379/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 4.9022765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:12,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43233 samples/s/p 1:25:48 } +2024-07-25 23:47:15,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1381/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 4.8980287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:15,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43807 samples/s/p 1:25:40 } +2024-07-25 23:47:18,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1383/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 4.8937773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:18,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43420 samples/s/p 1:25:40 } +2024-07-25 23:47:21,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1385/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 4.8895304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:21,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43510 samples/s/p 1:25:36 } +2024-07-25 23:47:24,106 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1387/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 4.8852876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:24,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.42968 samples/s/p 1:25:39 } +2024-07-25 23:47:27,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1389/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 4.881045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:27,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43615 samples/s/p 1:25:30 } +2024-07-25 23:47:30,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1391/ 1625], loss: 1.335, per_step_time: 1473ms, lr: 4.8768015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:30,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43010 samples/s/p 1:25:32 } +2024-07-25 23:47:32,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1393/ 1625], loss: 1.173, per_step_time: 1473ms, lr: 4.8725647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:32,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43040 samples/s/p 1:25:29 } +2024-07-25 23:47:35,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1395/ 1625], loss: 1.056, per_step_time: 1470ms, lr: 4.8683273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:35,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.44109 samples/s/p 1:25:16 } +2024-07-25 23:47:38,859 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1397/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 4.8640923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:38,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43980 samples/s/p 1:25:14 } +2024-07-25 23:47:41,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1399/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 4.85986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:41,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43163 samples/s/p 1:25:19 } +2024-07-25 23:47:44,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1401/ 1625], loss: 1.302, per_step_time: 1472ms, lr: 4.8556276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:44,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43111 samples/s/p 1:25:17 } +2024-07-25 23:47:47,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1403/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 4.851399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:47,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43257 samples/s/p 1:25:12 } +2024-07-25 23:47:50,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1405/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 4.8471716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:50,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43458 samples/s/p 1:25:08 } +2024-07-25 23:47:53,621 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1407/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 4.8429465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:53,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43248 samples/s/p 1:25:07 } +2024-07-25 23:47:56,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1409/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 4.8387237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:56,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43761 samples/s/p 1:24:59 } +2024-07-25 23:47:59,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1411/ 1625], loss: 1.067, per_step_time: 1471ms, lr: 4.8345014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:59,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43601 samples/s/p 1:24:57 } +2024-07-25 23:48:02,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1413/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 4.8302823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:02,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43480 samples/s/p 1:24:56 } +2024-07-25 23:48:05,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1415/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 4.8260645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:05,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43925 samples/s/p 1:24:48 } +2024-07-25 23:48:08,373 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1417/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 4.8218494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:08,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43368 samples/s/p 1:24:51 } +2024-07-25 23:48:11,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1419/ 1625], loss: 1.362, per_step_time: 1471ms, lr: 4.817638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:11,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43620 samples/s/p 1:24:45 } +2024-07-25 23:48:14,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1421/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 4.8134248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:14,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43721 samples/s/p 1:24:42 } +2024-07-25 23:48:17,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1423/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 4.809215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:17,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43613 samples/s/p 1:24:40 } +2024-07-25 23:48:20,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1425/ 1625], loss: 0.984, per_step_time: 1472ms, lr: 4.8050097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:20,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43442 samples/s/p 1:24:38 } +2024-07-25 23:48:23,125 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1427/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 4.8008023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:23,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43628 samples/s/p 1:24:34 } +2024-07-25 23:48:26,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1429/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 4.796598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:26,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43440 samples/s/p 1:24:32 } +2024-07-25 23:48:29,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1431/ 1625], loss: 0.991, per_step_time: 1470ms, lr: 4.792399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:29,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.44084 samples/s/p 1:24:23 } +2024-07-25 23:48:31,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1433/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 4.7881967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:31,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43566 samples/s/p 1:24:25 } +2024-07-25 23:48:34,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1435/ 1625], loss: 1.359, per_step_time: 1471ms, lr: 4.7840017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:34,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43593 samples/s/p 1:24:22 } +2024-07-25 23:48:37,876 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1437/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 4.7798057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:37,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43593 samples/s/p 1:24:19 } +2024-07-25 23:48:40,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1439/ 1625], loss: 0.954, per_step_time: 1473ms, lr: 4.775612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:40,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.42959 samples/s/p 1:24:22 } +2024-07-25 23:48:43,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1441/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 4.7714207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:43,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43195 samples/s/p 1:24:17 } +2024-07-25 23:48:46,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1443/ 1625], loss: 1.316, per_step_time: 1473ms, lr: 4.7672306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:46,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43073 samples/s/p 1:24:15 } +2024-07-25 23:48:49,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1445/ 1625], loss: 1.288, per_step_time: 1474ms, lr: 4.7630424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:49,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.42734 samples/s/p 1:24:15 } +2024-07-25 23:48:52,640 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1447/ 1625], loss: 1.345, per_step_time: 1471ms, lr: 4.758857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:52,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43731 samples/s/p 1:24:03 } +2024-07-25 23:48:55,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1449/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 4.7546737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:55,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43025 samples/s/p 1:24:07 } +2024-07-25 23:48:58,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1451/ 1625], loss: 1.057, per_step_time: 1473ms, lr: 4.7504914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:58,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43055 samples/s/p 1:24:04 } +2024-07-25 23:49:01,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1453/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 4.746311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:01,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.42935 samples/s/p 1:24:02 } +2024-07-25 23:49:04,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1455/ 1625], loss: 0.988, per_step_time: 1470ms, lr: 4.742134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:04,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.43895 samples/s/p 1:23:50 } +2024-07-25 23:49:07,399 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1457/ 1625], loss: 1.376, per_step_time: 1471ms, lr: 4.737958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:07,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.43820 samples/s/p 1:23:48 } +2024-07-25 23:49:10,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1459/ 1625], loss: 1.180, per_step_time: 1475ms, lr: 4.7337835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:10,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.42198 samples/s/p 1:24:00 } +2024-07-25 23:49:13,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1461/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 4.7296116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:13,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.43493 samples/s/p 1:23:45 } +2024-07-25 23:49:16,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1463/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 4.7254443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:16,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.43965 samples/s/p 1:23:37 } +2024-07-25 23:49:19,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1465/ 1625], loss: 1.030, per_step_time: 1470ms, lr: 4.721274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:19,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.44063 samples/s/p 1:23:34 } +2024-07-25 23:49:22,151 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1467/ 1625], loss: 1.141, per_step_time: 1469ms, lr: 4.7171084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:22,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.44316 samples/s/p 1:23:28 } +2024-07-25 23:49:25,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1469/ 1625], loss: 1.019, per_step_time: 1469ms, lr: 4.712947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:25,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.44378 samples/s/p 1:23:25 } +2024-07-25 23:49:28,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1471/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 4.708782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:28,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43641 samples/s/p 1:23:29 } +2024-07-25 23:49:31,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1473/ 1625], loss: 1.039, per_step_time: 1475ms, lr: 4.7046224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:31,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.42299 samples/s/p 1:23:38 } +2024-07-25 23:49:33,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1475/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 4.700467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:33,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.42977 samples/s/p 1:23:29 } +2024-07-25 23:49:36,912 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1477/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 4.6963078e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:36,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43169 samples/s/p 1:23:24 } +2024-07-25 23:49:39,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1479/ 1625], loss: 1.274, per_step_time: 1471ms, lr: 4.692157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:39,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43707 samples/s/p 1:23:16 } +2024-07-25 23:49:42,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1481/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 4.688005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:42,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43202 samples/s/p 1:23:18 } +2024-07-25 23:49:45,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1483/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 4.6838522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:45,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43652 samples/s/p 1:23:11 } +2024-07-25 23:49:48,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1485/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 4.6797063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:48,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43298 samples/s/p 1:23:11 } +2024-07-25 23:49:51,671 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1487/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 4.6755604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:51,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.42870 samples/s/p 1:23:12 } +2024-07-25 23:49:54,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1489/ 1625], loss: 1.224, per_step_time: 1471ms, lr: 4.6714163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:54,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43514 samples/s/p 1:23:03 } +2024-07-25 23:49:57,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1491/ 1625], loss: 1.251, per_step_time: 1473ms, lr: 4.667274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:57,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43097 samples/s/p 1:23:04 } +2024-07-25 23:50:00,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1493/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 4.663134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:00,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43863 samples/s/p 1:22:54 } +2024-07-25 23:50:03,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1495/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 4.6589967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:03,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43396 samples/s/p 1:22:56 } +2024-07-25 23:50:06,426 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1497/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 4.6548603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:06,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43532 samples/s/p 1:22:51 } +2024-07-25 23:50:09,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1499/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 4.6507257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:09,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43707 samples/s/p 1:22:47 } +2024-07-25 23:50:12,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1501/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 4.6465934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:12,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43257 samples/s/p 1:22:48 } +2024-07-25 23:50:15,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1503/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 4.6424643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:15,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43417 samples/s/p 1:22:44 } +2024-07-25 23:50:18,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1505/ 1625], loss: 1.027, per_step_time: 1472ms, lr: 4.6383366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:18,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43421 samples/s/p 1:22:41 } +2024-07-25 23:50:21,185 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1507/ 1625], loss: 1.265, per_step_time: 1473ms, lr: 4.634212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:21,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43049 samples/s/p 1:22:41 } +2024-07-25 23:50:24,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1509/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 4.630086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:24,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43643 samples/s/p 1:22:33 } +2024-07-25 23:50:27,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1511/ 1625], loss: 1.060, per_step_time: 1471ms, lr: 4.6259643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:27,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43586 samples/s/p 1:22:30 } +2024-07-25 23:50:30,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1513/ 1625], loss: 1.123, per_step_time: 1482ms, lr: 4.621846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:30,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.39746 samples/s/p 1:23:03 } +2024-07-25 23:50:33,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1515/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 4.617726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:33,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43964 samples/s/p 1:22:21 } +2024-07-25 23:50:35,959 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1517/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 4.6136106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:35,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43048 samples/s/p 1:22:26 } +2024-07-25 23:50:38,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1519/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 4.6094983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:38,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43779 samples/s/p 1:22:17 } +2024-07-25 23:50:41,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1521/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 4.6053838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:41,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.44157 samples/s/p 1:22:10 } +2024-07-25 23:50:44,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1523/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 4.6012765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:44,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43003 samples/s/p 1:22:18 } +2024-07-25 23:50:47,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1525/ 1625], loss: 1.379, per_step_time: 1472ms, lr: 4.5971688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:47,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43235 samples/s/p 1:22:13 } +2024-07-25 23:50:50,713 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1527/ 1625], loss: 1.326, per_step_time: 1472ms, lr: 4.593061e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:50,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43311 samples/s/p 1:22:09 } +2024-07-25 23:50:53,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1529/ 1625], loss: 1.167, per_step_time: 1470ms, lr: 4.588959e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:53,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43901 samples/s/p 1:22:01 } +2024-07-25 23:50:56,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1531/ 1625], loss: 1.281, per_step_time: 1474ms, lr: 4.5848574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:56,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.42434 samples/s/p 1:22:11 } +2024-07-25 23:50:59,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1533/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 4.5807546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:59,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43902 samples/s/p 1:21:55 } +2024-07-25 23:51:02,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1535/ 1625], loss: 1.014, per_step_time: 1471ms, lr: 4.5766587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:02,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43638 samples/s/p 1:21:55 } +2024-07-25 23:51:05,469 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1537/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 4.5725637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:05,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43440 samples/s/p 1:21:53 } +2024-07-25 23:51:08,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1539/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 4.568469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:08,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43696 samples/s/p 1:21:48 } +2024-07-25 23:51:11,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1541/ 1625], loss: 1.297, per_step_time: 1470ms, lr: 4.5643774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:11,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.44017 samples/s/p 1:21:42 } +2024-07-25 23:51:14,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1543/ 1625], loss: 0.955, per_step_time: 1471ms, lr: 4.560288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:14,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43674 samples/s/p 1:21:42 } +2024-07-25 23:51:17,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1545/ 1625], loss: 1.237, per_step_time: 1473ms, lr: 4.5561997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:17,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.42815 samples/s/p 1:21:47 } +2024-07-25 23:51:20,223 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1547/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 4.5521147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:20,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43441 samples/s/p 1:21:39 } +2024-07-25 23:51:23,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1549/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 4.548031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:23,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43757 samples/s/p 1:21:33 } +2024-07-25 23:51:26,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1551/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 4.5439515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:26,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43544 samples/s/p 1:21:32 } +2024-07-25 23:51:29,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1553/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 4.5398697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:29,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43411 samples/s/p 1:21:30 } +2024-07-25 23:51:32,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1555/ 1625], loss: 0.990, per_step_time: 1471ms, lr: 4.535792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:32,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43738 samples/s/p 1:21:24 } +2024-07-25 23:51:34,977 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1557/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 4.531719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:34,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43253 samples/s/p 1:21:26 } +2024-07-25 23:51:37,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1559/ 1625], loss: 1.250, per_step_time: 1469ms, lr: 4.527643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:37,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.44391 samples/s/p 1:21:12 } +2024-07-25 23:51:40,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1561/ 1625], loss: 1.327, per_step_time: 1470ms, lr: 4.523571e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:40,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43882 samples/s/p 1:21:14 } +2024-07-25 23:51:43,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1563/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 4.519503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:43,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43194 samples/s/p 1:21:17 } +2024-07-25 23:51:46,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1565/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 4.5154343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:46,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.42997 samples/s/p 1:21:16 } +2024-07-25 23:51:49,728 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1567/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 4.51137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:49,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43719 samples/s/p 1:21:07 } +2024-07-25 23:51:52,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1569/ 1625], loss: 1.290, per_step_time: 1469ms, lr: 4.5073075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:52,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.44433 samples/s/p 1:20:57 } +2024-07-25 23:51:55,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1571/ 1625], loss: 0.994, per_step_time: 1471ms, lr: 4.503243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:55,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.43833 samples/s/p 1:21:00 } +2024-07-25 23:51:58,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1573/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 4.4991866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:58,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.43460 samples/s/p 1:21:00 } +2024-07-25 23:52:01,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1575/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 4.495129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:01,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.44001 samples/s/p 1:20:52 } +2024-07-25 23:52:04,474 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1577/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 4.491073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:04,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.43558 samples/s/p 1:20:53 } +2024-07-25 23:52:07,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1579/ 1625], loss: 1.230, per_step_time: 1470ms, lr: 4.4870203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:07,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.44064 samples/s/p 1:20:46 } +2024-07-25 23:52:10,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1581/ 1625], loss: 1.312, per_step_time: 1471ms, lr: 4.482969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:10,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.43581 samples/s/p 1:20:47 } +2024-07-25 23:52:13,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1583/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 4.47892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:13,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.42964 samples/s/p 1:20:50 } +2024-07-25 23:52:16,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1585/ 1625], loss: 1.316, per_step_time: 1471ms, lr: 4.474872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:16,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43581 samples/s/p 1:20:41 } +2024-07-25 23:52:19,229 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1587/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 4.4708277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:19,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43318 samples/s/p 1:20:41 } +2024-07-25 23:52:22,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1589/ 1625], loss: 1.270, per_step_time: 1474ms, lr: 4.4667863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:22,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.42569 samples/s/p 1:20:45 } +2024-07-25 23:52:25,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1591/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 4.4627423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:25,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43254 samples/s/p 1:20:36 } +2024-07-25 23:52:28,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1593/ 1625], loss: 1.184, per_step_time: 1473ms, lr: 4.4587036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:28,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43077 samples/s/p 1:20:34 } +2024-07-25 23:52:31,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1595/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 4.454668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:31,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43248 samples/s/p 1:20:30 } +2024-07-25 23:52:33,992 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1597/ 1625], loss: 1.201, per_step_time: 1470ms, lr: 4.4506323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:33,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43860 samples/s/p 1:20:21 } +2024-07-25 23:52:36,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1599/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 4.4465987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:36,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43280 samples/s/p 1:20:24 } +2024-07-25 23:52:39,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1601/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 4.4425697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:39,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43088 samples/s/p 1:20:22 } +2024-07-25 23:52:42,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1603/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 4.4385383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:42,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.42870 samples/s/p 1:20:21 } +2024-07-25 23:52:45,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1605/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 4.4345143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:45,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43442 samples/s/p 1:20:13 } +2024-07-25 23:52:48,751 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1607/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 4.4304898e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:48,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43897 samples/s/p 1:20:06 } +2024-07-25 23:52:51,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1609/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 4.426465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:51,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43522 samples/s/p 1:20:07 } +2024-07-25 23:52:54,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1611/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 4.4224466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:54,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43285 samples/s/p 1:20:06 } +2024-07-25 23:52:57,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1613/ 1625], loss: 1.323, per_step_time: 1471ms, lr: 4.418427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:57,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43735 samples/s/p 1:19:59 } +2024-07-25 23:53:00,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1615/ 1625], loss: 1.067, per_step_time: 1470ms, lr: 4.414409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:00,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43875 samples/s/p 1:19:55 } +2024-07-25 23:53:03,504 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1617/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 4.4103963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:03,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.43215 samples/s/p 1:19:58 } +2024-07-25 23:53:06,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1619/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 4.4063836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:06,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.43813 samples/s/p 1:19:49 } +2024-07-25 23:53:09,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1621/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 4.402373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:09,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.43512 samples/s/p 1:19:49 } +2024-07-25 23:53:12,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1623/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 4.3983646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:12,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.43323 samples/s/p 1:19:48 } +2024-07-25 23:53:15,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1625/ 1625], loss: 1.001, per_step_time: 1471ms, lr: 4.394358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:15,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.43479 samples/s/p 1:19:43 } +2024-07-25 23:53:18,262 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 2/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 4.3903538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:18,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.42754 samples/s/p 1:19:47 } +2024-07-25 23:53:21,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 4/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 4.3863524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:21,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.43262 samples/s/p 1:19:40 } +2024-07-25 23:53:24,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 6/ 1625], loss: 1.149, per_step_time: 1473ms, lr: 4.3823516e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:24,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.42741 samples/s/p 1:19:41 } +2024-07-25 23:53:27,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 8/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 4.3783525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:27,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.43562 samples/s/p 1:19:31 } +2024-07-25 23:53:30,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 10/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 4.374357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:30,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43802 samples/s/p 1:19:26 } +2024-07-25 23:53:33,021 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 12/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 4.3703635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:33,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43424 samples/s/p 1:19:26 } +2024-07-25 23:53:35,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 14/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 4.366374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:35,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43613 samples/s/p 1:19:22 } +2024-07-25 23:53:38,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 16/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 4.362382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:38,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43216 samples/s/p 1:19:22 } +2024-07-25 23:53:41,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 18/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 4.358393e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:41,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43745 samples/s/p 1:19:15 } +2024-07-25 23:53:44,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 20/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 4.35441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:44,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43402 samples/s/p 1:19:15 } +2024-07-25 23:53:47,783 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 22/ 1625], loss: 1.292, per_step_time: 1475ms, lr: 4.350423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:47,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.42301 samples/s/p 1:19:21 } +2024-07-25 23:53:50,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 24/ 1625], loss: 1.074, per_step_time: 1473ms, lr: 4.3464447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:50,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.42895 samples/s/p 1:19:13 } +2024-07-25 23:53:53,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 26/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 4.342464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:53,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43520 samples/s/p 1:19:05 } +2024-07-25 23:53:56,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 28/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 4.338484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:56,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43959 samples/s/p 1:18:58 } +2024-07-25 23:53:59,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 30/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 4.334511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:59,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43729 samples/s/p 1:18:57 } +2024-07-25 23:54:02,533 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 32/ 1625], loss: 1.037, per_step_time: 1469ms, lr: 4.330538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:02,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.44309 samples/s/p 1:18:49 } +2024-07-25 23:54:05,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 34/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 4.326564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:05,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43562 samples/s/p 1:18:53 } +2024-07-25 23:54:08,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 36/ 1625], loss: 1.078, per_step_time: 1473ms, lr: 4.3225964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:08,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.42785 samples/s/p 1:18:57 } +2024-07-25 23:54:11,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 38/ 1625], loss: 1.167, per_step_time: 1474ms, lr: 4.318629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:11,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.42589 samples/s/p 1:18:55 } +2024-07-25 23:54:14,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 40/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 4.3146647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:14,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43600 samples/s/p 1:18:44 } +2024-07-25 23:54:17,294 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 42/ 1625], loss: 1.137, per_step_time: 1470ms, lr: 4.310701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:17,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43849 samples/s/p 1:18:38 } +2024-07-25 23:54:20,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 44/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 4.3067403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:20,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43552 samples/s/p 1:18:38 } +2024-07-25 23:54:23,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 46/ 1625], loss: 1.282, per_step_time: 1474ms, lr: 4.3027812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:23,200 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.42734 samples/s/p 1:18:42 } +2024-07-25 23:54:26,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 48/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 4.2988236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:26,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43568 samples/s/p 1:18:32 } +2024-07-25 23:54:29,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 50/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 4.2948686e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:29,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43173 samples/s/p 1:18:33 } +2024-07-25 23:54:32,051 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 52/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 4.2909155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:32,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.44014 samples/s/p 1:18:22 } +2024-07-25 23:54:34,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 54/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 4.286965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:34,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.44089 samples/s/p 1:18:19 } +2024-07-25 23:54:37,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 56/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 4.283017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:37,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43505 samples/s/p 1:18:21 } +2024-07-25 23:54:40,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 58/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 4.2790707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:40,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43344 samples/s/p 1:18:19 } +2024-07-25 23:54:43,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 60/ 1625], loss: 1.024, per_step_time: 1472ms, lr: 4.2751253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:43,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43343 samples/s/p 1:18:16 } +2024-07-25 23:54:46,802 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 62/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 4.2711836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:46,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43885 samples/s/p 1:18:09 } +2024-07-25 23:54:49,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 64/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 4.267245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:49,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.44037 samples/s/p 1:18:04 } +2024-07-25 23:54:52,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 66/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 4.263304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:52,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43265 samples/s/p 1:18:08 } +2024-07-25 23:54:55,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 68/ 1625], loss: 1.264, per_step_time: 1472ms, lr: 4.2593706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:55,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43144 samples/s/p 1:18:06 } +2024-07-25 23:54:58,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 70/ 1625], loss: 1.109, per_step_time: 1473ms, lr: 4.2554357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:58,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43033 samples/s/p 1:18:04 } +2024-07-25 23:55:01,559 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 72/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 4.2515017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:01,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43375 samples/s/p 1:17:58 } +2024-07-25 23:55:04,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 74/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 4.2475735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:04,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43694 samples/s/p 1:17:53 } +2024-07-25 23:55:07,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 76/ 1625], loss: 1.153, per_step_time: 1470ms, lr: 4.2436454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:07,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43998 samples/s/p 1:17:47 } +2024-07-25 23:55:10,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 78/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 4.2397182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:10,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43860 samples/s/p 1:17:45 } +2024-07-25 23:55:13,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 80/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 4.235796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:13,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43509 samples/s/p 1:17:45 } +2024-07-25 23:55:16,307 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 82/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 4.231874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:16,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43784 samples/s/p 1:17:40 } +2024-07-25 23:55:19,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 84/ 1625], loss: 1.051, per_step_time: 1473ms, lr: 4.2279544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:19,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.42852 samples/s/p 1:17:45 } +2024-07-25 23:55:22,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 86/ 1625], loss: 1.093, per_step_time: 1472ms, lr: 4.2240367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:22,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43316 samples/s/p 1:17:38 } +2024-07-25 23:55:25,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 88/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 4.220122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:25,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43531 samples/s/p 1:17:34 } +2024-07-25 23:55:28,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 90/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 4.2162083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:28,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43163 samples/s/p 1:17:34 } +2024-07-25 23:55:31,084 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 92/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 4.2122965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:31,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43197 samples/s/p 1:17:30 } +2024-07-25 23:55:34,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 94/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 4.2083875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:34,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43486 samples/s/p 1:17:25 } +2024-07-25 23:55:36,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 96/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 4.2044812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:36,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43579 samples/s/p 1:17:21 } +2024-07-25 23:55:39,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 98/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 4.2005754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:39,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43542 samples/s/p 1:17:19 } +2024-07-25 23:55:42,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 100/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 4.1966723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:42,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43807 samples/s/p 1:17:13 } +2024-07-25 23:55:45,837 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 102/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 4.192771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:45,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43374 samples/s/p 1:17:14 } +2024-07-25 23:55:48,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 104/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 4.1888734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:48,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43208 samples/s/p 1:17:13 } +2024-07-25 23:55:51,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 106/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 4.1849753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:51,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43694 samples/s/p 1:17:06 } +2024-07-25 23:55:54,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 108/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 4.181081e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:54,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43327 samples/s/p 1:17:06 } +2024-07-25 23:55:57,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 110/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 4.177189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:57,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43288 samples/s/p 1:17:03 } +2024-07-25 23:56:00,596 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 112/ 1625], loss: 1.520, per_step_time: 1472ms, lr: 4.1733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:00,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43155 samples/s/p 1:17:01 } +2024-07-25 23:56:03,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 114/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 4.1694116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:03,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43515 samples/s/p 1:16:55 } +2024-07-25 23:56:06,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 116/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 4.1655235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:06,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.44039 samples/s/p 1:16:48 } +2024-07-25 23:56:09,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 118/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 4.1616418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:09,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43839 samples/s/p 1:16:47 } +2024-07-25 23:56:12,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 120/ 1625], loss: 1.174, per_step_time: 1473ms, lr: 4.1577587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:12,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43082 samples/s/p 1:16:50 } +2024-07-25 23:56:15,343 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 122/ 1625], loss: 1.139, per_step_time: 1469ms, lr: 4.15388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:15,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.44461 samples/s/p 1:16:36 } +2024-07-25 23:56:18,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 124/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 4.150001e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:18,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.42995 samples/s/p 1:16:45 } +2024-07-25 23:56:21,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 126/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 4.146126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:21,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.43545 samples/s/p 1:16:37 } +2024-07-25 23:56:24,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 128/ 1625], loss: 0.937, per_step_time: 1474ms, lr: 4.1422522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:24,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.42710 samples/s/p 1:16:42 } +2024-07-25 23:56:27,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 130/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 4.13838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:27,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.44055 samples/s/p 1:16:27 } +2024-07-25 23:56:30,101 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 132/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 4.134511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:30,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.43751 samples/s/p 1:16:27 } +2024-07-25 23:56:33,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 134/ 1625], loss: 1.021, per_step_time: 1470ms, lr: 4.1306434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:33,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.44058 samples/s/p 1:16:21 } +2024-07-25 23:56:35,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 136/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 4.126778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:35,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.43635 samples/s/p 1:16:22 } +2024-07-25 23:56:38,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 138/ 1625], loss: 1.129, per_step_time: 1473ms, lr: 4.122915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:38,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.42947 samples/s/p 1:16:25 } +2024-07-25 23:56:41,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 140/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 4.1190533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:41,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43955 samples/s/p 1:16:13 } +2024-07-25 23:56:44,865 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 142/ 1625], loss: 1.094, per_step_time: 1478ms, lr: 4.1151943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:44,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.41186 samples/s/p 1:16:34 } +2024-07-25 23:56:47,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 144/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 4.111337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:47,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43773 samples/s/p 1:16:09 } +2024-07-25 23:56:50,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 146/ 1625], loss: 1.277, per_step_time: 1473ms, lr: 4.1074827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:50,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43019 samples/s/p 1:16:12 } +2024-07-25 23:56:53,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 148/ 1625], loss: 1.280, per_step_time: 1476ms, lr: 4.1036305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:53,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.42002 samples/s/p 1:16:18 } +2024-07-25 23:56:56,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 150/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 4.099782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:56,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43497 samples/s/p 1:16:03 } +2024-07-25 23:56:59,627 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 152/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 4.0959317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:59,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43890 samples/s/p 1:15:56 } +2024-07-25 23:57:02,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 154/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 4.092085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:02,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43057 samples/s/p 1:16:00 } +2024-07-25 23:57:05,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 156/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 4.0882423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:05,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43426 samples/s/p 1:15:54 } +2024-07-25 23:57:08,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 158/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 4.084398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:08,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43946 samples/s/p 1:15:47 } +2024-07-25 23:57:11,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 160/ 1625], loss: 1.077, per_step_time: 1473ms, lr: 4.080558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:11,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43090 samples/s/p 1:15:51 } +2024-07-25 23:57:14,383 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 162/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 4.076722e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:14,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43637 samples/s/p 1:15:44 } +2024-07-25 23:57:17,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 164/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 4.072886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:17,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43374 samples/s/p 1:15:43 } +2024-07-25 23:57:20,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 166/ 1625], loss: 0.903, per_step_time: 1471ms, lr: 4.069052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:20,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43795 samples/s/p 1:15:37 } +2024-07-25 23:57:23,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 168/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 4.0652208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:23,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43640 samples/s/p 1:15:35 } +2024-07-25 23:57:26,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 170/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 4.0613913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:26,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43565 samples/s/p 1:15:33 } +2024-07-25 23:57:29,134 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 172/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 4.0575633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:29,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43638 samples/s/p 1:15:29 } +2024-07-25 23:57:32,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 174/ 1625], loss: 1.329, per_step_time: 1482ms, lr: 4.0537384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:32,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.39594 samples/s/p 1:16:00 } +2024-07-25 23:57:35,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 176/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 4.0499153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:35,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.44168 samples/s/p 1:15:19 } +2024-07-25 23:57:38,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 178/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 4.0460936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:38,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43779 samples/s/p 1:15:19 } +2024-07-25 23:57:40,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 180/ 1625], loss: 0.991, per_step_time: 1471ms, lr: 4.0422756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:40,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43529 samples/s/p 1:15:18 } +2024-07-25 23:57:43,905 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 182/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 4.038459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:43,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43636 samples/s/p 1:15:14 } +2024-07-25 23:57:46,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 184/ 1625], loss: 1.053, per_step_time: 1472ms, lr: 4.034644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:46,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43319 samples/s/p 1:15:14 } +2024-07-25 23:57:49,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 186/ 1625], loss: 1.000, per_step_time: 1472ms, lr: 4.030831e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:49,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43364 samples/s/p 1:15:11 } +2024-07-25 23:57:52,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 188/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 4.027021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:52,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43968 samples/s/p 1:15:03 } +2024-07-25 23:57:55,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 190/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 4.023212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:55,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43503 samples/s/p 1:15:04 } +2024-07-25 23:57:58,665 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 192/ 1625], loss: 1.094, per_step_time: 1475ms, lr: 4.019406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:58,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.42160 samples/s/p 1:15:12 } +2024-07-25 23:58:01,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 194/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 4.015604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:01,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43273 samples/s/p 1:15:00 } +2024-07-25 23:58:04,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 196/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 4.0118007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:04,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43835 samples/s/p 1:14:52 } +2024-07-25 23:58:07,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 198/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 4.0080004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:07,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43629 samples/s/p 1:14:51 } +2024-07-25 23:58:10,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 200/ 1625], loss: 1.201, per_step_time: 1471ms, lr: 4.0042046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:10,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43616 samples/s/p 1:14:48 } +2024-07-25 23:58:13,418 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 202/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 4.000406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:13,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43723 samples/s/p 1:14:44 } +2024-07-25 23:58:16,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 204/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 3.9966126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:16,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43444 samples/s/p 1:14:43 } +2024-07-25 23:58:19,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 206/ 1625], loss: 1.207, per_step_time: 1470ms, lr: 3.9928236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:19,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43987 samples/s/p 1:14:36 } +2024-07-25 23:58:22,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 208/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 3.9890315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:22,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43368 samples/s/p 1:14:38 } +2024-07-25 23:58:25,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 210/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 3.9852466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:25,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43445 samples/s/p 1:14:35 } +2024-07-25 23:58:28,171 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 212/ 1625], loss: 1.047, per_step_time: 1472ms, lr: 3.9814613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:28,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43379 samples/s/p 1:14:32 } +2024-07-25 23:58:31,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 214/ 1625], loss: 1.071, per_step_time: 1470ms, lr: 3.977679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:31,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43899 samples/s/p 1:14:25 } +2024-07-25 23:58:34,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 216/ 1625], loss: 1.060, per_step_time: 1470ms, lr: 3.973899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:34,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43876 samples/s/p 1:14:22 } +2024-07-25 23:58:37,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 218/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 3.9701185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:37,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43266 samples/s/p 1:14:24 } +2024-07-25 23:58:39,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 220/ 1625], loss: 1.015, per_step_time: 1471ms, lr: 3.9663437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:39,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.43510 samples/s/p 1:14:19 } +2024-07-25 23:58:42,923 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 222/ 1625], loss: 1.308, per_step_time: 1471ms, lr: 3.9625684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:42,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.43574 samples/s/p 1:14:16 } +2024-07-25 23:58:45,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 224/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 3.958796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:45,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.43650 samples/s/p 1:14:12 } +2024-07-25 23:58:48,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 226/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 3.955026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:48,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.43954 samples/s/p 1:14:07 } +2024-07-25 23:58:51,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 228/ 1625], loss: 1.006, per_step_time: 1471ms, lr: 3.951258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:51,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.43611 samples/s/p 1:14:07 } +2024-07-25 23:58:54,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 230/ 1625], loss: 1.118, per_step_time: 1469ms, lr: 3.947492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:54,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.44246 samples/s/p 1:13:59 } +2024-07-25 23:58:57,666 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 232/ 1625], loss: 1.048, per_step_time: 1470ms, lr: 3.943728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:57,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.44125 samples/s/p 1:13:57 } +2024-07-25 23:59:00,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 234/ 1625], loss: 1.132, per_step_time: 1469ms, lr: 3.939966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:00,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.44334 samples/s/p 1:13:52 } +2024-07-25 23:59:03,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 236/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 3.936207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:03,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.44085 samples/s/p 1:13:51 } +2024-07-25 23:59:06,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 238/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 3.9324523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:06,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43427 samples/s/p 1:13:54 } +2024-07-25 23:59:09,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 240/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 3.928695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:09,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43393 samples/s/p 1:13:51 } +2024-07-25 23:59:12,414 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 242/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 3.9249417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:12,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43331 samples/s/p 1:13:48 } +2024-07-25 23:59:15,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 244/ 1625], loss: 0.906, per_step_time: 1471ms, lr: 3.9211923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:15,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43807 samples/s/p 1:13:42 } +2024-07-25 23:59:18,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 246/ 1625], loss: 1.091, per_step_time: 1473ms, lr: 3.9174415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:18,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43060 samples/s/p 1:13:45 } +2024-07-25 23:59:21,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 248/ 1625], loss: 1.137, per_step_time: 1482ms, lr: 3.913695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:21,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.39798 samples/s/p 1:14:09 } +2024-07-25 23:59:24,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 250/ 1625], loss: 1.101, per_step_time: 1473ms, lr: 3.9099527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:24,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.42776 samples/s/p 1:13:41 } +2024-07-25 23:59:27,185 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 252/ 1625], loss: 1.115, per_step_time: 1467ms, lr: 3.906208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:27,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.45044 samples/s/p 1:13:20 } +2024-07-25 23:59:30,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 254/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 3.90247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:30,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43633 samples/s/p 1:13:28 } +2024-07-25 23:59:33,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 256/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 3.898732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:33,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43810 samples/s/p 1:13:24 } +2024-07-25 23:59:36,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 258/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 3.894994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:36,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43475 samples/s/p 1:13:24 } +2024-07-25 23:59:38,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 260/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 3.891262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:38,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43918 samples/s/p 1:13:17 } +2024-07-25 23:59:41,934 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 262/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 3.88753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:41,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43676 samples/s/p 1:13:16 } +2024-07-25 23:59:44,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 264/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 3.8838007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:44,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43458 samples/s/p 1:13:15 } +2024-07-25 23:59:47,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 266/ 1625], loss: 0.961, per_step_time: 1471ms, lr: 3.880073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:47,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43780 samples/s/p 1:13:10 } +2024-07-25 23:59:50,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 268/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 3.8763483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:50,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43199 samples/s/p 1:13:11 } +2024-07-25 23:59:53,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 270/ 1625], loss: 0.994, per_step_time: 1471ms, lr: 3.872625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:53,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43756 samples/s/p 1:13:04 } +2024-07-25 23:59:56,690 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 272/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 3.868904e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:56,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43076 samples/s/p 1:13:06 } +2024-07-25 23:59:59,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 274/ 1625], loss: 1.012, per_step_time: 1472ms, lr: 3.865185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:59,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43450 samples/s/p 1:13:00 } +2024-07-26 00:00:02,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 276/ 1625], loss: 1.265, per_step_time: 1473ms, lr: 3.861469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:02,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43052 samples/s/p 1:13:01 } +2024-07-26 00:00:05,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 278/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 3.8577537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:05,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.44111 samples/s/p 1:12:49 } +2024-07-26 00:00:08,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 280/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 3.8540416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:08,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43699 samples/s/p 1:12:50 } +2024-07-26 00:00:11,441 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 282/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 3.8503335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:11,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43877 samples/s/p 1:12:45 } +2024-07-26 00:00:14,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 284/ 1625], loss: 1.117, per_step_time: 1473ms, lr: 3.8466233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:14,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.42999 samples/s/p 1:12:49 } +2024-07-26 00:00:17,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 286/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 3.8429175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:17,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43326 samples/s/p 1:12:44 } +2024-07-26 00:00:20,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 288/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 3.839216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:20,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43079 samples/s/p 1:12:43 } +2024-07-26 00:00:23,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 290/ 1625], loss: 0.970, per_step_time: 1473ms, lr: 3.8355124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:23,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43014 samples/s/p 1:12:40 } +2024-07-26 00:00:26,201 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 292/ 1625], loss: 1.233, per_step_time: 1469ms, lr: 3.8318144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:26,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.44274 samples/s/p 1:12:27 } +2024-07-26 00:00:29,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 294/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 3.828117e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:29,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43114 samples/s/p 1:12:34 } +2024-07-26 00:00:32,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 296/ 1625], loss: 1.280, per_step_time: 1472ms, lr: 3.8244198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:32,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43157 samples/s/p 1:12:30 } +2024-07-26 00:00:35,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 298/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 3.820728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:35,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43722 samples/s/p 1:12:23 } +2024-07-26 00:00:38,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 300/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 3.817038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:38,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43444 samples/s/p 1:12:22 } +2024-07-26 00:00:40,958 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 302/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 3.8133467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:40,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43596 samples/s/p 1:12:18 } +2024-07-26 00:00:43,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 304/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 3.8096632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:43,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43302 samples/s/p 1:12:17 } +2024-07-26 00:00:46,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 306/ 1625], loss: 1.247, per_step_time: 1475ms, lr: 3.8059788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:46,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.42199 samples/s/p 1:12:23 } +2024-07-26 00:00:49,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 308/ 1625], loss: 1.176, per_step_time: 1472ms, lr: 3.802295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:49,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43462 samples/s/p 1:12:10 } +2024-07-26 00:00:52,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 310/ 1625], loss: 1.249, per_step_time: 1471ms, lr: 3.798616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:52,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43495 samples/s/p 1:12:07 } +2024-07-26 00:00:55,729 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 312/ 1625], loss: 1.136, per_step_time: 1475ms, lr: 3.7949385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:55,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.42193 samples/s/p 1:12:14 } +2024-07-26 00:00:58,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 314/ 1625], loss: 1.327, per_step_time: 1473ms, lr: 3.7912619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:58,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43051 samples/s/p 1:12:05 } +2024-07-26 00:01:01,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 316/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 3.7875889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:01,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43478 samples/s/p 1:11:58 } +2024-07-26 00:01:04,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 318/ 1625], loss: 1.219, per_step_time: 1473ms, lr: 3.7839172e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:04,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.43103 samples/s/p 1:11:58 } +2024-07-26 00:01:07,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 320/ 1625], loss: 1.129, per_step_time: 1470ms, lr: 3.7802492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:07,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.44031 samples/s/p 1:11:48 } +2024-07-26 00:01:10,483 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 322/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 3.7765808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:10,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.43955 samples/s/p 1:11:46 } +2024-07-26 00:01:13,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 324/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 3.772916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:13,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.43535 samples/s/p 1:11:46 } +2024-07-26 00:01:16,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 326/ 1625], loss: 1.304, per_step_time: 1470ms, lr: 3.7692557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:16,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.44030 samples/s/p 1:11:39 } +2024-07-26 00:01:19,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 328/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 3.7655932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:19,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.43471 samples/s/p 1:11:41 } +2024-07-26 00:01:22,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 330/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 3.7619338e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:22,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.44033 samples/s/p 1:11:33 } +2024-07-26 00:01:25,233 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 332/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 3.75828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:25,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.43202 samples/s/p 1:11:37 } +2024-07-26 00:01:28,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 334/ 1625], loss: 1.120, per_step_time: 1470ms, lr: 3.7546238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:28,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.44098 samples/s/p 1:11:27 } +2024-07-26 00:01:31,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 336/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 3.750974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:31,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.44020 samples/s/p 1:11:25 } +2024-07-26 00:01:34,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 338/ 1625], loss: 1.289, per_step_time: 1472ms, lr: 3.7473242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:34,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43437 samples/s/p 1:11:26 } +2024-07-26 00:01:37,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 340/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 3.7436744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:37,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43452 samples/s/p 1:11:23 } +2024-07-26 00:01:39,982 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 342/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 3.740031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:39,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43546 samples/s/p 1:11:20 } +2024-07-26 00:01:42,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 344/ 1625], loss: 1.247, per_step_time: 1473ms, lr: 3.736388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:42,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43041 samples/s/p 1:11:21 } +2024-07-26 00:01:45,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 346/ 1625], loss: 0.863, per_step_time: 1471ms, lr: 3.732745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:45,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43567 samples/s/p 1:11:13 } +2024-07-26 00:01:48,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 348/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 3.7291084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:48,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43724 samples/s/p 1:11:09 } +2024-07-26 00:01:51,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 350/ 1625], loss: 1.044, per_step_time: 1473ms, lr: 3.7254713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:51,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.43008 samples/s/p 1:11:12 } +2024-07-26 00:01:54,740 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 352/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 3.721836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:54,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.43621 samples/s/p 1:11:04 } +2024-07-26 00:01:57,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 354/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 3.7182035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:57,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.43156 samples/s/p 1:11:05 } +2024-07-26 00:02:00,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 356/ 1625], loss: 1.363, per_step_time: 1475ms, lr: 3.7145737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:00,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.42264 samples/s/p 1:11:09 } +2024-07-26 00:02:03,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 358/ 1625], loss: 1.143, per_step_time: 1474ms, lr: 3.7109462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:03,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.42684 samples/s/p 1:11:03 } +2024-07-26 00:02:06,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 360/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 3.70732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:06,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.43851 samples/s/p 1:10:51 } +2024-07-26 00:02:09,505 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 362/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 3.7036962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:09,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.43612 samples/s/p 1:10:50 } +2024-07-26 00:02:12,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 364/ 1625], loss: 1.313, per_step_time: 1474ms, lr: 3.7000773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:12,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.42466 samples/s/p 1:10:56 } +2024-07-26 00:02:15,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 366/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 3.6964552e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:15,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.43712 samples/s/p 1:10:43 } +2024-07-26 00:02:18,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 368/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 3.6928382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:18,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.43373 samples/s/p 1:10:43 } +2024-07-26 00:02:21,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 370/ 1625], loss: 1.399, per_step_time: 1473ms, lr: 3.6892257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:21,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.42744 samples/s/p 1:10:45 } +2024-07-26 00:02:24,272 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 372/ 1625], loss: 1.125, per_step_time: 1473ms, lr: 3.6856104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:24,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.42829 samples/s/p 1:10:41 } +2024-07-26 00:02:27,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 374/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 3.6819997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:27,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.43589 samples/s/p 1:10:32 } +2024-07-26 00:02:30,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 376/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 3.678394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:30,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.43150 samples/s/p 1:10:33 } +2024-07-26 00:02:33,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 378/ 1625], loss: 1.106, per_step_time: 1473ms, lr: 3.6747856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:33,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.42860 samples/s/p 1:10:32 } +2024-07-26 00:02:36,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 380/ 1625], loss: 1.104, per_step_time: 1474ms, lr: 3.671183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:36,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.42612 samples/s/p 1:10:31 } +2024-07-26 00:02:39,038 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 382/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 3.667582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:39,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43333 samples/s/p 1:10:22 } +2024-07-26 00:02:41,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 384/ 1625], loss: 1.105, per_step_time: 1474ms, lr: 3.6639794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:41,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.42444 samples/s/p 1:10:26 } +2024-07-26 00:02:44,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 386/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 3.6603833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:44,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43357 samples/s/p 1:10:16 } +2024-07-26 00:02:47,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 388/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 3.656788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:47,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43323 samples/s/p 1:10:14 } +2024-07-26 00:02:50,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 390/ 1625], loss: 1.160, per_step_time: 1473ms, lr: 3.6531942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:50,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43050 samples/s/p 1:10:13 } +2024-07-26 00:02:53,801 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 392/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 3.6496049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:53,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43702 samples/s/p 1:10:05 } +2024-07-26 00:02:56,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 394/ 1625], loss: 0.928, per_step_time: 1473ms, lr: 3.6460156e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:56,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.42821 samples/s/p 1:10:09 } +2024-07-26 00:02:59,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 396/ 1625], loss: 1.022, per_step_time: 1472ms, lr: 3.642429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:59,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43470 samples/s/p 1:10:01 } +2024-07-26 00:03:02,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 398/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 3.638845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:02,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43716 samples/s/p 1:09:56 } +2024-07-26 00:03:05,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 400/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 3.6352626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:05,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43714 samples/s/p 1:09:53 } +2024-07-26 00:03:08,559 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 402/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 3.6316828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:08,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43238 samples/s/p 1:09:54 } +2024-07-26 00:03:11,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 404/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 3.6281049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:11,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43427 samples/s/p 1:09:49 } +2024-07-26 00:03:14,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 406/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 3.6245292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:14,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43129 samples/s/p 1:09:49 } +2024-07-26 00:03:17,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 408/ 1625], loss: 1.059, per_step_time: 1473ms, lr: 3.6209553e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:17,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43094 samples/s/p 1:09:46 } +2024-07-26 00:03:20,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 410/ 1625], loss: 1.160, per_step_time: 1473ms, lr: 3.6173842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:20,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.42897 samples/s/p 1:09:44 } +2024-07-26 00:03:23,323 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 412/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 3.613815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:23,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43200 samples/s/p 1:09:39 } +2024-07-26 00:03:26,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 414/ 1625], loss: 1.053, per_step_time: 1472ms, lr: 3.6102506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:26,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43270 samples/s/p 1:09:36 } +2024-07-26 00:03:29,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 416/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 3.606684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:29,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43250 samples/s/p 1:09:33 } +2024-07-26 00:03:32,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 418/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 3.6031215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:32,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43252 samples/s/p 1:09:30 } +2024-07-26 00:03:35,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 420/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 3.5995631e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:35,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43427 samples/s/p 1:09:26 } +2024-07-26 00:03:38,083 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 422/ 1625], loss: 1.059, per_step_time: 1471ms, lr: 3.5960024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:38,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43609 samples/s/p 1:09:21 } +2024-07-26 00:03:41,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 424/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 3.5924495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:41,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43374 samples/s/p 1:09:20 } +2024-07-26 00:03:43,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 426/ 1625], loss: 1.199, per_step_time: 1473ms, lr: 3.5888947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:43,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43090 samples/s/p 1:09:19 } +2024-07-26 00:03:46,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 428/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 3.5853418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:46,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43718 samples/s/p 1:09:12 } +2024-07-26 00:03:49,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 430/ 1625], loss: 1.095, per_step_time: 1473ms, lr: 3.5817948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:49,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43054 samples/s/p 1:09:14 } +2024-07-26 00:03:52,841 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 432/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 3.5782468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:52,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43815 samples/s/p 1:09:05 } +2024-07-26 00:03:55,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 434/ 1625], loss: 1.134, per_step_time: 1473ms, lr: 3.5747025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:55,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43009 samples/s/p 1:09:08 } +2024-07-26 00:03:58,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 436/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 3.57116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:58,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43411 samples/s/p 1:09:02 } +2024-07-26 00:04:01,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 438/ 1625], loss: 1.138, per_step_time: 1474ms, lr: 3.567619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:01,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.42606 samples/s/p 1:09:05 } +2024-07-26 00:04:04,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 440/ 1625], loss: 0.942, per_step_time: 1471ms, lr: 3.5640805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:04,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43826 samples/s/p 1:08:53 } +2024-07-26 00:04:07,604 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 442/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 3.5605449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:07,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43123 samples/s/p 1:08:56 } +2024-07-26 00:04:10,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 444/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 3.557011e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:10,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43398 samples/s/p 1:08:51 } +2024-07-26 00:04:13,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 446/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 3.5534795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:13,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43160 samples/s/p 1:08:49 } +2024-07-26 00:04:16,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 448/ 1625], loss: 1.162, per_step_time: 1485ms, lr: 3.5499497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:16,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.38446 samples/s/p 1:09:23 } +2024-07-26 00:04:19,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 450/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 3.5464218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:19,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43563 samples/s/p 1:08:40 } +2024-07-26 00:04:22,389 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 452/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 3.5428975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:22,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43476 samples/s/p 1:08:38 } +2024-07-26 00:04:25,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 454/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 3.5393746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:25,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43656 samples/s/p 1:08:34 } +2024-07-26 00:04:28,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 456/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 3.5358544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:28,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43681 samples/s/p 1:08:31 } +2024-07-26 00:04:31,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 458/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 3.532336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:31,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43437 samples/s/p 1:08:30 } +2024-07-26 00:04:34,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 460/ 1625], loss: 1.344, per_step_time: 1476ms, lr: 3.5288194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:34,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.41840 samples/s/p 1:08:39 } +2024-07-26 00:04:37,152 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 462/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 3.525307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:37,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43356 samples/s/p 1:08:24 } +2024-07-26 00:04:40,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 464/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 3.5217954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:40,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43304 samples/s/p 1:08:22 } +2024-07-26 00:04:43,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 466/ 1625], loss: 1.228, per_step_time: 1474ms, lr: 3.5182838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:43,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.42385 samples/s/p 1:08:26 } +2024-07-26 00:04:46,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 468/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 3.5147787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:46,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43818 samples/s/p 1:08:12 } +2024-07-26 00:04:48,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 470/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 3.511273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:48,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43867 samples/s/p 1:08:09 } +2024-07-26 00:04:51,906 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 472/ 1625], loss: 1.018, per_step_time: 1469ms, lr: 3.5077683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:51,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.44277 samples/s/p 1:08:03 } +2024-07-26 00:04:54,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 474/ 1625], loss: 1.285, per_step_time: 1469ms, lr: 3.50427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:54,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.44390 samples/s/p 1:07:59 } +2024-07-26 00:04:57,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 476/ 1625], loss: 1.278, per_step_time: 1470ms, lr: 3.5007715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:57,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43964 samples/s/p 1:07:59 } +2024-07-26 00:05:00,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 478/ 1625], loss: 1.040, per_step_time: 1473ms, lr: 3.4972754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:00,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.42975 samples/s/p 1:08:04 } +2024-07-26 00:05:03,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 480/ 1625], loss: 0.944, per_step_time: 1471ms, lr: 3.4937802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:03,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43555 samples/s/p 1:07:56 } +2024-07-26 00:05:06,654 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 482/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 3.4902887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:06,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43979 samples/s/p 1:07:50 } +2024-07-26 00:05:09,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 484/ 1625], loss: 1.196, per_step_time: 1470ms, lr: 3.4867994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:09,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43993 samples/s/p 1:07:47 } +2024-07-26 00:05:12,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 486/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 3.4833124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:12,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43566 samples/s/p 1:07:47 } +2024-07-26 00:05:15,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 488/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 3.4798268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:15,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43326 samples/s/p 1:07:46 } +2024-07-26 00:05:18,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 490/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 3.4763439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:18,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43499 samples/s/p 1:07:42 } +2024-07-26 00:05:21,411 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 492/ 1625], loss: 1.010, per_step_time: 1473ms, lr: 3.4728632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:21,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43028 samples/s/p 1:07:43 } +2024-07-26 00:05:24,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 494/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 3.4693844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:24,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43729 samples/s/p 1:07:34 } +2024-07-26 00:05:27,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 496/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 3.4659074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:27,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43470 samples/s/p 1:07:33 } +2024-07-26 00:05:30,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 498/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 3.4624331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:30,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43152 samples/s/p 1:07:33 } +2024-07-26 00:05:33,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 500/ 1625], loss: 1.072, per_step_time: 1470ms, lr: 3.4589616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:33,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.44056 samples/s/p 1:07:23 } +2024-07-26 00:05:36,166 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 502/ 1625], loss: 1.184, per_step_time: 1473ms, lr: 3.4554914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:36,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43061 samples/s/p 1:07:28 } +2024-07-26 00:05:39,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 504/ 1625], loss: 1.095, per_step_time: 1474ms, lr: 3.452024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:39,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.42664 samples/s/p 1:07:28 } +2024-07-26 00:05:42,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 506/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 3.448562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:42,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43607 samples/s/p 1:07:18 } +2024-07-26 00:05:45,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 508/ 1625], loss: 1.050, per_step_time: 1473ms, lr: 3.4450968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:45,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.42876 samples/s/p 1:07:20 } +2024-07-26 00:05:47,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 510/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 3.4416348e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:47,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43218 samples/s/p 1:07:15 } +2024-07-26 00:05:50,934 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 512/ 1625], loss: 1.109, per_step_time: 1473ms, lr: 3.4381792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:50,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.42960 samples/s/p 1:07:14 } +2024-07-26 00:05:53,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 514/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 3.4347222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:53,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43424 samples/s/p 1:07:07 } +2024-07-26 00:05:56,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 516/ 1625], loss: 1.178, per_step_time: 1474ms, lr: 3.431267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:56,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.42489 samples/s/p 1:07:11 } +2024-07-26 00:05:59,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 518/ 1625], loss: 1.259, per_step_time: 1473ms, lr: 3.4278169e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:59,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.42809 samples/s/p 1:07:06 } +2024-07-26 00:06:02,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 520/ 1625], loss: 1.023, per_step_time: 1472ms, lr: 3.4243667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:02,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43393 samples/s/p 1:06:59 } +2024-07-26 00:06:05,698 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 522/ 1625], loss: 1.001, per_step_time: 1471ms, lr: 3.4209197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:05,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43516 samples/s/p 1:06:55 } +2024-07-26 00:06:08,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 524/ 1625], loss: 0.867, per_step_time: 1471ms, lr: 3.417474e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:08,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43555 samples/s/p 1:06:52 } +2024-07-26 00:06:11,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 526/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 3.4140307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:11,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43777 samples/s/p 1:06:47 } +2024-07-26 00:06:14,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 528/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 3.4105901e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:14,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43640 samples/s/p 1:06:45 } +2024-07-26 00:06:17,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 530/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 3.4071522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:17,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43658 samples/s/p 1:06:42 } +2024-07-26 00:06:20,449 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 532/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 3.4037148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:20,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43576 samples/s/p 1:06:40 } +2024-07-26 00:06:23,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 534/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 3.400282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:23,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43752 samples/s/p 1:06:35 } +2024-07-26 00:06:26,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 536/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 3.39685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:26,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43501 samples/s/p 1:06:34 } +2024-07-26 00:06:29,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 538/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 3.3934198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:29,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43790 samples/s/p 1:06:29 } +2024-07-26 00:06:32,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 540/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 3.3899928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:32,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43633 samples/s/p 1:06:27 } +2024-07-26 00:06:35,196 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 542/ 1625], loss: 1.121, per_step_time: 1469ms, lr: 3.386568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:35,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.44233 samples/s/p 1:06:20 } +2024-07-26 00:06:38,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 544/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 3.3831452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:38,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43593 samples/s/p 1:06:22 } +2024-07-26 00:06:41,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 546/ 1625], loss: 1.099, per_step_time: 1473ms, lr: 3.3797246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:41,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43086 samples/s/p 1:06:23 } +2024-07-26 00:06:44,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 548/ 1625], loss: 1.089, per_step_time: 1468ms, lr: 3.3763054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:44,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.44629 samples/s/p 1:06:08 } +2024-07-26 00:06:46,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 550/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 3.3728916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:46,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43338 samples/s/p 1:06:15 } +2024-07-26 00:06:49,948 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 552/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 3.369476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:49,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43235 samples/s/p 1:06:13 } +2024-07-26 00:06:52,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 554/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 3.366064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:52,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43762 samples/s/p 1:06:06 } +2024-07-26 00:06:55,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 556/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 3.3626561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:55,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43416 samples/s/p 1:06:06 } +2024-07-26 00:06:58,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 558/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 3.3592482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:58,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43209 samples/s/p 1:06:04 } +2024-07-26 00:07:01,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 560/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 3.3558422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:01,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43850 samples/s/p 1:05:56 } +2024-07-26 00:07:04,702 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 562/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 3.3524425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:04,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43373 samples/s/p 1:05:57 } +2024-07-26 00:07:07,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 564/ 1625], loss: 1.248, per_step_time: 1473ms, lr: 3.3490414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:07,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43087 samples/s/p 1:05:56 } +2024-07-26 00:07:10,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 566/ 1625], loss: 1.083, per_step_time: 1473ms, lr: 3.345643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:10,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.42866 samples/s/p 1:05:55 } +2024-07-26 00:07:13,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 568/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 3.3422466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:13,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43551 samples/s/p 1:05:47 } +2024-07-26 00:07:16,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 570/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 3.3388533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:16,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.44055 samples/s/p 1:05:40 } +2024-07-26 00:07:19,461 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 572/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 3.3354622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:19,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43372 samples/s/p 1:05:42 } +2024-07-26 00:07:22,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 574/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 3.3320725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:22,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43411 samples/s/p 1:05:39 } +2024-07-26 00:07:25,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 576/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 3.3286851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:25,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43164 samples/s/p 1:05:38 } +2024-07-26 00:07:28,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 578/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 3.325301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:28,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43727 samples/s/p 1:05:31 } +2024-07-26 00:07:31,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 580/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 3.321918e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:31,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43324 samples/s/p 1:05:31 } +2024-07-26 00:07:34,221 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 582/ 1625], loss: 1.174, per_step_time: 1473ms, lr: 3.318538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:34,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.42967 samples/s/p 1:05:30 } +2024-07-26 00:07:37,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 584/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 3.3151605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:37,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43150 samples/s/p 1:05:26 } +2024-07-26 00:07:40,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 586/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 3.3117835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:40,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43393 samples/s/p 1:05:22 } +2024-07-26 00:07:43,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 588/ 1625], loss: 1.052, per_step_time: 1471ms, lr: 3.3084107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:43,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43724 samples/s/p 1:05:16 } +2024-07-26 00:07:46,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 590/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 3.3050396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:46,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43125 samples/s/p 1:05:18 } +2024-07-26 00:07:48,977 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 592/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 3.3016709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:48,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43984 samples/s/p 1:05:08 } +2024-07-26 00:07:51,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 594/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 3.2983044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:51,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43450 samples/s/p 1:05:09 } +2024-07-26 00:07:54,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 596/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 3.2949383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:54,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43040 samples/s/p 1:05:09 } +2024-07-26 00:07:57,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 598/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 3.2915755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:57,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43526 samples/s/p 1:05:03 } +2024-07-26 00:08:00,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 600/ 1625], loss: 1.328, per_step_time: 1472ms, lr: 3.2882176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:00,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43226 samples/s/p 1:05:02 } +2024-07-26 00:08:03,732 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 602/ 1625], loss: 1.340, per_step_time: 1470ms, lr: 3.2848575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:03,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.44144 samples/s/p 1:04:53 } +2024-07-26 00:08:06,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 604/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 3.281505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:06,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43675 samples/s/p 1:04:53 } +2024-07-26 00:08:09,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 606/ 1625], loss: 1.069, per_step_time: 1473ms, lr: 3.2781509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:09,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.42784 samples/s/p 1:04:56 } +2024-07-26 00:08:12,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 608/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 3.274798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:12,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43273 samples/s/p 1:04:50 } +2024-07-26 00:08:15,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 610/ 1625], loss: 1.189, per_step_time: 1470ms, lr: 3.271452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:15,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43879 samples/s/p 1:04:43 } +2024-07-26 00:08:18,488 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 612/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 3.2681055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:18,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43690 samples/s/p 1:04:41 } +2024-07-26 00:08:21,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 614/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 3.2647613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:21,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43577 samples/s/p 1:04:39 } +2024-07-26 00:08:24,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 616/ 1625], loss: 1.279, per_step_time: 1473ms, lr: 3.2614184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:24,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43051 samples/s/p 1:04:40 } +2024-07-26 00:08:27,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 618/ 1625], loss: 1.291, per_step_time: 1470ms, lr: 3.2580788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:27,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43877 samples/s/p 1:04:31 } +2024-07-26 00:08:30,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 620/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 3.2547418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:30,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43780 samples/s/p 1:04:29 } +2024-07-26 00:08:33,240 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 622/ 1625], loss: 1.304, per_step_time: 1471ms, lr: 3.2514067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:33,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43750 samples/s/p 1:04:26 } +2024-07-26 00:08:36,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 624/ 1625], loss: 1.032, per_step_time: 1471ms, lr: 3.2480734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:36,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43768 samples/s/p 1:04:23 } +2024-07-26 00:08:39,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 626/ 1625], loss: 1.105, per_step_time: 1470ms, lr: 3.2447433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:39,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.44187 samples/s/p 1:04:17 } +2024-07-26 00:08:42,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 628/ 1625], loss: 1.020, per_step_time: 1470ms, lr: 3.241415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:42,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.43891 samples/s/p 1:04:16 } +2024-07-26 00:08:45,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 630/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 3.2380885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:45,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.43525 samples/s/p 1:04:16 } +2024-07-26 00:08:47,990 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 632/ 1625], loss: 1.199, per_step_time: 1473ms, lr: 3.2347662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:47,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.42981 samples/s/p 1:04:17 } +2024-07-26 00:08:50,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 634/ 1625], loss: 1.274, per_step_time: 1473ms, lr: 3.2314433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:50,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.42952 samples/s/p 1:04:14 } +2024-07-26 00:08:53,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 636/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 3.2281246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:53,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.43490 samples/s/p 1:04:07 } +2024-07-26 00:08:56,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 638/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 3.224808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:56,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.43610 samples/s/p 1:04:03 } +2024-07-26 00:08:59,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 640/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 3.221492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:59,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.42939 samples/s/p 1:04:05 } +2024-07-26 00:09:02,754 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 642/ 1625], loss: 1.075, per_step_time: 1473ms, lr: 3.2181792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:02,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.42838 samples/s/p 1:04:03 } +2024-07-26 00:09:05,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 644/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 3.214871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:05,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.43514 samples/s/p 1:03:55 } +2024-07-26 00:09:08,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 646/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 3.2115609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:08,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.43458 samples/s/p 1:03:53 } +2024-07-26 00:09:11,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 648/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 3.2082567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:11,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.43784 samples/s/p 1:03:47 } +2024-07-26 00:09:14,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 650/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 3.2049534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:14,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.43610 samples/s/p 1:03:46 } +2024-07-26 00:09:17,503 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 652/ 1625], loss: 1.200, per_step_time: 1469ms, lr: 3.20165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:17,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.44276 samples/s/p 1:03:38 } +2024-07-26 00:09:20,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 654/ 1625], loss: 1.020, per_step_time: 1471ms, lr: 3.1983536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:20,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.43774 samples/s/p 1:03:39 } +2024-07-26 00:09:23,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 656/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 3.1950567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:23,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.43205 samples/s/p 1:03:40 } +2024-07-26 00:09:26,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 658/ 1625], loss: 1.274, per_step_time: 1471ms, lr: 3.1917602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:26,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.43490 samples/s/p 1:03:35 } +2024-07-26 00:09:29,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 660/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 3.1884701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:29,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43534 samples/s/p 1:03:32 } +2024-07-26 00:09:32,257 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 662/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 3.1851805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:32,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43734 samples/s/p 1:03:27 } +2024-07-26 00:09:35,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 664/ 1625], loss: 0.933, per_step_time: 1478ms, lr: 3.1818931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:35,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.41028 samples/s/p 1:03:43 } +2024-07-26 00:09:38,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 666/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 3.1786071e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:38,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43323 samples/s/p 1:03:24 } +2024-07-26 00:09:41,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 668/ 1625], loss: 1.047, per_step_time: 1473ms, lr: 3.1753243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:41,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43027 samples/s/p 1:03:23 } +2024-07-26 00:09:44,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 670/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 3.1720447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:44,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43175 samples/s/p 1:03:19 } +2024-07-26 00:09:47,037 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 672/ 1625], loss: 1.009, per_step_time: 1475ms, lr: 3.1687646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:47,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.42177 samples/s/p 1:03:23 } +2024-07-26 00:09:49,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 674/ 1625], loss: 1.014, per_step_time: 1472ms, lr: 3.1654881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:49,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43315 samples/s/p 1:03:13 } +2024-07-26 00:09:52,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 676/ 1625], loss: 1.079, per_step_time: 1473ms, lr: 3.1622171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:52,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43021 samples/s/p 1:03:12 } +2024-07-26 00:09:55,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 678/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 3.1589434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:55,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43979 samples/s/p 1:03:02 } +2024-07-26 00:09:58,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 680/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 3.1556738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:58,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43747 samples/s/p 1:03:01 } +2024-07-26 00:10:01,793 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 682/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 3.1524087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:01,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43273 samples/s/p 1:03:01 } +2024-07-26 00:10:04,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 684/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 3.1491418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:04,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43553 samples/s/p 1:02:56 } +2024-07-26 00:10:07,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 686/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 3.1458799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:07,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43644 samples/s/p 1:02:53 } +2024-07-26 00:10:10,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 688/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 3.1426216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:10,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43411 samples/s/p 1:02:51 } +2024-07-26 00:10:13,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 690/ 1625], loss: 1.115, per_step_time: 1469ms, lr: 3.1393615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:13,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.44292 samples/s/p 1:02:42 } +2024-07-26 00:10:16,542 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 692/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 3.1361074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:16,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43625 samples/s/p 1:02:44 } +2024-07-26 00:10:19,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 694/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 3.1328536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:19,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43894 samples/s/p 1:02:39 } +2024-07-26 00:10:22,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 696/ 1625], loss: 1.155, per_step_time: 1473ms, lr: 3.1296004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:22,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.42946 samples/s/p 1:02:43 } +2024-07-26 00:10:25,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 698/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 3.1263544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:25,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43507 samples/s/p 1:02:36 } +2024-07-26 00:10:28,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 700/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 3.123107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:28,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43660 samples/s/p 1:02:32 } +2024-07-26 00:10:31,297 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 702/ 1625], loss: 1.047, per_step_time: 1471ms, lr: 3.119862e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:31,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43482 samples/s/p 1:02:30 } +2024-07-26 00:10:34,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 704/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 3.116621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:34,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43300 samples/s/p 1:02:28 } +2024-07-26 00:10:37,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 706/ 1625], loss: 1.163, per_step_time: 1473ms, lr: 3.1133818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:37,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43068 samples/s/p 1:02:27 } +2024-07-26 00:10:40,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 708/ 1625], loss: 1.261, per_step_time: 1470ms, lr: 3.110144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:40,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43968 samples/s/p 1:02:18 } +2024-07-26 00:10:43,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 710/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 3.106909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:43,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43998 samples/s/p 1:02:15 } +2024-07-26 00:10:46,050 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 712/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 3.1036766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:46,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43316 samples/s/p 1:02:17 } +2024-07-26 00:10:49,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 714/ 1625], loss: 1.361, per_step_time: 1472ms, lr: 3.100446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:49,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43161 samples/s/p 1:02:15 } +2024-07-26 00:10:51,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 716/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 3.0972174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:51,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43245 samples/s/p 1:02:11 } +2024-07-26 00:10:54,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 718/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 3.093991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:54,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43535 samples/s/p 1:02:06 } +2024-07-26 00:10:57,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 720/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 3.090769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:57,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43606 samples/s/p 1:02:03 } +2024-07-26 00:11:00,812 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 722/ 1625], loss: 1.131, per_step_time: 1474ms, lr: 3.0875462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:00,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.42491 samples/s/p 1:02:07 } +2024-07-26 00:11:03,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 724/ 1625], loss: 1.065, per_step_time: 1472ms, lr: 3.0843275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:03,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43455 samples/s/p 1:01:58 } +2024-07-26 00:11:06,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 726/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 3.0811125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:06,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43691 samples/s/p 1:01:53 } +2024-07-26 00:11:09,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 728/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 3.0778956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:09,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43232 samples/s/p 1:01:54 } +2024-07-26 00:11:12,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 730/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 3.0746833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:12,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43624 samples/s/p 1:01:48 } +2024-07-26 00:11:15,572 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 732/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 3.071475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:15,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.42817 samples/s/p 1:01:51 } +2024-07-26 00:11:18,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 734/ 1625], loss: 1.249, per_step_time: 1474ms, lr: 3.0682659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:18,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.42568 samples/s/p 1:01:49 } +2024-07-26 00:11:21,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 736/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 3.0650622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:21,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43020 samples/s/p 1:01:43 } +2024-07-26 00:11:24,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 738/ 1625], loss: 1.250, per_step_time: 1471ms, lr: 3.0618598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:24,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43565 samples/s/p 1:01:37 } +2024-07-26 00:11:27,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 740/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 3.058657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:27,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43740 samples/s/p 1:01:32 } +2024-07-26 00:11:30,333 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 742/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 3.0554602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:30,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43555 samples/s/p 1:01:31 } +2024-07-26 00:11:33,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 744/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 3.0522642e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:33,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43554 samples/s/p 1:01:28 } +2024-07-26 00:11:36,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 746/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 3.0490683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:36,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.42860 samples/s/p 1:01:30 } +2024-07-26 00:11:39,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 748/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 3.045879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:39,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43442 samples/s/p 1:01:23 } +2024-07-26 00:11:42,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 750/ 1625], loss: 1.126, per_step_time: 1473ms, lr: 3.042689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:42,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.42957 samples/s/p 1:01:23 } +2024-07-26 00:11:45,092 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 752/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 3.0395022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:45,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43830 samples/s/p 1:01:14 } +2024-07-26 00:11:48,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 754/ 1625], loss: 1.324, per_step_time: 1471ms, lr: 3.0363185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:48,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43503 samples/s/p 1:01:13 } +2024-07-26 00:11:50,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 756/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 3.0331362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:50,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.44209 samples/s/p 1:01:06 } +2024-07-26 00:11:53,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 758/ 1625], loss: 1.239, per_step_time: 1472ms, lr: 3.0299557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:53,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.43232 samples/s/p 1:01:09 } +2024-07-26 00:11:56,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 760/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 3.026778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:56,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.42967 samples/s/p 1:01:08 } +2024-07-26 00:11:59,850 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 762/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 3.0236024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:59,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.43272 samples/s/p 1:01:03 } +2024-07-26 00:12:02,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 764/ 1625], loss: 1.068, per_step_time: 1473ms, lr: 3.0204305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:02,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.42962 samples/s/p 1:01:02 } +2024-07-26 00:12:05,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 766/ 1625], loss: 1.281, per_step_time: 1470ms, lr: 3.0172578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:05,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.43903 samples/s/p 1:00:53 } +2024-07-26 00:12:08,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 768/ 1625], loss: 1.183, per_step_time: 1468ms, lr: 3.0140895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:08,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.44630 samples/s/p 1:00:45 } +2024-07-26 00:12:11,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 770/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 3.0109254e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:11,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.43331 samples/s/p 1:00:51 } +2024-07-26 00:12:14,597 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 772/ 1625], loss: 1.137, per_step_time: 1470ms, lr: 3.0077595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:14,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.44033 samples/s/p 1:00:43 } +2024-07-26 00:12:17,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 774/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 3.004599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:17,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43597 samples/s/p 1:00:43 } +2024-07-26 00:12:20,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 776/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 3.0014398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:20,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43975 samples/s/p 1:00:38 } +2024-07-26 00:12:23,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 778/ 1625], loss: 1.340, per_step_time: 1472ms, lr: 2.9982812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:23,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43408 samples/s/p 1:00:39 } +2024-07-26 00:12:26,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 780/ 1625], loss: 1.123, per_step_time: 1470ms, lr: 2.9951293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:26,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.44074 samples/s/p 1:00:31 } +2024-07-26 00:12:29,345 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 782/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 2.9919756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:29,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43510 samples/s/p 1:00:32 } +2024-07-26 00:12:32,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 784/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 2.9888242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:32,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43445 samples/s/p 1:00:30 } +2024-07-26 00:12:35,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 786/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 2.9856783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:35,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43710 samples/s/p 1:00:25 } +2024-07-26 00:12:38,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 788/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 2.9825324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:38,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43341 samples/s/p 1:00:24 } +2024-07-26 00:12:41,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 790/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 2.9793891e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:41,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43283 samples/s/p 1:00:22 } +2024-07-26 00:12:44,099 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 792/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 2.9762482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:44,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43877 samples/s/p 1:00:15 } +2024-07-26 00:12:47,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 794/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.97311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:47,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43265 samples/s/p 1:00:16 } +2024-07-26 00:12:50,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 796/ 1625], loss: 1.261, per_step_time: 1473ms, lr: 2.9699736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:50,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.42920 samples/s/p 1:00:16 } +2024-07-26 00:12:52,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 798/ 1625], loss: 1.240, per_step_time: 1469ms, lr: 2.96684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:52,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.44271 samples/s/p 1:00:04 } +2024-07-26 00:12:55,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 800/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 2.9637085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:55,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43371 samples/s/p 1:00:07 } +2024-07-26 00:12:58,855 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 802/ 1625], loss: 1.042, per_step_time: 1472ms, lr: 2.960579e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:58,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43428 samples/s/p 1:00:03 } +2024-07-26 00:13:01,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 804/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.9574521e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:01,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43356 samples/s/p 1:00:01 } +2024-07-26 00:13:04,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 806/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 2.954328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:04,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.42786 samples/s/p 1:00:02 } +2024-07-26 00:13:07,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 808/ 1625], loss: 1.087, per_step_time: 1473ms, lr: 2.9512053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:07,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43043 samples/s/p 0:59:57 } +2024-07-26 00:13:10,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 810/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 2.9480843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:10,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.44131 samples/s/p 0:59:47 } +2024-07-26 00:13:13,613 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 812/ 1625], loss: 1.103, per_step_time: 1471ms, lr: 2.944967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:13,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43593 samples/s/p 0:59:47 } +2024-07-26 00:13:16,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 814/ 1625], loss: 1.246, per_step_time: 1473ms, lr: 2.941853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:16,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.42859 samples/s/p 0:59:49 } +2024-07-26 00:13:19,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 816/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.9387393e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:19,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43143 samples/s/p 0:59:45 } +2024-07-26 00:13:22,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 818/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 2.9356302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:22,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43287 samples/s/p 0:59:41 } +2024-07-26 00:13:25,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 820/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.9325206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:25,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43323 samples/s/p 0:59:37 } +2024-07-26 00:13:28,376 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 822/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.9294138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:28,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43330 samples/s/p 0:59:34 } +2024-07-26 00:13:31,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 824/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 2.926312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:31,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43211 samples/s/p 0:59:32 } +2024-07-26 00:13:34,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 826/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.9232092e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:34,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43318 samples/s/p 0:59:29 } +2024-07-26 00:13:37,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 828/ 1625], loss: 1.355, per_step_time: 1472ms, lr: 2.9201092e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:37,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43331 samples/s/p 0:59:26 } +2024-07-26 00:13:40,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 830/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 2.9170133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:40,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43391 samples/s/p 0:59:22 } +2024-07-26 00:13:43,137 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 832/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 2.91392e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:43,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43270 samples/s/p 0:59:20 } +2024-07-26 00:13:46,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 834/ 1625], loss: 1.292, per_step_time: 1470ms, lr: 2.9108269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:46,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43856 samples/s/p 0:59:13 } +2024-07-26 00:13:49,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 836/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 2.9077378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:49,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43960 samples/s/p 0:59:10 } +2024-07-26 00:13:51,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 838/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 2.9046491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:51,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43877 samples/s/p 0:59:07 } +2024-07-26 00:13:54,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 840/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.9015653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:54,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43646 samples/s/p 0:59:06 } +2024-07-26 00:13:57,883 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 842/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.8984814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:57,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43658 samples/s/p 0:59:03 } +2024-07-26 00:14:00,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 844/ 1625], loss: 1.302, per_step_time: 1472ms, lr: 2.8954005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:00,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43145 samples/s/p 0:59:03 } +2024-07-26 00:14:03,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 846/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 2.8923228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:03,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43635 samples/s/p 0:58:57 } +2024-07-26 00:14:06,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 848/ 1625], loss: 1.067, per_step_time: 1471ms, lr: 2.8892468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:06,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43798 samples/s/p 0:58:53 } +2024-07-26 00:14:09,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 850/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 2.8861737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:09,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43835 samples/s/p 0:58:50 } +2024-07-26 00:14:12,639 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 852/ 1625], loss: 1.092, per_step_time: 1473ms, lr: 2.8831018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:12,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43028 samples/s/p 0:58:52 } +2024-07-26 00:14:15,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 854/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 2.8800328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:15,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43196 samples/s/p 0:58:48 } +2024-07-26 00:14:18,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 856/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 2.8769664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:18,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43113 samples/s/p 0:58:46 } +2024-07-26 00:14:21,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 858/ 1625], loss: 1.232, per_step_time: 1470ms, lr: 2.8739028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:21,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43867 samples/s/p 0:58:38 } +2024-07-26 00:14:24,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 860/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 2.8708405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:24,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43800 samples/s/p 0:58:35 } +2024-07-26 00:14:27,394 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 862/ 1625], loss: 1.150, per_step_time: 1472ms, lr: 2.8677819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:27,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43345 samples/s/p 0:58:35 } +2024-07-26 00:14:30,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 864/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 2.864725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:30,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43556 samples/s/p 0:58:31 } +2024-07-26 00:14:33,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 866/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 2.861669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:33,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43549 samples/s/p 0:58:28 } +2024-07-26 00:14:36,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 868/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.8586173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:36,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43368 samples/s/p 0:58:27 } +2024-07-26 00:14:39,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 870/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 2.8555673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:39,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43652 samples/s/p 0:58:22 } +2024-07-26 00:14:42,148 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 872/ 1625], loss: 1.303, per_step_time: 1471ms, lr: 2.8525174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:42,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43486 samples/s/p 0:58:20 } +2024-07-26 00:14:45,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 874/ 1625], loss: 1.195, per_step_time: 1469ms, lr: 2.8494742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:45,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.44347 samples/s/p 0:58:11 } +2024-07-26 00:14:48,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 876/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 2.846431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:48,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43531 samples/s/p 0:58:14 } +2024-07-26 00:14:50,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 878/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.8433897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:50,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43629 samples/s/p 0:58:10 } +2024-07-26 00:14:53,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 880/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 2.840351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:53,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43243 samples/s/p 0:58:10 } +2024-07-26 00:14:56,897 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 882/ 1625], loss: 1.040, per_step_time: 1471ms, lr: 2.8373138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:56,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43793 samples/s/p 0:58:03 } +2024-07-26 00:14:59,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 884/ 1625], loss: 1.003, per_step_time: 1471ms, lr: 2.834281e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:59,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43643 samples/s/p 0:58:01 } +2024-07-26 00:15:02,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 886/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 2.8312493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:02,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43550 samples/s/p 0:57:59 } +2024-07-26 00:15:05,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 888/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 2.8282202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:05,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43959 samples/s/p 0:57:53 } +2024-07-26 00:15:08,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 890/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 2.8251925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:08,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43203 samples/s/p 0:57:55 } +2024-07-26 00:15:11,649 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 892/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.8221684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:11,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43643 samples/s/p 0:57:49 } +2024-07-26 00:15:14,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 894/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 2.8191462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:14,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.44044 samples/s/p 0:57:44 } +2024-07-26 00:15:17,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 896/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 2.8161264e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:17,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43852 samples/s/p 0:57:42 } +2024-07-26 00:15:20,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 898/ 1625], loss: 1.000, per_step_time: 1469ms, lr: 2.8131085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:20,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.44288 samples/s/p 0:57:36 } +2024-07-26 00:15:23,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 900/ 1625], loss: 1.073, per_step_time: 1472ms, lr: 2.810094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:23,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43120 samples/s/p 0:57:41 } +2024-07-26 00:15:26,400 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 902/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.8070801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:26,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43149 samples/s/p 0:57:38 } +2024-07-26 00:15:29,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 904/ 1625], loss: 0.917, per_step_time: 1471ms, lr: 2.8040708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:29,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43654 samples/s/p 0:57:32 } +2024-07-26 00:15:32,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 906/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 2.801064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:32,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43571 samples/s/p 0:57:29 } +2024-07-26 00:15:35,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 908/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 2.7980554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:35,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43775 samples/s/p 0:57:25 } +2024-07-26 00:15:38,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 910/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 2.795052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:38,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43432 samples/s/p 0:57:24 } +2024-07-26 00:15:41,155 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 912/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 2.7920532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:41,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.42861 samples/s/p 0:57:25 } +2024-07-26 00:15:44,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 914/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.7890542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:44,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43262 samples/s/p 0:57:19 } +2024-07-26 00:15:47,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 916/ 1625], loss: 0.870, per_step_time: 1472ms, lr: 2.7860576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:47,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43216 samples/s/p 0:57:17 } +2024-07-26 00:15:50,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 918/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.7830638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:50,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43660 samples/s/p 0:57:11 } +2024-07-26 00:15:52,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 920/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.7800718e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:52,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43587 samples/s/p 0:57:09 } +2024-07-26 00:15:55,911 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 922/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 2.7770823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:55,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43542 samples/s/p 0:57:06 } +2024-07-26 00:15:58,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 924/ 1625], loss: 1.066, per_step_time: 1472ms, lr: 2.7740953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:58,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43406 samples/s/p 0:57:04 } +2024-07-26 00:16:01,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 926/ 1625], loss: 1.031, per_step_time: 1472ms, lr: 2.771111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:01,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43407 samples/s/p 0:57:01 } +2024-07-26 00:16:04,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 928/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.7681276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:04,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43281 samples/s/p 0:56:59 } +2024-07-26 00:16:07,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 930/ 1625], loss: 0.997, per_step_time: 1471ms, lr: 2.7651486e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:07,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43551 samples/s/p 0:56:54 } +2024-07-26 00:16:10,667 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 932/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.7621702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:10,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43843 samples/s/p 0:56:49 } +2024-07-26 00:16:13,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 934/ 1625], loss: 1.073, per_step_time: 1473ms, lr: 2.7591964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:13,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.42971 samples/s/p 0:56:52 } +2024-07-26 00:16:16,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 936/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.7562223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:16,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43297 samples/s/p 0:56:47 } +2024-07-26 00:16:19,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 938/ 1625], loss: 1.038, per_step_time: 1470ms, lr: 2.7532528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:19,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43880 samples/s/p 0:56:40 } +2024-07-26 00:16:22,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 940/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 2.750283e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:22,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43500 samples/s/p 0:56:40 } +2024-07-26 00:16:25,431 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 942/ 1625], loss: 1.108, per_step_time: 1475ms, lr: 2.747317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:25,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.42126 samples/s/p 0:56:45 } +2024-07-26 00:16:28,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 944/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.744356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:28,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43326 samples/s/p 0:56:35 } +2024-07-26 00:16:31,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 946/ 1625], loss: 0.959, per_step_time: 1470ms, lr: 2.7413932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:31,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43964 samples/s/p 0:56:28 } +2024-07-26 00:16:34,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 948/ 1625], loss: 0.966, per_step_time: 1470ms, lr: 2.738434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:34,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43873 samples/s/p 0:56:26 } +2024-07-26 00:16:37,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 950/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 2.735479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:37,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.44157 samples/s/p 0:56:21 } +2024-07-26 00:16:40,180 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 952/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 2.732524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:40,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43443 samples/s/p 0:56:22 } +2024-07-26 00:16:43,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 954/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.7295719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:43,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43111 samples/s/p 0:56:21 } +2024-07-26 00:16:46,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 956/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.7266237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:46,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43390 samples/s/p 0:56:17 } +2024-07-26 00:16:49,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 958/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 2.7236756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:49,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43178 samples/s/p 0:56:15 } +2024-07-26 00:16:51,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 960/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.720732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:51,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43147 samples/s/p 0:56:12 } +2024-07-26 00:16:54,939 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 962/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 2.7177894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:54,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43792 samples/s/p 0:56:05 } +2024-07-26 00:16:57,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 964/ 1625], loss: 1.026, per_step_time: 1471ms, lr: 2.714848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:57,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43609 samples/s/p 0:56:04 } +2024-07-26 00:17:00,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 966/ 1625], loss: 1.189, per_step_time: 1470ms, lr: 2.7119122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:00,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.44194 samples/s/p 0:55:57 } +2024-07-26 00:17:03,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 968/ 1625], loss: 0.983, per_step_time: 1472ms, lr: 2.7089773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:03,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.43248 samples/s/p 0:56:00 } +2024-07-26 00:17:06,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 970/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 2.7060437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:06,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.43579 samples/s/p 0:55:55 } +2024-07-26 00:17:09,693 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 972/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.703113e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:09,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.42931 samples/s/p 0:55:56 } +2024-07-26 00:17:12,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 974/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 2.700185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:12,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.43766 samples/s/p 0:55:48 } +2024-07-26 00:17:15,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 976/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.6972593e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:15,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.43362 samples/s/p 0:55:48 } +2024-07-26 00:17:18,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 978/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 2.6943355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:18,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.43230 samples/s/p 0:55:45 } +2024-07-26 00:17:21,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 980/ 1625], loss: 1.079, per_step_time: 1473ms, lr: 2.6914145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:21,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.42981 samples/s/p 0:55:44 } +2024-07-26 00:17:24,450 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 982/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 2.6884966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:24,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.43764 samples/s/p 0:55:36 } +2024-07-26 00:17:27,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 984/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 2.6855796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:27,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43578 samples/s/p 0:55:34 } +2024-07-26 00:17:30,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 986/ 1625], loss: 1.115, per_step_time: 1474ms, lr: 2.6826654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:30,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.42665 samples/s/p 0:55:37 } +2024-07-26 00:17:33,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 988/ 1625], loss: 1.194, per_step_time: 1474ms, lr: 2.679756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:33,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.42721 samples/s/p 0:55:34 } +2024-07-26 00:17:36,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 990/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 2.6768446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:36,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43374 samples/s/p 0:55:27 } +2024-07-26 00:17:39,212 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 992/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 2.673938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:39,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43629 samples/s/p 0:55:22 } +2024-07-26 00:17:42,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 994/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 2.671035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:42,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43714 samples/s/p 0:55:19 } +2024-07-26 00:17:45,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 996/ 1625], loss: 1.190, per_step_time: 1474ms, lr: 2.668131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:45,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.42684 samples/s/p 0:55:22 } +2024-07-26 00:17:48,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 998/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 2.6652315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:48,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43764 samples/s/p 0:55:13 } +2024-07-26 00:17:51,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1000/ 1625], loss: 1.319, per_step_time: 1469ms, lr: 2.662336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:51,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.44290 samples/s/p 0:55:07 } +2024-07-26 00:17:51,014 - 
mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-26 00:18:27,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1002/ 1625], loss: 1.150, per_step_time: 2292ms, lr: 2.659439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:27,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 3.48909 samples/s/p 1:25:54 } +2024-07-26 00:18:29,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1004/ 1625], loss: 1.076, per_step_time: 1474ms, lr: 2.656548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:29,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.42527 samples/s/p 0:55:11 } +2024-07-26 00:18:32,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1006/ 1625], loss: 1.134, per_step_time: 1469ms, lr: 2.653658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:32,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.44477 samples/s/p 0:54:57 } +2024-07-26 00:18:35,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1008/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.6507678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:35,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.43741 samples/s/p 0:54:58 } +2024-07-26 00:18:38,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1010/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.6478838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:38,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% 
|███████████████████████████████████████████ | 5.43279 samples/s/p 0:54:58 } +2024-07-26 00:18:41,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1012/ 1625], loss: 0.992, per_step_time: 1471ms, lr: 2.6450007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:41,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.43609 samples/s/p 0:54:53 } +2024-07-26 00:18:44,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1014/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.6421183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:44,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.43785 samples/s/p 0:54:49 } +2024-07-26 00:18:47,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1016/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.639241e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:47,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.43349 samples/s/p 0:54:49 } +2024-07-26 00:18:50,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1018/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 2.6363648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:50,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.44153 samples/s/p 0:54:41 } +2024-07-26 00:18:53,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1020/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 2.633492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:53,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% 
|███████████████████████████████████████████ | 5.43639 samples/s/p 0:54:41 } +2024-07-26 00:18:56,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1022/ 1625], loss: 1.070, per_step_time: 1470ms, lr: 2.6306209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:56,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.44024 samples/s/p 0:54:36 } +2024-07-26 00:18:59,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1024/ 1625], loss: 1.351, per_step_time: 1472ms, lr: 2.6277507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:59,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.43242 samples/s/p 0:54:38 } +2024-07-26 00:19:02,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1026/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 2.6248856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:02,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.43683 samples/s/p 0:54:32 } +2024-07-26 00:19:05,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1028/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 2.6220205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:05,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.43538 samples/s/p 0:54:30 } +2024-07-26 00:19:08,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1030/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.619159e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:08,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% 
|███████████████████████████████████████████ | 5.43369 samples/s/p 0:54:28 } +2024-07-26 00:19:11,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1032/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 2.616301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:11,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43187 samples/s/p 0:54:26 } +2024-07-26 00:19:14,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1034/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 2.613442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:14,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43198 samples/s/p 0:54:23 } +2024-07-26 00:19:17,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1036/ 1625], loss: 1.320, per_step_time: 1472ms, lr: 2.6105872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:17,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43354 samples/s/p 0:54:19 } +2024-07-26 00:19:20,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1038/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 2.6077369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:20,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43292 samples/s/p 0:54:17 } +2024-07-26 00:19:23,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1040/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.6048856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:23,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% 
|███████████████████████████████████████████ | 5.43157 samples/s/p 0:54:15 } +2024-07-26 00:19:26,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1042/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 2.6020389e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:26,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43242 samples/s/p 0:54:11 } +2024-07-26 00:19:29,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1044/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.5991944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:29,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43697 samples/s/p 0:54:05 } +2024-07-26 00:19:31,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1046/ 1625], loss: 1.062, per_step_time: 1470ms, lr: 2.5963493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:31,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.44104 samples/s/p 0:54:00 } +2024-07-26 00:19:34,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1048/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 2.593511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:34,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43130 samples/s/p 0:54:03 } +2024-07-26 00:19:37,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1050/ 1625], loss: 1.452, per_step_time: 1471ms, lr: 2.590673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:37,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% 
|███████████████████████████████████████████ | 5.43750 samples/s/p 0:53:56 } +2024-07-26 00:19:40,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1052/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 2.5878362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:40,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.42948 samples/s/p 0:53:58 } +2024-07-26 00:19:43,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1054/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 2.585004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:43,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.43111 samples/s/p 0:53:54 } +2024-07-26 00:19:46,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1056/ 1625], loss: 1.037, per_step_time: 1472ms, lr: 2.5821737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:46,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.43408 samples/s/p 0:53:49 } +2024-07-26 00:19:49,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1058/ 1625], loss: 1.155, per_step_time: 1478ms, lr: 2.5793431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:49,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.41137 samples/s/p 0:54:00 } +2024-07-26 00:19:52,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1060/ 1625], loss: 1.268, per_step_time: 1472ms, lr: 2.5765178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:52,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% 
|███████████████████████████████████████████ | 5.43261 samples/s/p 0:53:44 } +2024-07-26 00:19:55,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1062/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 2.573695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:55,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.43918 samples/s/p 0:53:38 } +2024-07-26 00:19:58,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1064/ 1625], loss: 1.249, per_step_time: 1471ms, lr: 2.5708741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:58,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.43482 samples/s/p 0:53:37 } +2024-07-26 00:20:01,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1066/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 2.568054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:01,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.43331 samples/s/p 0:53:35 } +2024-07-26 00:20:04,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1068/ 1625], loss: 1.254, per_step_time: 1474ms, lr: 2.5652375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:04,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.42669 samples/s/p 0:53:36 } +2024-07-26 00:20:07,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1070/ 1625], loss: 1.088, per_step_time: 1472ms, lr: 2.5624233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:07,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% 
|███████████████████████████████████████████ | 5.43377 samples/s/p 0:53:29 } +2024-07-26 00:20:10,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1072/ 1625], loss: 1.112, per_step_time: 1477ms, lr: 2.5596119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:10,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.41455 samples/s/p 0:53:37 } +2024-07-26 00:20:13,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1074/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 2.556802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:13,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.43696 samples/s/p 0:53:21 } +2024-07-26 00:20:16,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1076/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 2.5539966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:16,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.43248 samples/s/p 0:53:21 } +2024-07-26 00:20:19,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1078/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 2.5511913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:19,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.43911 samples/s/p 0:53:14 } +2024-07-26 00:20:22,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1080/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.5483885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:22,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% 
|███████████████████████████████████████████ | 5.43223 samples/s/p 0:53:15 } +2024-07-26 00:20:25,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1082/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 2.54559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:25,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.42961 samples/s/p 0:53:14 } +2024-07-26 00:20:28,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1084/ 1625], loss: 1.008, per_step_time: 1469ms, lr: 2.5427914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:28,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.44229 samples/s/p 0:53:03 } +2024-07-26 00:20:31,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1086/ 1625], loss: 1.048, per_step_time: 1473ms, lr: 2.5399972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:31,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.43060 samples/s/p 0:53:07 } +2024-07-26 00:20:33,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1088/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.5372049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:33,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.43414 samples/s/p 0:53:02 } +2024-07-26 00:20:36,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1090/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 2.5344134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:36,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% 
|███████████████████████████████████████████ | 5.44010 samples/s/p 0:52:56 } +2024-07-26 00:20:39,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1092/ 1625], loss: 1.072, per_step_time: 1474ms, lr: 2.5316276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:39,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.42622 samples/s/p 0:53:01 } +2024-07-26 00:20:42,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1094/ 1625], loss: 1.074, per_step_time: 1475ms, lr: 2.5288423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:42,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.42292 samples/s/p 0:53:00 } +2024-07-26 00:20:45,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1096/ 1625], loss: 1.088, per_step_time: 1472ms, lr: 2.5260574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:45,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.43140 samples/s/p 0:52:52 } +2024-07-26 00:20:48,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1098/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 2.523278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:48,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.43267 samples/s/p 0:52:48 } +2024-07-26 00:20:51,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1100/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 2.5204995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:51,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% 
|███████████████████████████████████████████ | 5.43014 samples/s/p 0:52:47 } +2024-07-26 00:20:54,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1102/ 1625], loss: 1.340, per_step_time: 1473ms, lr: 2.5177233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:54,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.42924 samples/s/p 0:52:45 } +2024-07-26 00:20:57,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1104/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 2.514951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:57,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.43509 samples/s/p 0:52:38 } +2024-07-26 00:21:00,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1106/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 2.512179e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:00,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.43379 samples/s/p 0:52:36 } +2024-07-26 00:21:03,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1108/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 2.50941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:03,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.43038 samples/s/p 0:52:35 } +2024-07-26 00:21:06,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1110/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.5066433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:06,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% 
|███████████████████████████████████████████ | 5.43124 samples/s/p 0:52:32 } +2024-07-26 00:21:09,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1112/ 1625], loss: 1.253, per_step_time: 1469ms, lr: 2.5038803e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:09,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.44391 samples/s/p 0:52:21 } +2024-07-26 00:21:12,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1114/ 1625], loss: 1.314, per_step_time: 1471ms, lr: 2.501119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:12,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43525 samples/s/p 0:52:23 } +2024-07-26 00:21:15,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1116/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 2.4983597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:15,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43433 samples/s/p 0:52:21 } +2024-07-26 00:21:18,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1118/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 2.4956034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:18,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.42853 samples/s/p 0:52:21 } +2024-07-26 00:21:21,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1120/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 2.49285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:21,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% 
|███████████████████████████████████████████ | 5.43515 samples/s/p 0:52:15 } +2024-07-26 00:21:24,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1122/ 1625], loss: 1.030, per_step_time: 1474ms, lr: 2.4900962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:24,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.42702 samples/s/p 0:52:16 } +2024-07-26 00:21:27,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1124/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 2.487347e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:27,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43183 samples/s/p 0:52:11 } +2024-07-26 00:21:30,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1126/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.4846013e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:30,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43137 samples/s/p 0:52:08 } +2024-07-26 00:21:33,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1128/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 2.4818555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:33,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43901 samples/s/p 0:52:01 } +2024-07-26 00:21:35,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1130/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 2.4791148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:35,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% 
|███████████████████████████████████████████ | 5.42788 samples/s/p 0:52:04 } +2024-07-26 00:21:38,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1132/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 2.4763742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:38,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43711 samples/s/p 0:51:56 } +2024-07-26 00:21:41,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1134/ 1625], loss: 1.130, per_step_time: 1473ms, lr: 2.4736355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:41,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43095 samples/s/p 0:51:56 } +2024-07-26 00:21:44,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1136/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 2.4709016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:44,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43141 samples/s/p 0:51:53 } +2024-07-26 00:21:47,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1138/ 1625], loss: 1.050, per_step_time: 1472ms, lr: 2.468169e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:47,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43310 samples/s/p 0:51:49 } +2024-07-26 00:21:50,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1140/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 2.4654378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:50,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% 
|███████████████████████████████████████████ | 5.43206 samples/s/p 0:51:47 } +2024-07-26 00:21:53,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1142/ 1625], loss: 1.329, per_step_time: 1473ms, lr: 2.462711e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:53,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43071 samples/s/p 0:51:45 } +2024-07-26 00:21:56,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1144/ 1625], loss: 0.891, per_step_time: 1471ms, lr: 2.4599851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:56,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43758 samples/s/p 0:51:38 } +2024-07-26 00:21:59,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1146/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 2.4572619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:59,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.43386 samples/s/p 0:51:37 } +2024-07-26 00:22:02,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1148/ 1625], loss: 1.045, per_step_time: 1473ms, lr: 2.454542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:02,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.43029 samples/s/p 0:51:36 } +2024-07-26 00:22:05,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1150/ 1625], loss: 1.039, per_step_time: 1470ms, lr: 2.451823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:05,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% 
|███████████████████████████████████████████ | 5.43890 samples/s/p 0:51:28 } +2024-07-26 00:22:08,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1152/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.4491073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:08,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.43704 samples/s/p 0:51:26 } +2024-07-26 00:22:11,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1154/ 1625], loss: 1.103, per_step_time: 1474ms, lr: 2.4463939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:11,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.42564 samples/s/p 0:51:30 } +2024-07-26 00:22:14,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1156/ 1625], loss: 0.980, per_step_time: 1470ms, lr: 2.4436843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:14,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.43968 samples/s/p 0:51:19 } +2024-07-26 00:22:17,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1158/ 1625], loss: 1.250, per_step_time: 1471ms, lr: 2.4409746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:17,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.43606 samples/s/p 0:51:18 } +2024-07-26 00:22:20,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1160/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 2.438269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:20,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% 
|███████████████████████████████████████████ | 5.43364 samples/s/p 0:51:17 } +2024-07-26 00:22:23,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1162/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 2.4355654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:23,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43432 samples/s/p 0:51:13 } +2024-07-26 00:22:26,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1164/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 2.4328629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:26,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43466 samples/s/p 0:51:10 } +2024-07-26 00:22:29,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1166/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.4301635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:29,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43388 samples/s/p 0:51:08 } +2024-07-26 00:22:32,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1168/ 1625], loss: 1.249, per_step_time: 1474ms, lr: 2.427468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:32,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.42465 samples/s/p 0:51:10 } +2024-07-26 00:22:34,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1170/ 1625], loss: 1.032, per_step_time: 1470ms, lr: 2.424775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:34,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% 
|███████████████████████████████████████████ | 5.44054 samples/s/p 0:50:58 } +2024-07-26 00:22:37,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1172/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.4220817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:37,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43365 samples/s/p 0:50:59 } +2024-07-26 00:22:40,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1174/ 1625], loss: 1.028, per_step_time: 1470ms, lr: 2.4193941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:40,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43900 samples/s/p 0:50:53 } +2024-07-26 00:22:43,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1176/ 1625], loss: 1.135, per_step_time: 1469ms, lr: 2.416707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:43,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.44239 samples/s/p 0:50:48 } +2024-07-26 00:22:46,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1178/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 2.4140209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:46,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43250 samples/s/p 0:50:51 } +2024-07-26 00:22:49,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1180/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 2.41134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:49,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% 
|███████████████████████████████████████████ | 5.43760 samples/s/p 0:50:45 } +2024-07-26 00:22:52,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1182/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 2.4086607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:52,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.43991 samples/s/p 0:50:41 } +2024-07-26 00:22:55,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1184/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 2.4059823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:55,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.43542 samples/s/p 0:50:40 } +2024-07-26 00:22:58,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1186/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 2.4033093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:58,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.43597 samples/s/p 0:50:37 } +2024-07-26 00:23:01,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1188/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 2.4006358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:01,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.43449 samples/s/p 0:50:35 } +2024-07-26 00:23:04,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1190/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 2.3979662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:04,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% 
|███████████████████████████████████████████ | 5.43073 samples/s/p 0:50:34 } +2024-07-26 00:23:07,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1192/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 2.3952991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:07,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.43642 samples/s/p 0:50:28 } +2024-07-26 00:23:10,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1194/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 2.3926336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:10,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.43613 samples/s/p 0:50:25 } +2024-07-26 00:23:13,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1196/ 1625], loss: 1.041, per_step_time: 1472ms, lr: 2.3899709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:13,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43422 samples/s/p 0:50:23 } +2024-07-26 00:23:16,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1198/ 1625], loss: 0.980, per_step_time: 1472ms, lr: 2.38731e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:16,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43453 samples/s/p 0:50:20 } +2024-07-26 00:23:19,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1200/ 1625], loss: 1.066, per_step_time: 1484ms, lr: 2.3846521e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:19,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% 
|███████████████████████████████████████████ | 5.38789 samples/s/p 0:50:43 } +2024-07-26 00:23:22,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1202/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 2.3819962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:22,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43307 samples/s/p 0:50:15 } +2024-07-26 00:23:25,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1204/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 2.3793439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:25,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43987 samples/s/p 0:50:08 } +2024-07-26 00:23:28,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1206/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 2.3766931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:28,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43645 samples/s/p 0:50:07 } +2024-07-26 00:23:31,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1208/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 2.374045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:31,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43471 samples/s/p 0:50:05 } +2024-07-26 00:23:34,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1210/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.3713997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:34,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% 
|███████████████████████████████████████████ | 5.43128 samples/s/p 0:50:04 } +2024-07-26 00:23:36,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1212/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 2.3687567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:36,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43796 samples/s/p 0:49:58 } +2024-07-26 00:23:39,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1214/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 2.3661146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:39,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43161 samples/s/p 0:49:58 } +2024-07-26 00:23:42,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1216/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 2.363476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:42,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43397 samples/s/p 0:49:54 } +2024-07-26 00:23:45,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1218/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.3608425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:45,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43258 samples/s/p 0:49:52 } +2024-07-26 00:23:48,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1220/ 1625], loss: 1.270, per_step_time: 1473ms, lr: 2.3582083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:48,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% 
|███████████████████████████████████████████ | 5.43059 samples/s/p 0:49:50 } +2024-07-26 00:23:51,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1222/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 2.3555756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:51,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43845 samples/s/p 0:49:43 } +2024-07-26 00:23:54,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1224/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.3529483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:54,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43495 samples/s/p 0:49:42 } +2024-07-26 00:23:57,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1226/ 1625], loss: 1.151, per_step_time: 1474ms, lr: 2.3503226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:57,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.42639 samples/s/p 0:49:43 } +2024-07-26 00:24:00,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1228/ 1625], loss: 1.219, per_step_time: 1473ms, lr: 2.3476969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:00,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.42958 samples/s/p 0:49:39 } +2024-07-26 00:24:03,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1230/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 2.3450757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:03,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% 
|███████████████████████████████████████████ | 5.43138 samples/s/p 0:49:35 } +2024-07-26 00:24:06,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1232/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 2.3424568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:06,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.43523 samples/s/p 0:49:30 } +2024-07-26 00:24:09,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1234/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 2.3398406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:09,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.44117 samples/s/p 0:49:24 } +2024-07-26 00:24:12,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1236/ 1625], loss: 0.972, per_step_time: 1470ms, lr: 2.3372272e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:12,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.43901 samples/s/p 0:49:22 } +2024-07-26 00:24:15,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1238/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.3346147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:15,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.43779 samples/s/p 0:49:20 } +2024-07-26 00:24:18,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1240/ 1625], loss: 1.348, per_step_time: 1472ms, lr: 2.3320054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:18,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% 
|███████████████████████████████████████████ | 5.43432 samples/s/p 0:49:18 } +2024-07-26 00:24:21,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1242/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.3293978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:21,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.43156 samples/s/p 0:49:17 } +2024-07-26 00:24:24,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1244/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.326794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:24,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43241 samples/s/p 0:49:14 } +2024-07-26 00:24:27,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1246/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 2.3241914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:27,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43632 samples/s/p 0:49:09 } +2024-07-26 00:24:30,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1248/ 1625], loss: 1.277, per_step_time: 1474ms, lr: 2.3215916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:30,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.42582 samples/s/p 0:49:11 } +2024-07-26 00:24:33,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1250/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 2.3189946e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:33,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% 
|███████████████████████████████████████████ | 5.43061 samples/s/p 0:49:06 } +2024-07-26 00:24:36,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1252/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 2.3164002e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:36,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43298 samples/s/p 0:49:02 } +2024-07-26 00:24:38,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1254/ 1625], loss: 1.057, per_step_time: 1472ms, lr: 2.3138073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:38,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43464 samples/s/p 0:48:58 } +2024-07-26 00:24:41,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1256/ 1625], loss: 1.316, per_step_time: 1474ms, lr: 2.3112189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:41,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.42651 samples/s/p 0:48:59 } +2024-07-26 00:24:44,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1258/ 1625], loss: 0.945, per_step_time: 1472ms, lr: 2.3086304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:44,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43214 samples/s/p 0:48:53 } +2024-07-26 00:24:47,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1260/ 1625], loss: 1.120, per_step_time: 1470ms, lr: 2.3060452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:47,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% 
|███████████████████████████████████████████ | 5.44087 samples/s/p 0:48:46 } +2024-07-26 00:24:50,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1262/ 1625], loss: 1.269, per_step_time: 1474ms, lr: 2.3034638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:50,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.42673 samples/s/p 0:48:50 } +2024-07-26 00:24:53,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1264/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 2.3008822e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:53,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.43357 samples/s/p 0:48:44 } +2024-07-26 00:24:56,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1266/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.298304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:56,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.43713 samples/s/p 0:48:39 } +2024-07-26 00:24:59,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1268/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.295731e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:59,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.43528 samples/s/p 0:48:37 } +2024-07-26 00:25:02,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1270/ 1625], loss: 0.994, per_step_time: 1470ms, lr: 2.2931574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:02,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% 
|███████████████████████████████████████████ | 5.43955 samples/s/p 0:48:32 } +2024-07-26 00:25:05,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1272/ 1625], loss: 1.139, per_step_time: 1469ms, lr: 2.290587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:05,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.44443 samples/s/p 0:48:26 } +2024-07-26 00:25:08,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1274/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 2.2880185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:08,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.43741 samples/s/p 0:48:27 } +2024-07-26 00:25:11,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1276/ 1625], loss: 1.382, per_step_time: 1473ms, lr: 2.2854533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:11,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.42903 samples/s/p 0:48:28 } +2024-07-26 00:25:14,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1278/ 1625], loss: 1.060, per_step_time: 1471ms, lr: 2.2828908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:14,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.43498 samples/s/p 0:48:22 } +2024-07-26 00:25:17,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1280/ 1625], loss: 1.104, per_step_time: 1469ms, lr: 2.28033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:17,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% 
|███████████████████████████████████████████ | 5.44226 samples/s/p 0:48:15 } +2024-07-26 00:25:20,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1282/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 2.2777717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:20,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.44052 samples/s/p 0:48:13 } +2024-07-26 00:25:23,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1284/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.275216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:23,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.43762 samples/s/p 0:48:12 } +2024-07-26 00:25:26,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1286/ 1625], loss: 1.319, per_step_time: 1473ms, lr: 2.2726622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:26,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.42767 samples/s/p 0:48:14 } +2024-07-26 00:25:29,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1288/ 1625], loss: 1.039, per_step_time: 1471ms, lr: 2.2701108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:29,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.43631 samples/s/p 0:48:07 } +2024-07-26 00:25:32,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1290/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 2.267563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:32,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% 
|███████████████████████████████████████████ | 5.43707 samples/s/p 0:48:03 } +2024-07-26 00:25:35,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1292/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 2.265017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:35,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.43795 samples/s/p 0:48:00 } +2024-07-26 00:25:37,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1294/ 1625], loss: 1.176, per_step_time: 1472ms, lr: 2.2624724e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:37,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.43464 samples/s/p 0:47:59 } +2024-07-26 00:25:40,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1296/ 1625], loss: 1.243, per_step_time: 1474ms, lr: 2.2599315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:40,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.42574 samples/s/p 0:48:01 } +2024-07-26 00:25:43,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1298/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 2.2573931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:43,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.43733 samples/s/p 0:47:51 } +2024-07-26 00:25:46,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1300/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.254859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:46,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% 
|████████████████████████████████████████████ | 5.43615 samples/s/p 0:47:49 } +2024-07-26 00:25:49,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1302/ 1625], loss: 1.332, per_step_time: 1473ms, lr: 2.2523225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:49,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.42936 samples/s/p 0:47:50 } +2024-07-26 00:25:52,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1304/ 1625], loss: 0.976, per_step_time: 1471ms, lr: 2.2497911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:52,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.43557 samples/s/p 0:47:44 } +2024-07-26 00:25:55,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1306/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.2472648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:55,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.43309 samples/s/p 0:47:42 } +2024-07-26 00:25:58,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1308/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 2.244736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:58,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.43965 samples/s/p 0:47:36 } +2024-07-26 00:26:01,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1310/ 1625], loss: 1.267, per_step_time: 1475ms, lr: 2.2422114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:01,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% 
|████████████████████████████████████████████ | 5.42073 samples/s/p 0:47:43 } +2024-07-26 00:26:04,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1312/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 2.239692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:04,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.43094 samples/s/p 0:47:34 } +2024-07-26 00:26:07,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1314/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 2.237171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:07,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.43343 samples/s/p 0:47:30 } +2024-07-26 00:26:10,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1316/ 1625], loss: 1.257, per_step_time: 1474ms, lr: 2.234656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:10,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.42411 samples/s/p 0:47:32 } +2024-07-26 00:26:13,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1318/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.2321428e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:13,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.43230 samples/s/p 0:47:25 } +2024-07-26 00:26:16,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1320/ 1625], loss: 1.291, per_step_time: 1472ms, lr: 2.2296304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:16,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% 
|████████████████████████████████████████████ | 5.43236 samples/s/p 0:47:22 } +2024-07-26 00:26:19,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1322/ 1625], loss: 1.075, per_step_time: 1474ms, lr: 2.2271213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:19,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.42390 samples/s/p 0:47:23 } +2024-07-26 00:26:22,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1324/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 2.224614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:22,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.43095 samples/s/p 0:47:17 } +2024-07-26 00:26:25,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1326/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 2.2221093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:25,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.42998 samples/s/p 0:47:14 } +2024-07-26 00:26:28,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1328/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 2.2196073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:28,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43195 samples/s/p 0:47:10 } +2024-07-26 00:26:31,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1330/ 1625], loss: 1.076, per_step_time: 1474ms, lr: 2.217108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:31,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% 
|████████████████████████████████████████████ | 5.42589 samples/s/p 0:47:10 } +2024-07-26 00:26:34,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1332/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 2.21461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:34,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43509 samples/s/p 0:47:03 } +2024-07-26 00:26:37,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1334/ 1625], loss: 1.391, per_step_time: 1471ms, lr: 2.2121158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:37,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43662 samples/s/p 0:46:59 } +2024-07-26 00:26:39,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1336/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.2096242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:39,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43534 samples/s/p 0:46:57 } +2024-07-26 00:26:42,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1338/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 2.2071342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:42,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43411 samples/s/p 0:46:54 } +2024-07-26 00:26:45,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1340/ 1625], loss: 1.295, per_step_time: 1472ms, lr: 2.204648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:45,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% 
|████████████████████████████████████████████ | 5.43443 samples/s/p 0:46:51 } +2024-07-26 00:26:48,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1342/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 2.2021622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:48,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43840 samples/s/p 0:46:46 } +2024-07-26 00:26:51,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1344/ 1625], loss: 1.084, per_step_time: 1473ms, lr: 2.1996816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:51,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43010 samples/s/p 0:46:48 } +2024-07-26 00:26:54,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1346/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 2.1971996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:54,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43565 samples/s/p 0:46:42 } +2024-07-26 00:26:57,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1348/ 1625], loss: 1.028, per_step_time: 1472ms, lr: 2.1947226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:57,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43394 samples/s/p 0:46:40 } +2024-07-26 00:27:00,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1350/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 2.192249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:00,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% 
|████████████████████████████████████████████ | 5.43420 samples/s/p 0:46:37 } +2024-07-26 00:27:03,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1352/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 2.1897754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:03,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43509 samples/s/p 0:46:33 } +2024-07-26 00:27:06,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1354/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.1873045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:06,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43659 samples/s/p 0:46:29 } +2024-07-26 00:27:09,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1356/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.1848386e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:09,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43511 samples/s/p 0:46:27 } +2024-07-26 00:27:12,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1358/ 1625], loss: 1.043, per_step_time: 1470ms, lr: 2.182372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:12,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43919 samples/s/p 0:46:22 } +2024-07-26 00:27:15,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1360/ 1625], loss: 1.318, per_step_time: 1470ms, lr: 2.1799106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:15,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% 
|████████████████████████████████████████████ | 5.44216 samples/s/p 0:46:18 } +2024-07-26 00:27:18,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1362/ 1625], loss: 1.298, per_step_time: 1471ms, lr: 2.1774501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:18,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43524 samples/s/p 0:46:18 } +2024-07-26 00:27:21,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1364/ 1625], loss: 1.409, per_step_time: 1472ms, lr: 2.1749913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:21,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43373 samples/s/p 0:46:16 } +2024-07-26 00:27:24,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1366/ 1625], loss: 1.025, per_step_time: 1472ms, lr: 2.1725377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:24,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43455 samples/s/p 0:46:13 } +2024-07-26 00:27:27,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1368/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 2.1700848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:27,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43064 samples/s/p 0:46:12 } +2024-07-26 00:27:30,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1370/ 1625], loss: 1.246, per_step_time: 1473ms, lr: 2.1676337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:30,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% 
|████████████████████████████████████████████ | 5.42984 samples/s/p 0:46:09 } +2024-07-26 00:27:33,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1372/ 1625], loss: 1.053, per_step_time: 1470ms, lr: 2.1651854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:33,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43857 samples/s/p 0:46:02 } +2024-07-26 00:27:36,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1374/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.1627402e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:36,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43771 samples/s/p 0:45:59 } +2024-07-26 00:27:39,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1376/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 2.160297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:39,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43596 samples/s/p 0:45:57 } +2024-07-26 00:27:41,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1378/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 2.1578562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:41,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43352 samples/s/p 0:45:56 } +2024-07-26 00:27:44,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1380/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 2.1554192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:44,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% 
|████████████████████████████████████████████ | 5.43198 samples/s/p 0:45:54 } +2024-07-26 00:27:47,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1382/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.1529827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:47,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43610 samples/s/p 0:45:49 } +2024-07-26 00:27:50,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1384/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.1505498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:50,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43244 samples/s/p 0:45:47 } +2024-07-26 00:27:53,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1386/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 2.1481196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:53,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.42940 samples/s/p 0:45:46 } +2024-07-26 00:27:56,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1388/ 1625], loss: 1.000, per_step_time: 1471ms, lr: 2.1456926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:56,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43544 samples/s/p 0:45:40 } +2024-07-26 00:27:59,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1390/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 2.1432647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:59,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% 
|████████████████████████████████████████████ | 5.44072 samples/s/p 0:45:34 } +2024-07-26 00:28:02,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1392/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.1408423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:02,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.43267 samples/s/p 0:45:36 } +2024-07-26 00:28:05,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1394/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.1384217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:05,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.43641 samples/s/p 0:45:31 } +2024-07-26 00:28:08,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1396/ 1625], loss: 1.053, per_step_time: 1473ms, lr: 2.1360033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:08,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.43007 samples/s/p 0:45:31 } +2024-07-26 00:28:11,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1398/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 2.1335868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:11,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.43741 samples/s/p 0:45:24 } +2024-07-26 00:28:14,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1400/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.1311748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:14,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% 
|████████████████████████████████████████████ | 5.43617 samples/s/p 0:45:22 } +2024-07-26 00:28:17,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1402/ 1625], loss: 0.976, per_step_time: 1471ms, lr: 2.1287624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:17,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.43646 samples/s/p 0:45:19 } +2024-07-26 00:28:20,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1404/ 1625], loss: 1.053, per_step_time: 1473ms, lr: 2.1263554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:20,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.42928 samples/s/p 0:45:20 } +2024-07-26 00:28:23,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1406/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 2.1239493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:23,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43617 samples/s/p 0:45:13 } +2024-07-26 00:28:26,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1408/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 2.1215442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:26,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43495 samples/s/p 0:45:11 } +2024-07-26 00:28:29,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1410/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 2.119145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:29,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% 
|████████████████████████████████████████████ | 5.43798 samples/s/p 0:45:06 } +2024-07-26 00:28:32,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1412/ 1625], loss: 0.981, per_step_time: 1472ms, lr: 2.1167457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:32,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43406 samples/s/p 0:45:05 } +2024-07-26 00:28:35,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1414/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 2.1143492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:35,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43466 samples/s/p 0:45:02 } +2024-07-26 00:28:38,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1416/ 1625], loss: 1.008, per_step_time: 1471ms, lr: 2.111955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:38,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43643 samples/s/p 0:44:58 } +2024-07-26 00:28:40,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1418/ 1625], loss: 0.921, per_step_time: 1471ms, lr: 2.1095645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:40,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43677 samples/s/p 0:44:55 } +2024-07-26 00:28:43,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1420/ 1625], loss: 1.351, per_step_time: 1470ms, lr: 2.1071755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:43,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% 
|████████████████████████████████████████████ | 5.43961 samples/s/p 0:44:51 } +2024-07-26 00:28:46,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1422/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.1047895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:46,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43602 samples/s/p 0:44:50 } +2024-07-26 00:28:49,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1424/ 1625], loss: 0.926, per_step_time: 1471ms, lr: 2.1024048e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:49,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43821 samples/s/p 0:44:46 } +2024-07-26 00:28:52,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1426/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 2.1000246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:52,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43652 samples/s/p 0:44:44 } +2024-07-26 00:28:55,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1428/ 1625], loss: 1.217, per_step_time: 1473ms, lr: 2.0976454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:55,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.42830 samples/s/p 0:44:45 } +2024-07-26 00:28:58,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1430/ 1625], loss: 1.302, per_step_time: 1470ms, lr: 2.0952687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:58,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% 
|████████████████████████████████████████████ | 5.44140 samples/s/p 0:44:35 } +2024-07-26 00:29:01,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1432/ 1625], loss: 0.986, per_step_time: 1472ms, lr: 2.0928962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:01,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43228 samples/s/p 0:44:37 } +2024-07-26 00:29:04,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1434/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.0905238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:04,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43645 samples/s/p 0:44:32 } +2024-07-26 00:29:07,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1436/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 2.088154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:07,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43408 samples/s/p 0:44:30 } +2024-07-26 00:29:10,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1438/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.0857894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:10,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43563 samples/s/p 0:44:26 } +2024-07-26 00:29:13,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1440/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.0834239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:13,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% 
|████████████████████████████████████████████ | 5.43390 samples/s/p 0:44:24 } +2024-07-26 00:29:16,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1442/ 1625], loss: 0.973, per_step_time: 1471ms, lr: 2.0810635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:16,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43648 samples/s/p 0:44:20 } +2024-07-26 00:29:19,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1444/ 1625], loss: 1.023, per_step_time: 1472ms, lr: 2.0787043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:19,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43429 samples/s/p 0:44:18 } +2024-07-26 00:29:22,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1446/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 2.0763464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:22,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43513 samples/s/p 0:44:15 } +2024-07-26 00:29:25,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1448/ 1625], loss: 0.923, per_step_time: 1473ms, lr: 2.073995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:25,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43086 samples/s/p 0:44:14 } +2024-07-26 00:29:28,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1450/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.0716423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:28,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% 
|████████████████████████████████████████████ | 5.43385 samples/s/p 0:44:10 } +2024-07-26 00:29:31,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1452/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 2.0692923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:31,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43573 samples/s/p 0:44:06 } +2024-07-26 00:29:34,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1454/ 1625], loss: 1.408, per_step_time: 1472ms, lr: 2.0669459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:34,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43300 samples/s/p 0:44:04 } +2024-07-26 00:29:37,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1456/ 1625], loss: 1.039, per_step_time: 1472ms, lr: 2.0646019e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:37,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43242 samples/s/p 0:44:01 } +2024-07-26 00:29:40,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1458/ 1625], loss: 1.205, per_step_time: 1473ms, lr: 2.0622606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:40,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43006 samples/s/p 0:44:00 } +2024-07-26 00:29:42,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1460/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.059921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:42,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% 
|████████████████████████████████████████████ | 5.43577 samples/s/p 0:43:54 } +2024-07-26 00:29:45,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1462/ 1625], loss: 1.218, per_step_time: 1470ms, lr: 2.0575849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:45,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43867 samples/s/p 0:43:50 } +2024-07-26 00:29:48,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1464/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 2.0552507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:48,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43399 samples/s/p 0:43:49 } +2024-07-26 00:29:51,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1466/ 1625], loss: 1.090, per_step_time: 1473ms, lr: 2.0529178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:51,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.42901 samples/s/p 0:43:48 } +2024-07-26 00:29:54,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1468/ 1625], loss: 1.038, per_step_time: 1473ms, lr: 2.0505895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:54,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43073 samples/s/p 0:43:45 } +2024-07-26 00:29:57,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1470/ 1625], loss: 1.185, per_step_time: 1473ms, lr: 2.048264e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:57,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% 
|████████████████████████████████████████████ | 5.43057 samples/s/p 0:43:42 } +2024-07-26 00:30:00,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1472/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 2.045938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:00,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.42994 samples/s/p 0:43:39 } +2024-07-26 00:30:03,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1474/ 1625], loss: 1.049, per_step_time: 1473ms, lr: 2.0436166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:03,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.42932 samples/s/p 0:43:36 } +2024-07-26 00:30:06,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1476/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 2.0412986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:06,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.43061 samples/s/p 0:43:33 } +2024-07-26 00:30:09,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1478/ 1625], loss: 1.079, per_step_time: 1470ms, lr: 2.0389798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:09,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.44082 samples/s/p 0:43:25 } +2024-07-26 00:30:12,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1480/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 2.0366654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:12,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% 
|████████████████████████████████████████████ | 5.43750 samples/s/p 0:43:24 } +2024-07-26 00:30:15,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1482/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 2.034355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:15,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.44133 samples/s/p 0:43:19 } +2024-07-26 00:30:18,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1484/ 1625], loss: 1.056, per_step_time: 1470ms, lr: 2.032044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:18,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.43918 samples/s/p 0:43:17 } +2024-07-26 00:30:21,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1486/ 1625], loss: 1.227, per_step_time: 1470ms, lr: 2.0297382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:21,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.44110 samples/s/p 0:43:13 } +2024-07-26 00:30:24,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1488/ 1625], loss: 1.273, per_step_time: 1471ms, lr: 2.0274342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:24,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43603 samples/s/p 0:43:13 } +2024-07-26 00:30:27,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1490/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 2.025131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:27,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% 
|████████████████████████████████████████████ | 5.43968 samples/s/p 0:43:08 } +2024-07-26 00:30:30,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1492/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.0228326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:30,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43601 samples/s/p 0:43:07 } +2024-07-26 00:30:33,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1494/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 2.0205355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:33,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43705 samples/s/p 0:43:03 } +2024-07-26 00:30:36,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1496/ 1625], loss: 1.193, per_step_time: 1470ms, lr: 2.0182401e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:36,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.44196 samples/s/p 0:42:58 } +2024-07-26 00:30:39,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1498/ 1625], loss: 1.111, per_step_time: 1471ms, lr: 2.0159487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:39,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43676 samples/s/p 0:42:58 } +2024-07-26 00:30:41,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1500/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.0136595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:41,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% 
|████████████████████████████████████████████ | 5.43717 samples/s/p 0:42:54 } +2024-07-26 00:30:44,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1502/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.0113716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:44,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43451 samples/s/p 0:42:53 } +2024-07-26 00:30:47,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1504/ 1625], loss: 1.056, per_step_time: 1470ms, lr: 2.0090874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:47,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.44049 samples/s/p 0:42:47 } +2024-07-26 00:30:50,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1506/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.0068057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:50,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43929 samples/s/p 0:42:45 } +2024-07-26 00:30:53,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1508/ 1625], loss: 1.013, per_step_time: 1471ms, lr: 2.0045259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:53,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43779 samples/s/p 0:42:42 } +2024-07-26 00:30:56,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1510/ 1625], loss: 1.035, per_step_time: 1470ms, lr: 2.0022485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:56,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% 
|████████████████████████████████████████████ | 5.43948 samples/s/p 0:42:39 } +2024-07-26 00:30:59,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1512/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 1.9999738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:59,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43573 samples/s/p 0:42:37 } +2024-07-26 00:31:02,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1514/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 1.9977024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:02,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43751 samples/s/p 0:42:34 } +2024-07-26 00:31:05,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1516/ 1625], loss: 1.226, per_step_time: 1470ms, lr: 1.9954318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:05,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.44007 samples/s/p 0:42:29 } +2024-07-26 00:31:08,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1518/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 1.9931658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:08,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43013 samples/s/p 0:42:31 } +2024-07-26 00:31:11,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1520/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.9909023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:11,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% 
|████████████████████████████████████████████ | 5.44043 samples/s/p 0:42:23 } +2024-07-26 00:31:14,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1522/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 1.988638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:14,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.43591 samples/s/p 0:42:23 } +2024-07-26 00:31:17,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1524/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 1.9863796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:17,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.44166 samples/s/p 0:42:17 } +2024-07-26 00:31:20,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1526/ 1625], loss: 1.031, per_step_time: 1470ms, lr: 1.9841232e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:20,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.44089 samples/s/p 0:42:14 } +2024-07-26 00:31:23,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1528/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 1.9818672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:23,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.43576 samples/s/p 0:42:14 } +2024-07-26 00:31:26,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1530/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.9796166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:26,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% 
|████████████████████████████████████████████ | 5.43759 samples/s/p 0:42:10 } +2024-07-26 00:31:29,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1532/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.977366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:29,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.43434 samples/s/p 0:42:09 } +2024-07-26 00:31:32,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1534/ 1625], loss: 1.170, per_step_time: 1473ms, lr: 1.9751183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:32,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.42805 samples/s/p 0:42:09 } +2024-07-26 00:31:35,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1536/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.9728745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:35,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.43538 samples/s/p 0:42:02 } +2024-07-26 00:31:38,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1538/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 1.9706317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:38,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.43244 samples/s/p 0:42:01 } +2024-07-26 00:31:40,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1540/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 1.9683916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:40,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% 
|████████████████████████████████████████████ | 5.43340 samples/s/p 0:41:57 } +2024-07-26 00:31:43,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1542/ 1625], loss: 1.079, per_step_time: 1473ms, lr: 1.9661557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:43,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.43105 samples/s/p 0:41:55 } +2024-07-26 00:31:46,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1544/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 1.9639208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:46,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.42852 samples/s/p 0:41:54 } +2024-07-26 00:31:49,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1546/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 1.9616884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:49,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.43189 samples/s/p 0:41:49 } +2024-07-26 00:31:52,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1548/ 1625], loss: 1.151, per_step_time: 1470ms, lr: 1.9594595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:52,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.44188 samples/s/p 0:41:42 } +2024-07-26 00:31:55,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1550/ 1625], loss: 1.286, per_step_time: 1471ms, lr: 1.9572321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:55,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% 
|████████████████████████████████████████████ | 5.43696 samples/s/p 0:41:41 } +2024-07-26 00:31:58,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1552/ 1625], loss: 1.164, per_step_time: 1472ms, lr: 1.9550075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:58,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43124 samples/s/p 0:41:41 } +2024-07-26 00:32:01,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1554/ 1625], loss: 0.970, per_step_time: 1471ms, lr: 1.9527856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:01,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43790 samples/s/p 0:41:35 } +2024-07-26 00:32:04,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1556/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.9505653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:04,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43536 samples/s/p 0:41:33 } +2024-07-26 00:32:07,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1558/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 1.9483475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:07,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43713 samples/s/p 0:41:29 } +2024-07-26 00:32:10,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1560/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 1.9461334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:10,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% 
|████████████████████████████████████████████ | 5.43080 samples/s/p 0:41:29 } +2024-07-26 00:32:13,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1562/ 1625], loss: 1.074, per_step_time: 1470ms, lr: 1.9439217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:13,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.44034 samples/s/p 0:41:22 } +2024-07-26 00:32:16,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1564/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 1.941711e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:16,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43147 samples/s/p 0:41:23 } +2024-07-26 00:32:19,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1566/ 1625], loss: 1.263, per_step_time: 1476ms, lr: 1.9395043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:19,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.41944 samples/s/p 0:41:25 } +2024-07-26 00:32:22,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1568/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 1.9372997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:22,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43462 samples/s/p 0:41:15 } +2024-07-26 00:32:25,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1570/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 1.9350991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:25,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% 
|████████████████████████████████████████████ | 5.43807 samples/s/p 0:41:11 } +2024-07-26 00:32:28,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1572/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 1.932897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:28,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43380 samples/s/p 0:41:10 } +2024-07-26 00:32:31,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1574/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.9307017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:31,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43601 samples/s/p 0:41:06 } +2024-07-26 00:32:34,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1576/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.9285076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:34,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43696 samples/s/p 0:41:03 } +2024-07-26 00:32:37,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1578/ 1625], loss: 1.151, per_step_time: 1470ms, lr: 1.926313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:37,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43850 samples/s/p 0:40:59 } +2024-07-26 00:32:39,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1580/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 1.9241247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:39,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% 
|████████████████████████████████████████████ | 5.43480 samples/s/p 0:40:58 } +2024-07-26 00:32:42,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1582/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 1.921938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:42,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43241 samples/s/p 0:40:56 } +2024-07-26 00:32:45,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1584/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 1.9197541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:45,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43574 samples/s/p 0:40:51 } +2024-07-26 00:32:48,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1586/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 1.917571e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:48,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.44015 samples/s/p 0:40:46 } +2024-07-26 00:32:51,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1588/ 1625], loss: 1.420, per_step_time: 1471ms, lr: 1.9153913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:51,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.43721 samples/s/p 0:40:45 } +2024-07-26 00:32:54,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1590/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 1.913215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:54,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% 
|████████████████████████████████████████████ | 5.43603 samples/s/p 0:40:42 } +2024-07-26 00:32:57,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1592/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 1.9110398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:57,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.43811 samples/s/p 0:40:39 } +2024-07-26 00:33:00,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1594/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 1.908868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:00,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.43953 samples/s/p 0:40:35 } +2024-07-26 00:33:03,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1596/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 1.9066994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:03,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.43490 samples/s/p 0:40:34 } +2024-07-26 00:33:06,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1598/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 1.904531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:06,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.42806 samples/s/p 0:40:34 } +2024-07-26 00:33:09,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1600/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.9023669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:09,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% 
|████████████████████████████████████████████ | 5.43253 samples/s/p 0:40:29 } +2024-07-26 00:33:12,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1602/ 1625], loss: 1.007, per_step_time: 1472ms, lr: 1.9002052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:12,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43380 samples/s/p 0:40:26 } +2024-07-26 00:33:15,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1604/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.8980454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:15,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43540 samples/s/p 0:40:22 } +2024-07-26 00:33:18,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1606/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 1.8958883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:18,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43448 samples/s/p 0:40:20 } +2024-07-26 00:33:21,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1608/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 1.8937328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:21,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43547 samples/s/p 0:40:16 } +2024-07-26 00:33:24,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1610/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 1.8915816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:24,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% 
|████████████████████████████████████████████ | 5.43301 samples/s/p 0:40:14 } +2024-07-26 00:33:27,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1612/ 1625], loss: 1.299, per_step_time: 1472ms, lr: 1.8894331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:27,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43345 samples/s/p 0:40:11 } +2024-07-26 00:33:30,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1614/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 1.8872854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:30,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43448 samples/s/p 0:40:08 } +2024-07-26 00:33:33,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1616/ 1625], loss: 1.144, per_step_time: 1473ms, lr: 1.8851403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:33,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.42771 samples/s/p 0:40:08 } +2024-07-26 00:33:36,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1618/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 1.8829994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:36,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.43004 samples/s/p 0:40:04 } +2024-07-26 00:33:39,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1620/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.8808604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:39,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% 
|████████████████████████████████████████████ | 5.43794 samples/s/p 0:39:57 } +2024-07-26 00:33:41,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1622/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 1.8787222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:41,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.43608 samples/s/p 0:39:55 } +2024-07-26 00:33:44,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1624/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 1.8765884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:44,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.43821 samples/s/p 0:39:51 } +2024-07-26 00:33:47,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 1.874457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:47,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.43533 samples/s/p 0:39:50 } +2024-07-26 00:33:50,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 3/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 1.8723283e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:50,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.43394 samples/s/p 0:39:47 } +2024-07-26 00:33:53,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 5/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 1.8702005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:53,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% 
|█████████████████████████████████████████████ | 5.43267 samples/s/p 0:39:45 } +2024-07-26 00:33:56,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 7/ 1625], loss: 1.157, per_step_time: 1475ms, lr: 1.8680762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:56,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.42371 samples/s/p 0:39:46 } +2024-07-26 00:33:59,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 9/ 1625], loss: 1.079, per_step_time: 1472ms, lr: 1.8659543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:59,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.43408 samples/s/p 0:39:39 } +2024-07-26 00:34:02,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 11/ 1625], loss: 1.025, per_step_time: 1470ms, lr: 1.8638343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:02,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.44013 samples/s/p 0:39:33 } +2024-07-26 00:34:05,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 13/ 1625], loss: 1.202, per_step_time: 1474ms, lr: 1.8617186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:05,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.42463 samples/s/p 0:39:37 } +2024-07-26 00:34:08,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 15/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.8596038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:08,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% 
|█████████████████████████████████████████████ | 5.44035 samples/s/p 0:39:27 } +2024-07-26 00:34:11,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 17/ 1625], loss: 0.964, per_step_time: 1470ms, lr: 1.8574915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:11,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.43932 samples/s/p 0:39:24 } +2024-07-26 00:34:14,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 19/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 1.8553835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:14,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.43356 samples/s/p 0:39:24 } +2024-07-26 00:34:17,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 21/ 1625], loss: 1.285, per_step_time: 1469ms, lr: 1.8532755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:17,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.44262 samples/s/p 0:39:17 } +2024-07-26 00:34:20,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 23/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 1.8511719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:20,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.43409 samples/s/p 0:39:18 } +2024-07-26 00:34:23,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 25/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.84907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:23,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% 
|█████████████████████████████████████████████ | 5.43330 samples/s/p 0:39:15 } +2024-07-26 00:34:26,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 27/ 1625], loss: 1.088, per_step_time: 1471ms, lr: 1.8469707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:26,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43692 samples/s/p 0:39:11 } +2024-07-26 00:34:29,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 29/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 1.8448749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:29,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43056 samples/s/p 0:39:11 } +2024-07-26 00:34:32,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 31/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 1.8427816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:32,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43551 samples/s/p 0:39:06 } +2024-07-26 00:34:35,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 33/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 1.8406874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:35,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43626 samples/s/p 0:39:02 } +2024-07-26 00:34:38,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 35/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 1.8385986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:38,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% 
|█████████████████████████████████████████████ | 5.43629 samples/s/p 0:38:59 } +2024-07-26 00:34:40,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 37/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 1.836514e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:40,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43557 samples/s/p 0:38:57 } +2024-07-26 00:34:43,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 39/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.8344285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:43,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43751 samples/s/p 0:38:53 } +2024-07-26 00:34:46,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 41/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 1.8323465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:46,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43451 samples/s/p 0:38:51 } +2024-07-26 00:34:49,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 43/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 1.8302687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:49,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43520 samples/s/p 0:38:48 } +2024-07-26 00:34:52,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 45/ 1625], loss: 1.299, per_step_time: 1471ms, lr: 1.8281928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:52,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% 
|█████████████████████████████████████████████ | 5.43810 samples/s/p 0:38:44 } +2024-07-26 00:34:55,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 47/ 1625], loss: 1.103, per_step_time: 1473ms, lr: 1.8261185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:55,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43044 samples/s/p 0:38:44 } +2024-07-26 00:34:58,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 49/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 1.8240469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:58,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43265 samples/s/p 0:38:40 } +2024-07-26 00:35:01,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 51/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 1.8219787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:01,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43426 samples/s/p 0:38:37 } +2024-07-26 00:35:04,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 53/ 1625], loss: 1.175, per_step_time: 1474ms, lr: 1.8199123e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:04,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.42641 samples/s/p 0:38:37 } +2024-07-26 00:35:07,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 55/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 1.8178475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:07,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% 
|█████████████████████████████████████████████ | 5.43721 samples/s/p 0:38:30 } +2024-07-26 00:35:10,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 57/ 1625], loss: 1.223, per_step_time: 1470ms, lr: 1.8157862e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:10,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.44111 samples/s/p 0:38:25 } +2024-07-26 00:35:13,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 59/ 1625], loss: 0.952, per_step_time: 1471ms, lr: 1.8137284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:13,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.43663 samples/s/p 0:38:24 } +2024-07-26 00:35:16,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 61/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 1.8116714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:16,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.43140 samples/s/p 0:38:23 } +2024-07-26 00:35:19,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 63/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 1.8096171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:19,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.43393 samples/s/p 0:38:19 } +2024-07-26 00:35:22,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 65/ 1625], loss: 0.928, per_step_time: 1472ms, lr: 1.8075671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:22,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% 
|█████████████████████████████████████████████ | 5.43176 samples/s/p 0:38:17 } +2024-07-26 00:35:25,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 67/ 1625], loss: 1.096, per_step_time: 1474ms, lr: 1.8055188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:25,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.42734 samples/s/p 0:38:16 } +2024-07-26 00:35:28,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 69/ 1625], loss: 1.183, per_step_time: 1474ms, lr: 1.8034722e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:28,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.42477 samples/s/p 0:38:14 } +2024-07-26 00:35:31,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 71/ 1625], loss: 1.257, per_step_time: 1473ms, lr: 1.8014273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:31,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.42798 samples/s/p 0:38:10 } +2024-07-26 00:35:34,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 73/ 1625], loss: 1.043, per_step_time: 1471ms, lr: 1.7993868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:34,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.43544 samples/s/p 0:38:04 } +2024-07-26 00:35:37,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 75/ 1625], loss: 0.976, per_step_time: 1474ms, lr: 1.7973497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:37,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% 
|█████████████████████████████████████████████ | 5.42553 samples/s/p 0:38:05 } +2024-07-26 00:35:40,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 77/ 1625], loss: 1.014, per_step_time: 1471ms, lr: 1.7953125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:40,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43710 samples/s/p 0:37:57 } +2024-07-26 00:35:42,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 79/ 1625], loss: 1.228, per_step_time: 1472ms, lr: 1.793279e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:42,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43396 samples/s/p 0:37:56 } +2024-07-26 00:35:45,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 81/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 1.7912497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:45,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43403 samples/s/p 0:37:53 } +2024-07-26 00:35:48,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 83/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 1.7892187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:48,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43233 samples/s/p 0:37:50 } +2024-07-26 00:35:51,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 85/ 1625], loss: 1.025, per_step_time: 1473ms, lr: 1.7871937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:51,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% 
|█████████████████████████████████████████████ | 5.43059 samples/s/p 0:37:48 } +2024-07-26 00:35:54,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 87/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 1.7851713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:54,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43124 samples/s/p 0:37:45 } +2024-07-26 00:35:57,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 89/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 1.783149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:57,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.42831 samples/s/p 0:37:43 } +2024-07-26 00:36:00,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 91/ 1625], loss: 0.966, per_step_time: 1469ms, lr: 1.7811317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:00,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.44314 samples/s/p 0:37:34 } +2024-07-26 00:36:03,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 93/ 1625], loss: 1.217, per_step_time: 1478ms, lr: 1.7791153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:03,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.41255 samples/s/p 0:37:44 } +2024-07-26 00:36:06,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 95/ 1625], loss: 1.083, per_step_time: 1473ms, lr: 1.7771025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:06,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% 
|█████████████████████████████████████████████ | 5.42906 samples/s/p 0:37:34 } +2024-07-26 00:36:09,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 97/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 1.7750922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:09,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.43902 samples/s/p 0:37:27 } +2024-07-26 00:36:12,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 99/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 1.7730837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:12,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.43599 samples/s/p 0:37:25 } +2024-07-26 00:36:15,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 101/ 1625], loss: 0.986, per_step_time: 1471ms, lr: 1.7710777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:15,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.43751 samples/s/p 0:37:22 } +2024-07-26 00:36:18,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 103/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 1.7690743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:18,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.43913 samples/s/p 0:37:18 } +2024-07-26 00:36:21,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 105/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 1.7670752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:21,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% 
|█████████████████████████████████████████████ | 5.43328 samples/s/p 0:37:18 } +2024-07-26 00:36:24,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 107/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 1.7650761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:24,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43527 samples/s/p 0:37:14 } +2024-07-26 00:36:27,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 109/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.7630806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:27,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43546 samples/s/p 0:37:11 } +2024-07-26 00:36:30,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 111/ 1625], loss: 1.137, per_step_time: 1473ms, lr: 1.7610876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:30,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43031 samples/s/p 0:37:10 } +2024-07-26 00:36:33,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 113/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 1.759098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:33,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43095 samples/s/p 0:37:07 } +2024-07-26 00:36:36,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 115/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 1.7571094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:36,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% 
|█████████████████████████████████████████████ | 5.43281 samples/s/p 0:37:03 } +2024-07-26 00:36:39,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 117/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 1.7551233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:39,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43768 samples/s/p 0:36:58 } +2024-07-26 00:36:42,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 119/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 1.7531424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:42,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43171 samples/s/p 0:36:58 } +2024-07-26 00:36:44,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 121/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 1.7511607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:44,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43927 samples/s/p 0:36:52 } +2024-07-26 00:36:47,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 123/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.7491832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:47,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43602 samples/s/p 0:36:50 } +2024-07-26 00:36:50,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 125/ 1625], loss: 1.322, per_step_time: 1471ms, lr: 1.7472075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:50,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% 
|█████████████████████████████████████████████ | 5.43698 samples/s/p 0:36:47 } +2024-07-26 00:36:53,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 127/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 1.7452353e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:53,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43605 samples/s/p 0:36:44 } +2024-07-26 00:36:56,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 129/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 1.7432646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:56,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.44070 samples/s/p 0:36:39 } +2024-07-26 00:36:59,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 131/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 1.7412976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:59,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43756 samples/s/p 0:36:38 } +2024-07-26 00:37:02,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 133/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 1.7393314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:02,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43758 samples/s/p 0:36:35 } +2024-07-26 00:37:05,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 135/ 1625], loss: 1.207, per_step_time: 1473ms, lr: 1.7373695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:05,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% 
|█████████████████████████████████████████████ | 5.42995 samples/s/p 0:36:35 } +2024-07-26 00:37:08,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 137/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.7354103e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:08,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43163 samples/s/p 0:36:31 } +2024-07-26 00:37:11,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 139/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 1.733451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:11,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43577 samples/s/p 0:36:26 } +2024-07-26 00:37:14,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 141/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 1.7314977e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:14,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43578 samples/s/p 0:36:24 } +2024-07-26 00:37:17,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 143/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.7295454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:17,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43145 samples/s/p 0:36:22 } +2024-07-26 00:37:20,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 145/ 1625], loss: 1.144, per_step_time: 1473ms, lr: 1.7275947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:20,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% 
|█████████████████████████████████████████████ | 5.43007 samples/s/p 0:36:20 } +2024-07-26 00:37:23,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 147/ 1625], loss: 0.965, per_step_time: 1474ms, lr: 1.7256475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:23,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.42468 samples/s/p 0:36:19 } +2024-07-26 00:37:26,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 149/ 1625], loss: 1.017, per_step_time: 1472ms, lr: 1.7237029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:26,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43157 samples/s/p 0:36:13 } +2024-07-26 00:37:29,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 151/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 1.7217609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:29,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.42977 samples/s/p 0:36:11 } +2024-07-26 00:37:32,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 153/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 1.7198215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:32,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43256 samples/s/p 0:36:07 } +2024-07-26 00:37:35,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 155/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 1.7178838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:35,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% 
|█████████████████████████████████████████████ | 5.43387 samples/s/p 0:36:04 } +2024-07-26 00:37:38,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 157/ 1625], loss: 1.014, per_step_time: 1470ms, lr: 1.7159505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:38,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43887 samples/s/p 0:35:59 } +2024-07-26 00:37:41,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 159/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.7140179e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:41,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43347 samples/s/p 0:35:58 } +2024-07-26 00:37:43,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 161/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 1.712088e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:43,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43797 samples/s/p 0:35:53 } +2024-07-26 00:37:46,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 163/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.7101625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:46,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43690 samples/s/p 0:35:51 } +2024-07-26 00:37:49,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 165/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 1.7082368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:49,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% 
|█████████████████████████████████████████████ | 5.43435 samples/s/p 0:35:49 } +2024-07-26 00:37:52,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 167/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 1.7063146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:52,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43625 samples/s/p 0:35:45 } +2024-07-26 00:37:55,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 169/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 1.7043969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:55,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43126 samples/s/p 0:35:44 } +2024-07-26 00:37:58,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 171/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 1.702479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:58,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.43460 samples/s/p 0:35:40 } +2024-07-26 00:38:01,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 173/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 1.7005664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:01,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.43708 samples/s/p 0:35:36 } +2024-07-26 00:38:04,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 175/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.6986538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:04,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% 
|█████████████████████████████████████████████ | 5.43351 samples/s/p 0:35:34 } +2024-07-26 00:38:07,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 177/ 1625], loss: 1.042, per_step_time: 1472ms, lr: 1.6967438e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:07,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.43390 samples/s/p 0:35:31 } +2024-07-26 00:38:10,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 179/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 1.6948381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:10,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.44003 samples/s/p 0:35:26 } +2024-07-26 00:38:13,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 181/ 1625], loss: 1.048, per_step_time: 1469ms, lr: 1.6929341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:13,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.44384 samples/s/p 0:35:22 } +2024-07-26 00:38:16,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 183/ 1625], loss: 1.265, per_step_time: 1470ms, lr: 1.691031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:16,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.43935 samples/s/p 0:35:20 } +2024-07-26 00:38:19,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 185/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 1.6891331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:19,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% 
|█████████████████████████████████████████████ | 5.43480 samples/s/p 0:35:19 } +2024-07-26 00:38:22,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 187/ 1625], loss: 1.160, per_step_time: 1475ms, lr: 1.6872377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:22,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.42331 samples/s/p 0:35:21 } +2024-07-26 00:38:25,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 189/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 1.6853432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:25,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43451 samples/s/p 0:35:13 } +2024-07-26 00:38:28,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 191/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.6834522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:28,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43212 samples/s/p 0:35:11 } +2024-07-26 00:38:31,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 193/ 1625], loss: 1.224, per_step_time: 1474ms, lr: 1.6815638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:31,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.42558 samples/s/p 0:35:11 } +2024-07-26 00:38:34,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 195/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 1.6796771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:34,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% 
|█████████████████████████████████████████████ | 5.43724 samples/s/p 0:35:04 } +2024-07-26 00:38:37,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 197/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 1.6777931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:37,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43295 samples/s/p 0:35:02 } +2024-07-26 00:38:40,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 199/ 1625], loss: 1.009, per_step_time: 1471ms, lr: 1.6759124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:40,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43540 samples/s/p 0:34:58 } +2024-07-26 00:38:43,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 201/ 1625], loss: 1.016, per_step_time: 1470ms, lr: 1.6740352e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:43,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.44145 samples/s/p 0:34:53 } +2024-07-26 00:38:45,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 203/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 1.6721572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:45,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43360 samples/s/p 0:34:53 } +2024-07-26 00:38:48,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 205/ 1625], loss: 1.088, per_step_time: 1472ms, lr: 1.6702834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:48,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% 
|█████████████████████████████████████████████ | 5.43177 samples/s/p 0:34:51 } +2024-07-26 00:38:51,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 207/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 1.6684139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:51,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.43467 samples/s/p 0:34:47 } +2024-07-26 00:38:54,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 209/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 1.6665446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:54,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.43651 samples/s/p 0:34:43 } +2024-07-26 00:38:57,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 211/ 1625], loss: 1.155, per_step_time: 1473ms, lr: 1.6646795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:57,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.43015 samples/s/p 0:34:43 } +2024-07-26 00:39:00,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 213/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 1.662817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:00,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.42971 samples/s/p 0:34:40 } +2024-07-26 00:39:03,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 215/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.6609554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:03,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% 
|█████████████████████████████████████████████ | 5.43551 samples/s/p 0:34:35 } +2024-07-26 00:39:06,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 217/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 1.659098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:06,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.44131 samples/s/p 0:34:30 } +2024-07-26 00:39:09,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 219/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 1.6572433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:09,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.43502 samples/s/p 0:34:29 } +2024-07-26 00:39:12,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 221/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 1.6553886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:12,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43229 samples/s/p 0:34:27 } +2024-07-26 00:39:15,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 223/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.6535391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:15,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43606 samples/s/p 0:34:23 } +2024-07-26 00:39:18,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 225/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 1.6516913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:18,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% 
|█████████████████████████████████████████████ | 5.44088 samples/s/p 0:34:18 } +2024-07-26 00:39:21,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 227/ 1625], loss: 1.090, per_step_time: 1473ms, lr: 1.6498452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:21,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43021 samples/s/p 0:34:19 } +2024-07-26 00:39:24,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 229/ 1625], loss: 1.369, per_step_time: 1471ms, lr: 1.6480035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:24,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43525 samples/s/p 0:34:14 } +2024-07-26 00:39:27,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 231/ 1625], loss: 1.009, per_step_time: 1472ms, lr: 1.6461626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:27,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43376 samples/s/p 0:34:12 } +2024-07-26 00:39:30,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 233/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 1.644326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:30,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43615 samples/s/p 0:34:08 } +2024-07-26 00:39:33,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 235/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 1.6424902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:33,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% 
|█████████████████████████████████████████████ | 5.43925 samples/s/p 0:34:04 } +2024-07-26 00:39:36,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 237/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.6406572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:36,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43358 samples/s/p 0:34:03 } +2024-07-26 00:39:39,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 239/ 1625], loss: 1.005, per_step_time: 1470ms, lr: 1.6388275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:39,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43855 samples/s/p 0:33:58 } +2024-07-26 00:39:42,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 241/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.6369995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:42,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43745 samples/s/p 0:33:56 } +2024-07-26 00:39:44,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 243/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 1.6351751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:44,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43574 samples/s/p 0:33:53 } +2024-07-26 00:39:47,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 245/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 1.6333532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:47,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% 
|█████████████████████████████████████████████ | 5.43792 samples/s/p 0:33:50 } +2024-07-26 00:39:50,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 247/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 1.6315331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:50,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43991 samples/s/p 0:33:46 } +2024-07-26 00:39:53,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 249/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 1.6297164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:53,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43345 samples/s/p 0:33:45 } +2024-07-26 00:39:56,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 251/ 1625], loss: 1.268, per_step_time: 1473ms, lr: 1.6279023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:56,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43051 samples/s/p 0:33:44 } +2024-07-26 00:39:59,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 253/ 1625], loss: 0.906, per_step_time: 1472ms, lr: 1.626089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:59,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43116 samples/s/p 0:33:40 } +2024-07-26 00:40:02,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 255/ 1625], loss: 1.126, per_step_time: 1473ms, lr: 1.6242784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:02,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% 
|█████████████████████████████████████████████ | 5.43051 samples/s/p 0:33:38 } +2024-07-26 00:40:05,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 257/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.6224739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:05,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43542 samples/s/p 0:33:33 } +2024-07-26 00:40:08,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 259/ 1625], loss: 1.244, per_step_time: 1471ms, lr: 1.6206675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:08,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43671 samples/s/p 0:33:30 } +2024-07-26 00:40:11,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 261/ 1625], loss: 1.264, per_step_time: 1471ms, lr: 1.618868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:11,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43713 samples/s/p 0:33:26 } +2024-07-26 00:40:14,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 263/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 1.6170687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:14,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43727 samples/s/p 0:33:23 } +2024-07-26 00:40:17,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 265/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.6152701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:17,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% 
|█████████████████████████████████████████████ | 5.43727 samples/s/p 0:33:21 } +2024-07-26 00:40:20,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 267/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 1.6134777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:20,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43959 samples/s/p 0:33:17 } +2024-07-26 00:40:23,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 269/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 1.611686e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:23,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.43664 samples/s/p 0:33:15 } +2024-07-26 00:40:26,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 271/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.609897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:26,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.43309 samples/s/p 0:33:13 } +2024-07-26 00:40:29,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 273/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.6081106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:29,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.43309 samples/s/p 0:33:10 } +2024-07-26 00:40:32,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 275/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.6063259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:32,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% 
|█████████████████████████████████████████████ | 5.43758 samples/s/p 0:33:06 } +2024-07-26 00:40:35,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 277/ 1625], loss: 1.119, per_step_time: 1470ms, lr: 1.6045447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:35,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.43973 samples/s/p 0:33:02 } +2024-07-26 00:40:38,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 279/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 1.6027659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:38,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.44070 samples/s/p 0:32:59 } +2024-07-26 00:40:41,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 281/ 1625], loss: 1.128, per_step_time: 1470ms, lr: 1.6009908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:41,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.44100 samples/s/p 0:32:56 } +2024-07-26 00:40:43,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 283/ 1625], loss: 1.322, per_step_time: 1471ms, lr: 1.5992164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:43,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.43659 samples/s/p 0:32:54 } +2024-07-26 00:40:46,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 285/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.5974456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:46,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% 
|█████████████████████████████████████████████ | 5.43664 samples/s/p 0:32:51 } +2024-07-26 00:40:49,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 287/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 1.5956773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:49,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43907 samples/s/p 0:32:47 } +2024-07-26 00:40:52,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 289/ 1625], loss: 1.068, per_step_time: 1473ms, lr: 1.5939098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:52,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43108 samples/s/p 0:32:47 } +2024-07-26 00:40:55,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 291/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.5921476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:55,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43367 samples/s/p 0:32:44 } +2024-07-26 00:40:58,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 293/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 1.590387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:58,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43825 samples/s/p 0:32:39 } +2024-07-26 00:41:01,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 295/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 1.5886292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:01,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% 
|█████████████████████████████████████████████ | 5.43925 samples/s/p 0:32:36 } +2024-07-26 00:41:04,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 297/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.5868729e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:04,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43340 samples/s/p 0:32:35 } +2024-07-26 00:41:07,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 299/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 1.5851193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:07,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43037 samples/s/p 0:32:33 } +2024-07-26 00:41:10,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 301/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 1.58337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:10,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.43460 samples/s/p 0:32:28 } +2024-07-26 00:41:13,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 303/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 1.5816208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:13,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.43790 samples/s/p 0:32:24 } +2024-07-26 00:41:16,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 305/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.5798759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:16,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% 
|█████████████████████████████████████████████ | 5.44068 samples/s/p 0:32:20 } +2024-07-26 00:41:19,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 307/ 1625], loss: 1.111, per_step_time: 1471ms, lr: 1.5781335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:19,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.43674 samples/s/p 0:32:19 } +2024-07-26 00:41:22,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 309/ 1625], loss: 1.203, per_step_time: 1473ms, lr: 1.5763919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:22,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.43084 samples/s/p 0:32:18 } +2024-07-26 00:41:25,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 311/ 1625], loss: 0.902, per_step_time: 1470ms, lr: 1.5746565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:25,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.44141 samples/s/p 0:32:11 } +2024-07-26 00:41:28,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 313/ 1625], loss: 1.126, per_step_time: 1470ms, lr: 1.5729202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:28,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.44179 samples/s/p 0:32:08 } +2024-07-26 00:41:31,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 315/ 1625], loss: 1.332, per_step_time: 1472ms, lr: 1.5711882e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:31,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% 
|█████████████████████████████████████████████ | 5.43449 samples/s/p 0:32:08 } +2024-07-26 00:41:34,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 317/ 1625], loss: 1.299, per_step_time: 1471ms, lr: 1.5694588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:34,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.43676 samples/s/p 0:32:04 } +2024-07-26 00:41:37,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 319/ 1625], loss: 0.963, per_step_time: 1471ms, lr: 1.5677294e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:37,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.43804 samples/s/p 0:32:01 } +2024-07-26 00:41:40,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 321/ 1625], loss: 0.991, per_step_time: 1472ms, lr: 1.5660053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:40,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.43425 samples/s/p 0:31:59 } +2024-07-26 00:41:42,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 323/ 1625], loss: 1.289, per_step_time: 1472ms, lr: 1.5642827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:42,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.43276 samples/s/p 0:31:57 } +2024-07-26 00:41:45,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 325/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 1.5625645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:45,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% 
|██████████████████████████████████████████████ | 5.43931 samples/s/p 0:31:52 } +2024-07-26 00:41:48,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 327/ 1625], loss: 1.026, per_step_time: 1473ms, lr: 1.5608464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:48,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.43079 samples/s/p 0:31:52 } +2024-07-26 00:41:51,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 329/ 1625], loss: 0.977, per_step_time: 1471ms, lr: 1.5591326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:51,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.43606 samples/s/p 0:31:47 } +2024-07-26 00:41:54,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 331/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 1.5574204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:54,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.43604 samples/s/p 0:31:44 } +2024-07-26 00:41:57,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 333/ 1625], loss: 0.999, per_step_time: 1471ms, lr: 1.55571e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:57,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.43755 samples/s/p 0:31:40 } +2024-07-26 00:42:00,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 335/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.554004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:00,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% 
|██████████████████████████████████████████████ | 5.43428 samples/s/p 0:31:39 } +2024-07-26 00:42:03,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 337/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.5523005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:03,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.43550 samples/s/p 0:31:35 } +2024-07-26 00:42:06,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 339/ 1625], loss: 0.954, per_step_time: 1473ms, lr: 1.5505988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:06,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.42922 samples/s/p 0:31:34 } +2024-07-26 00:42:09,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 341/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 1.5488988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:09,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.43812 samples/s/p 0:31:28 } +2024-07-26 00:42:12,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 343/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 1.547204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:12,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.43918 samples/s/p 0:31:25 } +2024-07-26 00:42:15,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 345/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 1.54551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:15,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% 
|██████████████████████████████████████████████ | 5.43259 samples/s/p 0:31:24 } +2024-07-26 00:42:18,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 347/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 1.5438169e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:18,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.43446 samples/s/p 0:31:21 } +2024-07-26 00:42:21,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 349/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.542129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:21,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.43248 samples/s/p 0:31:19 } +2024-07-26 00:42:24,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 351/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.5404419e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:24,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43245 samples/s/p 0:31:16 } +2024-07-26 00:42:27,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 353/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 1.5387584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:27,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43449 samples/s/p 0:31:12 } +2024-07-26 00:42:30,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 355/ 1625], loss: 1.206, per_step_time: 1472ms, lr: 1.5370773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:30,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% 
|██████████████████████████████████████████████ | 5.43178 samples/s/p 0:31:10 } +2024-07-26 00:42:33,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 357/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 1.535399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:33,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.44144 samples/s/p 0:31:04 } +2024-07-26 00:42:36,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 359/ 1625], loss: 1.160, per_step_time: 1470ms, lr: 1.5337239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:36,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43924 samples/s/p 0:31:02 } +2024-07-26 00:42:39,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 361/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 1.5320508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:39,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43547 samples/s/p 0:31:00 } +2024-07-26 00:42:42,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 363/ 1625], loss: 1.280, per_step_time: 1471ms, lr: 1.5303801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:42,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43818 samples/s/p 0:30:56 } +2024-07-26 00:42:44,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 365/ 1625], loss: 1.150, per_step_time: 1474ms, lr: 1.5287121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:44,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% 
|██████████████████████████████████████████████ | 5.42552 samples/s/p 0:30:57 } +2024-07-26 00:42:47,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 367/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.5270457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:47,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43404 samples/s/p 0:30:52 } +2024-07-26 00:42:50,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 369/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 1.5253838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:50,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43537 samples/s/p 0:30:48 } +2024-07-26 00:42:53,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 371/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 1.5237226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:53,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43574 samples/s/p 0:30:45 } +2024-07-26 00:42:56,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 373/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.5220651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:56,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43340 samples/s/p 0:30:43 } +2024-07-26 00:42:59,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 375/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.5204091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:59,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% 
|██████████████████████████████████████████████ | 5.43362 samples/s/p 0:30:40 } +2024-07-26 00:43:02,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 377/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.5187566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:02,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43146 samples/s/p 0:30:38 } +2024-07-26 00:43:05,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 379/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 1.5171067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:05,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43774 samples/s/p 0:30:33 } +2024-07-26 00:43:08,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 381/ 1625], loss: 1.298, per_step_time: 1470ms, lr: 1.5154585e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:08,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.44093 samples/s/p 0:30:29 } +2024-07-26 00:43:11,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 383/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 1.5138147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:11,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.42901 samples/s/p 0:30:30 } +2024-07-26 00:43:14,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 385/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 1.5121725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:14,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% 
|██████████████████████████████████████████████ | 5.44132 samples/s/p 0:30:23 } +2024-07-26 00:43:17,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 387/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.5105331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:17,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.43291 samples/s/p 0:30:22 } +2024-07-26 00:43:20,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 389/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.5088945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:20,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.43260 samples/s/p 0:30:20 } +2024-07-26 00:43:23,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 391/ 1625], loss: 0.913, per_step_time: 1471ms, lr: 1.5072601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:23,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.43552 samples/s/p 0:30:16 } +2024-07-26 00:43:26,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 393/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 1.5056283e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:26,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.43709 samples/s/p 0:30:12 } +2024-07-26 00:43:29,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 395/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 1.5039984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:29,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% 
|██████████████████████████████████████████████ | 5.43774 samples/s/p 0:30:09 } +2024-07-26 00:43:32,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 397/ 1625], loss: 1.083, per_step_time: 1474ms, lr: 1.5023718e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:32,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.42378 samples/s/p 0:30:11 } +2024-07-26 00:43:35,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 399/ 1625], loss: 1.103, per_step_time: 1470ms, lr: 1.5007479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:35,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43982 samples/s/p 0:30:03 } +2024-07-26 00:43:38,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 401/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.4991265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:38,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43586 samples/s/p 0:30:01 } +2024-07-26 00:43:41,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 403/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 1.4975077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:41,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43643 samples/s/p 0:29:58 } +2024-07-26 00:43:43,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 405/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 1.4958907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:43,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% 
|██████████████████████████████████████████████ | 5.43589 samples/s/p 0:29:55 } +2024-07-26 00:43:46,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 407/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 1.4942771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:46,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43846 samples/s/p 0:29:51 } +2024-07-26 00:43:49,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 409/ 1625], loss: 1.046, per_step_time: 1470ms, lr: 1.4926661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:49,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.44034 samples/s/p 0:29:48 } +2024-07-26 00:43:52,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 411/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 1.4910568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:52,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43724 samples/s/p 0:29:46 } +2024-07-26 00:43:55,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 413/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 1.489451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:55,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43896 samples/s/p 0:29:42 } +2024-07-26 00:43:58,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 415/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 1.4878469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:58,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% 
|██████████████████████████████████████████████ | 5.43211 samples/s/p 0:29:41 } +2024-07-26 00:44:01,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 417/ 1625], loss: 1.188, per_step_time: 1470ms, lr: 1.4862454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:01,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.44023 samples/s/p 0:29:36 } +2024-07-26 00:44:04,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 419/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 1.4846482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:04,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43641 samples/s/p 0:29:34 } +2024-07-26 00:44:07,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 421/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 1.4830528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:07,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43815 samples/s/p 0:29:31 } +2024-07-26 00:44:10,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 423/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.4814591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:10,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43507 samples/s/p 0:29:29 } +2024-07-26 00:44:13,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 425/ 1625], loss: 1.126, per_step_time: 1469ms, lr: 1.4798671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:13,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% 
|██████████████████████████████████████████████ | 5.44441 samples/s/p 0:29:23 } +2024-07-26 00:44:16,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 427/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 1.4782795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:16,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43604 samples/s/p 0:29:23 } +2024-07-26 00:44:19,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 429/ 1625], loss: 1.321, per_step_time: 1471ms, lr: 1.4766936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:19,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43536 samples/s/p 0:29:20 } +2024-07-26 00:44:22,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 431/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 1.475112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:22,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43475 samples/s/p 0:29:17 } +2024-07-26 00:44:25,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 433/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 1.4735303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:25,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43216 samples/s/p 0:29:15 } +2024-07-26 00:44:28,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 435/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 1.471953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:28,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% 
|██████████████████████████████████████████████ | 5.43495 samples/s/p 0:29:11 } +2024-07-26 00:44:31,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 437/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 1.4703784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:31,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43030 samples/s/p 0:29:10 } +2024-07-26 00:44:34,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 439/ 1625], loss: 1.077, per_step_time: 1473ms, lr: 1.4688054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:34,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.42881 samples/s/p 0:29:07 } +2024-07-26 00:44:37,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 441/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 1.4672358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:37,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43733 samples/s/p 0:29:02 } +2024-07-26 00:44:40,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 443/ 1625], loss: 1.231, per_step_time: 1473ms, lr: 1.4656689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:40,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43064 samples/s/p 0:29:01 } +2024-07-26 00:44:42,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 445/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 1.4641038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:42,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% 
|██████████████████████████████████████████████ | 5.43125 samples/s/p 0:28:58 } +2024-07-26 00:44:45,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 447/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 1.4625411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:45,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43691 samples/s/p 0:28:53 } +2024-07-26 00:44:48,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 449/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.4609811e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:48,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43706 samples/s/p 0:28:50 } +2024-07-26 00:44:51,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 451/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 1.4594247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:51,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43391 samples/s/p 0:28:48 } +2024-07-26 00:44:54,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 453/ 1625], loss: 1.252, per_step_time: 1473ms, lr: 1.4578698e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:54,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43062 samples/s/p 0:28:46 } +2024-07-26 00:44:57,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 455/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 1.4563193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:57,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% 
|██████████████████████████████████████████████ | 5.43252 samples/s/p 0:28:42 } +2024-07-26 00:45:00,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 457/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.4547705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:00,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43607 samples/s/p 0:28:38 } +2024-07-26 00:45:03,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 459/ 1625], loss: 1.132, per_step_time: 1474ms, lr: 1.4532227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:03,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.42545 samples/s/p 0:28:39 } +2024-07-26 00:45:06,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 461/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 1.451679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:06,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43800 samples/s/p 0:28:32 } +2024-07-26 00:45:09,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 463/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 1.4501372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:09,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43872 samples/s/p 0:28:29 } +2024-07-26 00:45:12,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 465/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 1.4485988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:12,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% 
|██████████████████████████████████████████████ | 5.43848 samples/s/p 0:28:26 } +2024-07-26 00:45:15,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 467/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 1.447063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:15,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.43418 samples/s/p 0:28:24 } +2024-07-26 00:45:18,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 469/ 1625], loss: 0.997, per_step_time: 1469ms, lr: 1.4455297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:18,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.44261 samples/s/p 0:28:19 } +2024-07-26 00:45:21,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 471/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.4439984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:21,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.43148 samples/s/p 0:28:19 } +2024-07-26 00:45:24,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 473/ 1625], loss: 1.298, per_step_time: 1469ms, lr: 1.4424686e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:24,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.44410 samples/s/p 0:28:12 } +2024-07-26 00:45:27,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 475/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 1.4409432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:27,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% 
|██████████████████████████████████████████████ | 5.43249 samples/s/p 0:28:13 } +2024-07-26 00:45:30,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 477/ 1625], loss: 1.009, per_step_time: 1472ms, lr: 1.4394203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:30,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.43420 samples/s/p 0:28:10 } +2024-07-26 00:45:33,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 479/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 1.4378983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:33,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.44132 samples/s/p 0:28:04 } +2024-07-26 00:45:36,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 481/ 1625], loss: 1.021, per_step_time: 1472ms, lr: 1.4363816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:36,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.43433 samples/s/p 0:28:04 } +2024-07-26 00:45:39,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 483/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 1.4348656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:39,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.43838 samples/s/p 0:27:59 } +2024-07-26 00:45:42,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 485/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 1.433354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:42,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% 
|██████████████████████████████████████████████ | 5.43035 samples/s/p 0:27:59 } +2024-07-26 00:45:44,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 487/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 1.4318424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:44,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.43975 samples/s/p 0:27:53 } +2024-07-26 00:45:47,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 489/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 1.4303342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:47,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.43782 samples/s/p 0:27:51 } +2024-07-26 00:45:50,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 491/ 1625], loss: 1.108, per_step_time: 1477ms, lr: 1.4288304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:50,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.41375 samples/s/p 0:27:55 } +2024-07-26 00:45:53,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 493/ 1625], loss: 1.139, per_step_time: 1473ms, lr: 1.4273274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:53,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.43101 samples/s/p 0:27:47 } +2024-07-26 00:45:56,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 495/ 1625], loss: 1.028, per_step_time: 1470ms, lr: 1.4258262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:56,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% 
|██████████████████████████████████████████████ | 5.44165 samples/s/p 0:27:41 } +2024-07-26 00:45:59,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 497/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 1.4243302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:59,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43769 samples/s/p 0:27:39 } +2024-07-26 00:46:02,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 499/ 1625], loss: 1.288, per_step_time: 1471ms, lr: 1.4228359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:02,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43561 samples/s/p 0:27:37 } +2024-07-26 00:46:05,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 501/ 1625], loss: 1.102, per_step_time: 1475ms, lr: 1.4213441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:05,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.42050 samples/s/p 0:27:38 } +2024-07-26 00:46:08,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 503/ 1625], loss: 1.304, per_step_time: 1471ms, lr: 1.4198541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:08,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43570 samples/s/p 0:27:31 } +2024-07-26 00:46:11,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 505/ 1625], loss: 0.921, per_step_time: 1471ms, lr: 1.4183668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:11,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% 
|██████████████████████████████████████████████ | 5.43790 samples/s/p 0:27:27 } +2024-07-26 00:46:14,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 507/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.4168819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:14,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43356 samples/s/p 0:27:26 } +2024-07-26 00:46:17,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 509/ 1625], loss: 1.270, per_step_time: 1470ms, lr: 1.4154006e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:17,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43941 samples/s/p 0:27:21 } +2024-07-26 00:46:20,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 511/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.4139218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:20,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43658 samples/s/p 0:27:19 } +2024-07-26 00:46:23,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 513/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 1.4124456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:23,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.43406 samples/s/p 0:27:17 } +2024-07-26 00:46:26,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 515/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 1.4109712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:26,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% 
|██████████████████████████████████████████████ | 5.43711 samples/s/p 0:27:13 } +2024-07-26 00:46:29,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 517/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.4094985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:29,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.43171 samples/s/p 0:27:11 } +2024-07-26 00:46:32,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 519/ 1625], loss: 1.180, per_step_time: 1474ms, lr: 1.4080318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:32,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.42624 samples/s/p 0:27:10 } +2024-07-26 00:46:35,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 521/ 1625], loss: 1.078, per_step_time: 1473ms, lr: 1.4065643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:35,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.42984 samples/s/p 0:27:06 } +2024-07-26 00:46:38,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 523/ 1625], loss: 1.083, per_step_time: 1474ms, lr: 1.405102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:38,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.42630 samples/s/p 0:27:04 } +2024-07-26 00:46:41,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 525/ 1625], loss: 1.080, per_step_time: 1472ms, lr: 1.4036414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:41,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% 
|██████████████████████████████████████████████ | 5.43382 samples/s/p 0:26:59 } +2024-07-26 00:46:43,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 527/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 1.4021816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:43,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.43919 samples/s/p 0:26:54 } +2024-07-26 00:46:46,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 529/ 1625], loss: 1.156, per_step_time: 1469ms, lr: 1.4007279e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:46,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.44236 samples/s/p 0:26:51 } +2024-07-26 00:46:49,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 531/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.3992742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:49,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43701 samples/s/p 0:26:49 } +2024-07-26 00:46:52,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 533/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 1.3978214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:52,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43296 samples/s/p 0:26:47 } +2024-07-26 00:46:55,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 535/ 1625], loss: 1.363, per_step_time: 1471ms, lr: 1.3963754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:55,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% 
|██████████████████████████████████████████████ | 5.43758 samples/s/p 0:26:43 } +2024-07-26 00:46:58,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 537/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 1.3949305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:58,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43762 samples/s/p 0:26:40 } +2024-07-26 00:47:01,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 539/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.3934862e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:01,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43113 samples/s/p 0:26:39 } +2024-07-26 00:47:04,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 541/ 1625], loss: 1.221, per_step_time: 1475ms, lr: 1.3920463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:04,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.42168 samples/s/p 0:26:39 } +2024-07-26 00:47:07,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 543/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 1.3906099e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:07,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43806 samples/s/p 0:26:31 } +2024-07-26 00:47:10,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 545/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 1.3891744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:10,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% 
|██████████████████████████████████████████████ | 5.43611 samples/s/p 0:26:29 } +2024-07-26 00:47:13,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 547/ 1625], loss: 0.980, per_step_time: 1469ms, lr: 1.3877423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:13,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.44294 samples/s/p 0:26:24 } +2024-07-26 00:47:16,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 549/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.3863128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:16,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43633 samples/s/p 0:26:23 } +2024-07-26 00:47:19,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 551/ 1625], loss: 1.289, per_step_time: 1471ms, lr: 1.3848859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:19,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43650 samples/s/p 0:26:20 } +2024-07-26 00:47:22,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 553/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.3834616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:22,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43743 samples/s/p 0:26:17 } +2024-07-26 00:47:25,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 555/ 1625], loss: 1.063, per_step_time: 1472ms, lr: 1.3820398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:25,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% 
|██████████████████████████████████████████████ | 5.43278 samples/s/p 0:26:15 } +2024-07-26 00:47:28,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 557/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.3806199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:28,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43710 samples/s/p 0:26:11 } +2024-07-26 00:47:31,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 559/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 1.3792041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:31,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43287 samples/s/p 0:26:09 } +2024-07-26 00:47:34,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 561/ 1625], loss: 1.045, per_step_time: 1469ms, lr: 1.3777885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:34,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.44434 samples/s/p 0:26:03 } +2024-07-26 00:47:37,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 563/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 1.3763797e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:37,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.43529 samples/s/p 0:26:03 } +2024-07-26 00:47:40,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 565/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 1.3749693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:40,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% 
|██████████████████████████████████████████████ | 5.43198 samples/s/p 0:26:01 } +2024-07-26 00:47:43,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 567/ 1625], loss: 1.047, per_step_time: 1472ms, lr: 1.3735623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:43,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.43248 samples/s/p 0:25:58 } +2024-07-26 00:47:45,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 569/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 1.3721605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:45,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.43649 samples/s/p 0:25:53 } +2024-07-26 00:47:48,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 571/ 1625], loss: 1.058, per_step_time: 1471ms, lr: 1.3707577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:48,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.43822 samples/s/p 0:25:50 } +2024-07-26 00:47:51,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 573/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 1.3693602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:51,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.44049 samples/s/p 0:25:46 } +2024-07-26 00:47:54,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 575/ 1625], loss: 1.280, per_step_time: 1473ms, lr: 1.3679644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:54,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% 
|██████████████████████████████████████████████ | 5.42946 samples/s/p 0:25:47 } +2024-07-26 00:47:57,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 577/ 1625], loss: 0.987, per_step_time: 1472ms, lr: 1.3665704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:57,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43441 samples/s/p 0:25:42 } +2024-07-26 00:48:00,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 579/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 1.3651814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:00,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.44055 samples/s/p 0:25:38 } +2024-07-26 00:48:03,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 581/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 1.3637925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:03,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43445 samples/s/p 0:25:36 } +2024-07-26 00:48:06,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 583/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.362408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:06,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43743 samples/s/p 0:25:33 } +2024-07-26 00:48:09,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 585/ 1625], loss: 0.924, per_step_time: 1469ms, lr: 1.3610252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:09,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% 
|██████████████████████████████████████████████ | 5.44332 samples/s/p 0:25:28 } +2024-07-26 00:48:12,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 587/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 1.3596441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:12,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43776 samples/s/p 0:25:27 } +2024-07-26 00:48:15,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 589/ 1625], loss: 1.097, per_step_time: 1473ms, lr: 1.3582674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:15,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.42817 samples/s/p 0:25:26 } +2024-07-26 00:48:18,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 591/ 1625], loss: 1.248, per_step_time: 1474ms, lr: 1.3568914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:18,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.42421 samples/s/p 0:25:25 } +2024-07-26 00:48:21,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 593/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.355519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:21,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43685 samples/s/p 0:25:18 } +2024-07-26 00:48:24,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 595/ 1625], loss: 1.040, per_step_time: 1473ms, lr: 1.35415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:24,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% 
|██████████████████████████████████████████████ | 5.42958 samples/s/p 0:25:17 } +2024-07-26 00:48:27,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 597/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 1.3527826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:27,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.43203 samples/s/p 0:25:13 } +2024-07-26 00:48:30,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 599/ 1625], loss: 1.216, per_step_time: 1474ms, lr: 1.3514189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:30,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.42733 samples/s/p 0:25:12 } +2024-07-26 00:48:33,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 601/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 1.3500568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:33,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.43693 samples/s/p 0:25:06 } +2024-07-26 00:48:36,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 603/ 1625], loss: 1.080, per_step_time: 1472ms, lr: 1.3486964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:36,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.43467 samples/s/p 0:25:04 } +2024-07-26 00:48:39,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 605/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.3473405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:39,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% 
|██████████████████████████████████████████████ | 5.43460 samples/s/p 0:25:01 } +2024-07-26 00:48:42,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 607/ 1625], loss: 1.273, per_step_time: 1470ms, lr: 1.3459869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:42,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.44093 samples/s/p 0:24:56 } +2024-07-26 00:48:44,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 609/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 1.3446352e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:44,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.43625 samples/s/p 0:24:55 } +2024-07-26 00:48:47,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 611/ 1625], loss: 0.983, per_step_time: 1473ms, lr: 1.343287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:47,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43085 samples/s/p 0:24:53 } +2024-07-26 00:48:50,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 613/ 1625], loss: 1.014, per_step_time: 1470ms, lr: 1.3419404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:50,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.44161 samples/s/p 0:24:47 } +2024-07-26 00:48:53,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 615/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 1.3405966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:53,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% 
|██████████████████████████████████████████████ | 5.43807 samples/s/p 0:24:45 } +2024-07-26 00:48:56,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 617/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 1.3392552e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:56,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43750 samples/s/p 0:24:43 } +2024-07-26 00:48:59,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 619/ 1625], loss: 1.299, per_step_time: 1472ms, lr: 1.3379181e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:59,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43218 samples/s/p 0:24:41 } +2024-07-26 00:49:02,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 621/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 1.3365811e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:02,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43414 samples/s/p 0:24:38 } +2024-07-26 00:49:05,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 623/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 1.3352493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:05,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43603 samples/s/p 0:24:34 } +2024-07-26 00:49:08,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 625/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 1.3339184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:08,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% 
|██████████████████████████████████████████████ | 5.43903 samples/s/p 0:24:30 } +2024-07-26 00:49:11,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 627/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.3325899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:11,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43598 samples/s/p 0:24:28 } +2024-07-26 00:49:14,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 629/ 1625], loss: 1.174, per_step_time: 1469ms, lr: 1.331265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:14,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.44291 samples/s/p 0:24:23 } +2024-07-26 00:49:17,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 631/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 1.3299427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:17,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43489 samples/s/p 0:24:23 } +2024-07-26 00:49:20,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 633/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 1.3286221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:20,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43561 samples/s/p 0:24:20 } +2024-07-26 00:49:23,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 635/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 1.3273041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:23,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% 
|██████████████████████████████████████████████ | 5.43578 samples/s/p 0:24:17 } +2024-07-26 00:49:26,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 637/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 1.3259904e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:26,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43887 samples/s/p 0:24:13 } +2024-07-26 00:49:29,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 639/ 1625], loss: 1.079, per_step_time: 1470ms, lr: 1.3246776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:29,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.44144 samples/s/p 0:24:09 } +2024-07-26 00:49:32,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 641/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 1.3233682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:32,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43255 samples/s/p 0:24:09 } +2024-07-26 00:49:35,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 643/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 1.3220614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:35,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.44217 samples/s/p 0:24:03 } +2024-07-26 00:49:38,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 645/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.3207564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:38,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% 
|██████████████████████████████████████████████ | 5.43325 samples/s/p 0:24:02 } +2024-07-26 00:49:41,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 647/ 1625], loss: 1.140, per_step_time: 1482ms, lr: 1.319454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:41,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.39545 samples/s/p 0:24:10 } +2024-07-26 00:49:43,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 649/ 1625], loss: 1.101, per_step_time: 1472ms, lr: 1.3181567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:43,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.43295 samples/s/p 0:23:57 } +2024-07-26 00:49:46,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 651/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 1.3168603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:46,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.44128 samples/s/p 0:23:52 } +2024-07-26 00:49:49,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 653/ 1625], loss: 1.219, per_step_time: 1470ms, lr: 1.3155657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:49,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.43957 samples/s/p 0:23:49 } +2024-07-26 00:49:52,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 655/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 1.3142752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:52,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% 
|███████████████████████████████████████████████ | 5.43459 samples/s/p 0:23:47 } +2024-07-26 00:49:55,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 657/ 1625], loss: 1.220, per_step_time: 1474ms, lr: 1.3129866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:55,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.42720 samples/s/p 0:23:46 } +2024-07-26 00:49:58,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 659/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.3116988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:58,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43235 samples/s/p 0:23:42 } +2024-07-26 00:50:01,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 661/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 1.3104171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:01,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43995 samples/s/p 0:23:37 } +2024-07-26 00:50:04,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 663/ 1625], loss: 1.039, per_step_time: 1471ms, lr: 1.3091354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:04,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43736 samples/s/p 0:23:35 } +2024-07-26 00:50:07,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 665/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 1.3078563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:07,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% 
|███████████████████████████████████████████████ | 5.43345 samples/s/p 0:23:33 } +2024-07-26 00:50:10,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 667/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 1.3065833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:10,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43212 samples/s/p 0:23:30 } +2024-07-26 00:50:13,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 669/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.3053102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:13,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43655 samples/s/p 0:23:26 } +2024-07-26 00:50:16,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 671/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 1.3040398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:16,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43392 samples/s/p 0:23:24 } +2024-07-26 00:50:19,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 673/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 1.302771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:19,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43761 samples/s/p 0:23:20 } +2024-07-26 00:50:22,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 675/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 1.3015066e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:22,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% 
|███████████████████████████████████████████████ | 5.43294 samples/s/p 0:23:18 } +2024-07-26 00:50:25,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 677/ 1625], loss: 1.006, per_step_time: 1473ms, lr: 1.3002439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:25,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.42929 samples/s/p 0:23:16 } +2024-07-26 00:50:28,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 679/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.2989838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:28,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.43166 samples/s/p 0:23:13 } +2024-07-26 00:50:31,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 681/ 1625], loss: 1.322, per_step_time: 1471ms, lr: 1.2977271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:31,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.43663 samples/s/p 0:23:09 } +2024-07-26 00:50:34,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 683/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 1.2964713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:34,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.43570 samples/s/p 0:23:06 } +2024-07-26 00:50:37,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 685/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 1.295219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:37,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% 
|███████████████████████████████████████████████ | 5.43699 samples/s/p 0:23:03 } +2024-07-26 00:50:40,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 687/ 1625], loss: 1.003, per_step_time: 1473ms, lr: 1.2939702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:40,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.42869 samples/s/p 0:23:02 } +2024-07-26 00:50:43,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 689/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 1.2927239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:43,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.43302 samples/s/p 0:22:58 } +2024-07-26 00:50:45,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 691/ 1625], loss: 1.037, per_step_time: 1471ms, lr: 1.2914802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:45,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43628 samples/s/p 0:22:54 } +2024-07-26 00:50:48,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 693/ 1625], loss: 0.969, per_step_time: 1470ms, lr: 1.2902383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:48,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43918 samples/s/p 0:22:50 } +2024-07-26 00:50:51,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 695/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 1.2889989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:51,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% 
|███████████████████████████████████████████████ | 5.44076 samples/s/p 0:22:47 } +2024-07-26 00:50:54,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 697/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.2877638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:54,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43808 samples/s/p 0:22:45 } +2024-07-26 00:50:57,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 699/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 1.2865305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:57,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43368 samples/s/p 0:22:43 } +2024-07-26 00:51:00,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 701/ 1625], loss: 1.247, per_step_time: 1470ms, lr: 1.2852998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:00,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.44025 samples/s/p 0:22:38 } +2024-07-26 00:51:03,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 703/ 1625], loss: 1.164, per_step_time: 1470ms, lr: 1.2840708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:03,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43997 samples/s/p 0:22:35 } +2024-07-26 00:51:06,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 705/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 1.2828461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:06,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% 
|███████████████████████████████████████████████ | 5.43509 samples/s/p 0:22:34 } +2024-07-26 00:51:09,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 707/ 1625], loss: 1.046, per_step_time: 1469ms, lr: 1.2816215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:09,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.44303 samples/s/p 0:22:29 } +2024-07-26 00:51:12,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 709/ 1625], loss: 1.102, per_step_time: 1473ms, lr: 1.2804003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:12,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.42973 samples/s/p 0:22:29 } +2024-07-26 00:51:15,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 711/ 1625], loss: 1.059, per_step_time: 1472ms, lr: 1.2791834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:15,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43454 samples/s/p 0:22:25 } +2024-07-26 00:51:18,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 713/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 1.2779674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:18,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43338 samples/s/p 0:22:22 } +2024-07-26 00:51:21,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 715/ 1625], loss: 1.180, per_step_time: 1470ms, lr: 1.2767548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:21,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% 
|███████████████████████████████████████████████ | 5.44083 samples/s/p 0:22:18 } +2024-07-26 00:51:24,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 717/ 1625], loss: 1.056, per_step_time: 1472ms, lr: 1.2755448e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:24,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43325 samples/s/p 0:22:16 } +2024-07-26 00:51:27,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 719/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 1.2743375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:27,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43367 samples/s/p 0:22:13 } +2024-07-26 00:51:30,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 721/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 1.2731327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:30,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43831 samples/s/p 0:22:09 } +2024-07-26 00:51:33,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 723/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 1.2719313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:33,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43255 samples/s/p 0:22:08 } +2024-07-26 00:51:36,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 725/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 1.2707309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:36,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% 
|███████████████████████████████████████████████ | 5.43925 samples/s/p 0:22:03 } +2024-07-26 00:51:39,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 727/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 1.2695356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:39,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43918 samples/s/p 0:22:00 } +2024-07-26 00:51:42,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 729/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 1.2683403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:42,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43678 samples/s/p 0:21:58 } +2024-07-26 00:51:44,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 731/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 1.2671485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:44,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43213 samples/s/p 0:21:56 } +2024-07-26 00:51:47,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 733/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 1.2659592e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:47,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43466 samples/s/p 0:21:53 } +2024-07-26 00:51:50,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 735/ 1625], loss: 1.027, per_step_time: 1471ms, lr: 1.2647735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:50,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% 
|███████████████████████████████████████████████ | 5.43479 samples/s/p 0:21:50 } +2024-07-26 00:51:53,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 737/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.2635894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:53,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43469 samples/s/p 0:21:47 } +2024-07-26 00:51:56,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 739/ 1625], loss: 1.150, per_step_time: 1472ms, lr: 1.2624089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:56,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43199 samples/s/p 0:21:44 } +2024-07-26 00:51:59,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 741/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 1.26123e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:59,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.43357 samples/s/p 0:21:41 } +2024-07-26 00:52:02,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 743/ 1625], loss: 1.180, per_step_time: 1474ms, lr: 1.2600555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:02,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.42611 samples/s/p 0:21:40 } +2024-07-26 00:52:05,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 745/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.258881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:05,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% 
|███████████████████████████████████████████████ | 5.43755 samples/s/p 0:21:34 } +2024-07-26 00:52:08,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 747/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 1.2577107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:08,589 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.43410 samples/s/p 0:21:32 } +2024-07-26 00:52:11,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 749/ 1625], loss: 1.090, per_step_time: 1480ms, lr: 1.2565431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:11,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.40280 samples/s/p 0:21:37 } +2024-07-26 00:52:14,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 751/ 1625], loss: 1.059, per_step_time: 1471ms, lr: 1.255378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:14,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.43779 samples/s/p 0:21:25 } +2024-07-26 00:52:17,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 753/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 1.2542147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:17,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.43703 samples/s/p 0:21:23 } +2024-07-26 00:52:20,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 755/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 1.2530548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:20,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% 
|███████████████████████████████████████████████ | 5.43756 samples/s/p 0:21:19 } +2024-07-26 00:52:23,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 757/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 1.2518976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:23,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43995 samples/s/p 0:21:16 } +2024-07-26 00:52:26,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 759/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 1.250743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:26,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43380 samples/s/p 0:21:14 } +2024-07-26 00:52:29,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 761/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.2495917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:29,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43130 samples/s/p 0:21:12 } +2024-07-26 00:52:32,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 763/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 1.2484405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:32,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43347 samples/s/p 0:21:09 } +2024-07-26 00:52:35,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 765/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 1.2472946e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:35,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% 
|███████████████████████████████████████████████ | 5.43736 samples/s/p 0:21:05 } +2024-07-26 00:52:38,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 767/ 1625], loss: 1.031, per_step_time: 1470ms, lr: 1.2461494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:38,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43889 samples/s/p 0:21:02 } +2024-07-26 00:52:41,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 769/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.2450085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:41,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43821 samples/s/p 0:20:59 } +2024-07-26 00:52:44,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 771/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 1.2438694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:44,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43462 samples/s/p 0:20:57 } +2024-07-26 00:52:46,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 773/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 1.2427329e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:46,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43502 samples/s/p 0:20:54 } +2024-07-26 00:52:49,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 775/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.2415982e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:49,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% 
|███████████████████████████████████████████████ | 5.44128 samples/s/p 0:20:49 } +2024-07-26 00:52:49,907 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-26 00:53:25,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 777/ 1625], loss: 1.305, per_step_time: 1514ms, lr: 1.2404677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:25,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.28167 samples/s/p 0:21:24 } +2024-07-26 00:53:28,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 779/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 1.2393398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:28,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43531 samples/s/p 0:20:45 } +2024-07-26 00:53:31,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 781/ 1625], loss: 1.010, per_step_time: 1472ms, lr: 1.2382137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:31,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43313 samples/s/p 0:20:42 } +2024-07-26 00:53:34,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 783/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 1.2370901e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:34,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43512 samples/s/p 0:20:39 } +2024-07-26 00:53:37,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 785/ 1625], loss: 1.023, per_step_time: 1471ms, lr: 1.2359692e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:53:37,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43748 samples/s/p 0:20:35 } +2024-07-26 00:53:40,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 787/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 1.2348517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:40,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43449 samples/s/p 0:20:33 } +2024-07-26 00:53:43,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 789/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 1.2337359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:43,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.42988 samples/s/p 0:20:31 } +2024-07-26 00:53:46,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 791/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.2326236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:46,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43478 samples/s/p 0:20:27 } +2024-07-26 00:53:49,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 793/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 1.2315139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:49,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43727 samples/s/p 0:20:24 } +2024-07-26 00:53:52,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 795/ 1625], loss: 1.404, per_step_time: 1470ms, lr: 1.2304059e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:53:52,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43929 samples/s/p 0:20:20 } +2024-07-26 00:53:55,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 797/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 1.2293013e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:55,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43954 samples/s/p 0:20:17 } +2024-07-26 00:53:58,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 799/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 1.2281994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:58,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43920 samples/s/p 0:20:14 } +2024-07-26 00:54:01,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 801/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 1.2271009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:01,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43590 samples/s/p 0:20:12 } +2024-07-26 00:54:04,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 803/ 1625], loss: 1.184, per_step_time: 1474ms, lr: 1.2260016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:04,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.42451 samples/s/p 0:20:12 } +2024-07-26 00:54:07,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 805/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 1.2249092e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:54:07,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.44176 samples/s/p 0:20:05 } +2024-07-26 00:54:10,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 807/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 1.2238168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:10,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43375 samples/s/p 0:20:04 } +2024-07-26 00:54:13,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 809/ 1625], loss: 1.378, per_step_time: 1470ms, lr: 1.2227285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:13,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.44012 samples/s/p 0:19:59 } +2024-07-26 00:54:16,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 811/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.2216414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:16,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43473 samples/s/p 0:19:58 } +2024-07-26 00:54:19,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 813/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.2205584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:19,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43578 samples/s/p 0:19:55 } +2024-07-26 00:54:21,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 815/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 1.2194764e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:54:21,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43780 samples/s/p 0:19:51 } +2024-07-26 00:54:24,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 817/ 1625], loss: 0.958, per_step_time: 1470ms, lr: 1.2183987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:24,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.44066 samples/s/p 0:19:48 } +2024-07-26 00:54:27,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 819/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.2173217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:27,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43578 samples/s/p 0:19:46 } +2024-07-26 00:54:30,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 821/ 1625], loss: 1.135, per_step_time: 1469ms, lr: 1.2162501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:30,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.44438 samples/s/p 0:19:41 } +2024-07-26 00:54:33,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 823/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 1.2151784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:33,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.42964 samples/s/p 0:19:41 } +2024-07-26 00:54:36,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 825/ 1625], loss: 1.055, per_step_time: 1473ms, lr: 1.214111e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:54:36,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.43069 samples/s/p 0:19:38 } +2024-07-26 00:54:39,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 827/ 1625], loss: 1.006, per_step_time: 1475ms, lr: 1.2130454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:39,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.42221 samples/s/p 0:19:37 } +2024-07-26 00:54:42,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 829/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 1.2119832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:42,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.43955 samples/s/p 0:19:30 } +2024-07-26 00:54:45,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 831/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 1.2109227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:45,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.43352 samples/s/p 0:19:29 } +2024-07-26 00:54:48,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 833/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.2098657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:48,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.43111 samples/s/p 0:19:26 } +2024-07-26 00:54:51,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 835/ 1625], loss: 0.949, per_step_time: 1475ms, lr: 1.2088104e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:54:51,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.42192 samples/s/p 0:19:25 } +2024-07-26 00:54:54,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 837/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 1.2077595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:54,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43028 samples/s/p 0:19:20 } +2024-07-26 00:54:57,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 839/ 1625], loss: 1.307, per_step_time: 1472ms, lr: 1.2067094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:57,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43400 samples/s/p 0:19:17 } +2024-07-26 00:55:00,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 841/ 1625], loss: 1.252, per_step_time: 1470ms, lr: 1.2056628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:00,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.44010 samples/s/p 0:19:12 } +2024-07-26 00:55:03,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 843/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.2046196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:03,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43616 samples/s/p 0:19:10 } +2024-07-26 00:55:06,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 845/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 1.2035764e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:55:06,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43199 samples/s/p 0:19:08 } +2024-07-26 00:55:09,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 847/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 1.2025375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:09,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43195 samples/s/p 0:19:05 } +2024-07-26 00:55:12,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 849/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 1.2015031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:12,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43356 samples/s/p 0:19:02 } +2024-07-26 00:55:15,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 851/ 1625], loss: 1.166, per_step_time: 1470ms, lr: 1.2004693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:15,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43890 samples/s/p 0:18:58 } +2024-07-26 00:55:18,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 853/ 1625], loss: 0.971, per_step_time: 1472ms, lr: 1.1994383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:18,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43410 samples/s/p 0:18:56 } +2024-07-26 00:55:20,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 855/ 1625], loss: 1.100, per_step_time: 1470ms, lr: 1.198409e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:55:20,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.43859 samples/s/p 0:18:52 } +2024-07-26 00:55:23,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 857/ 1625], loss: 1.175, per_step_time: 1474ms, lr: 1.1973831e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:23,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.42407 samples/s/p 0:18:52 } +2024-07-26 00:55:26,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 859/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 1.1963607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:26,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.43048 samples/s/p 0:18:48 } +2024-07-26 00:55:29,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 861/ 1625], loss: 1.147, per_step_time: 1476ms, lr: 1.1953391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:29,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.41883 samples/s/p 0:18:47 } +2024-07-26 00:55:32,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 863/ 1625], loss: 1.289, per_step_time: 1470ms, lr: 1.1943227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:32,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.44060 samples/s/p 0:18:40 } +2024-07-26 00:55:35,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 865/ 1625], loss: 1.402, per_step_time: 1471ms, lr: 1.1933064e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:55:35,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.43611 samples/s/p 0:18:38 } +2024-07-26 00:55:38,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 867/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 1.1922943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:38,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.43334 samples/s/p 0:18:36 } +2024-07-26 00:55:41,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 869/ 1625], loss: 1.012, per_step_time: 1472ms, lr: 1.1912848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:41,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.43176 samples/s/p 0:18:33 } +2024-07-26 00:55:44,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 871/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 1.1902771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:44,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.42922 samples/s/p 0:18:31 } +2024-07-26 00:55:47,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 873/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 1.1892737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:47,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43481 samples/s/p 0:18:26 } +2024-07-26 00:55:50,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 875/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 1.188272e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:55:50,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43157 samples/s/p 0:18:24 } +2024-07-26 00:55:53,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 877/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 1.1872712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:53,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43141 samples/s/p 0:18:21 } +2024-07-26 00:55:56,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 879/ 1625], loss: 1.032, per_step_time: 1473ms, lr: 1.1862755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:56,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43101 samples/s/p 0:18:18 } +2024-07-26 00:55:59,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 881/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 1.1852799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:59,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43337 samples/s/p 0:18:15 } +2024-07-26 00:56:02,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 883/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 1.1842894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:02,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43380 samples/s/p 0:18:12 } +2024-07-26 00:56:05,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 885/ 1625], loss: 1.040, per_step_time: 1472ms, lr: 1.1833007e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:56:05,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43355 samples/s/p 0:18:09 } +2024-07-26 00:56:08,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 887/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 1.1823155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:08,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43803 samples/s/p 0:18:05 } +2024-07-26 00:56:11,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 889/ 1625], loss: 1.222, per_step_time: 1474ms, lr: 1.181332e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:11,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.42702 samples/s/p 0:18:04 } +2024-07-26 00:56:14,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 891/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 1.180351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:14,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43619 samples/s/p 0:18:00 } +2024-07-26 00:56:17,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 893/ 1625], loss: 1.015, per_step_time: 1471ms, lr: 1.1793726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:17,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43558 samples/s/p 0:17:57 } +2024-07-26 00:56:20,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 895/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 1.178396e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:56:20,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.42927 samples/s/p 0:17:55 } +2024-07-26 00:56:23,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 897/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 1.1774246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:23,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43389 samples/s/p 0:17:51 } +2024-07-26 00:56:25,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 899/ 1625], loss: 1.249, per_step_time: 1473ms, lr: 1.1764548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:25,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43077 samples/s/p 0:17:49 } +2024-07-26 00:56:28,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 901/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.1754878e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:28,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43811 samples/s/p 0:17:45 } +2024-07-26 00:56:31,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 903/ 1625], loss: 1.073, per_step_time: 1472ms, lr: 1.1745224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:31,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43468 samples/s/p 0:17:42 } +2024-07-26 00:56:34,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 905/ 1625], loss: 0.961, per_step_time: 1473ms, lr: 1.1735588e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:56:34,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.42827 samples/s/p 0:17:41 } +2024-07-26 00:56:37,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 907/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 1.1726003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:37,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43344 samples/s/p 0:17:37 } +2024-07-26 00:56:40,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 909/ 1625], loss: 0.983, per_step_time: 1473ms, lr: 1.1716427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:40,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.42817 samples/s/p 0:17:35 } +2024-07-26 00:56:43,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 911/ 1625], loss: 1.247, per_step_time: 1473ms, lr: 1.1706876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:43,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43028 samples/s/p 0:17:31 } +2024-07-26 00:56:46,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 913/ 1625], loss: 1.013, per_step_time: 1472ms, lr: 1.169736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:46,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43173 samples/s/p 0:17:28 } +2024-07-26 00:56:49,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 915/ 1625], loss: 1.259, per_step_time: 1469ms, lr: 1.168788e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:56:49,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.44221 samples/s/p 0:17:23 } +2024-07-26 00:56:52,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 917/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 1.1678408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:52,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43602 samples/s/p 0:17:21 } +2024-07-26 00:56:55,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 919/ 1625], loss: 1.351, per_step_time: 1472ms, lr: 1.1668986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:55,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43218 samples/s/p 0:17:19 } +2024-07-26 00:56:58,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 921/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 1.1659566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:58,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43621 samples/s/p 0:17:16 } +2024-07-26 00:57:01,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 923/ 1625], loss: 1.024, per_step_time: 1471ms, lr: 1.1650188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:01,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43765 samples/s/p 0:17:12 } +2024-07-26 00:57:04,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 925/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 1.1640828e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:57:04,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43203 samples/s/p 0:17:10 } +2024-07-26 00:57:07,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 927/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 1.1631478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:07,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43909 samples/s/p 0:17:06 } +2024-07-26 00:57:10,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 929/ 1625], loss: 1.247, per_step_time: 1473ms, lr: 1.1622195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:10,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43047 samples/s/p 0:17:05 } +2024-07-26 00:57:13,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 931/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 1.1612905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:13,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43246 samples/s/p 0:17:02 } +2024-07-26 00:57:16,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 933/ 1625], loss: 0.981, per_step_time: 1473ms, lr: 1.1603656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:16,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43087 samples/s/p 0:16:59 } +2024-07-26 00:57:19,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 935/ 1625], loss: 1.391, per_step_time: 1475ms, lr: 1.1594426e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:57:19,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.42263 samples/s/p 0:16:57 } +2024-07-26 00:57:22,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 937/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 1.1585222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:22,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43584 samples/s/p 0:16:52 } +2024-07-26 00:57:24,991 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 939/ 1625], loss: 1.020, per_step_time: 1471ms, lr: 1.1576052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:24,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43602 samples/s/p 0:16:49 } +2024-07-26 00:57:27,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 941/ 1625], loss: 1.043, per_step_time: 1471ms, lr: 1.1566899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:27,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43626 samples/s/p 0:16:46 } +2024-07-26 00:57:30,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 943/ 1625], loss: 1.395, per_step_time: 1472ms, lr: 1.1557781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:30,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43346 samples/s/p 0:16:44 } +2024-07-26 00:57:33,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 945/ 1625], loss: 1.187, per_step_time: 1473ms, lr: 1.1548681e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:57:33,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.42963 samples/s/p 0:16:41 } +2024-07-26 00:57:36,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 947/ 1625], loss: 1.033, per_step_time: 1473ms, lr: 1.1539623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:36,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.42840 samples/s/p 0:16:39 } +2024-07-26 00:57:39,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 949/ 1625], loss: 1.067, per_step_time: 1470ms, lr: 1.1530583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:39,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.44013 samples/s/p 0:16:34 } +2024-07-26 00:57:42,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 951/ 1625], loss: 1.334, per_step_time: 1473ms, lr: 1.1521586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:42,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.42781 samples/s/p 0:16:33 } +2024-07-26 00:57:45,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 953/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.1512581e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:45,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43342 samples/s/p 0:16:29 } +2024-07-26 00:57:48,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 955/ 1625], loss: 1.356, per_step_time: 1469ms, lr: 1.1503627e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:57:48,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.44270 samples/s/p 0:16:24 } +2024-07-26 00:57:51,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 957/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 1.1494699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:51,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43309 samples/s/p 0:16:23 } +2024-07-26 00:57:54,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 959/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.1485771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:54,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43419 samples/s/p 0:16:20 } +2024-07-26 00:57:57,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 961/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 1.1476903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:57,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43153 samples/s/p 0:16:17 } +2024-07-26 00:58:00,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 963/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.1468053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:00,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43732 samples/s/p 0:16:14 } +2024-07-26 00:58:03,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 965/ 1625], loss: 0.989, per_step_time: 1471ms, lr: 1.1459211e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:58:03,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43495 samples/s/p 0:16:11 } +2024-07-26 00:58:06,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 967/ 1625], loss: 1.185, per_step_time: 1473ms, lr: 1.1450413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:06,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.42928 samples/s/p 0:16:09 } +2024-07-26 00:58:09,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 969/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 1.1441632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:09,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.43878 samples/s/p 0:16:04 } +2024-07-26 00:58:12,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 971/ 1625], loss: 1.397, per_step_time: 1472ms, lr: 1.1432877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:12,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.43424 samples/s/p 0:16:02 } +2024-07-26 00:58:15,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 973/ 1625], loss: 1.293, per_step_time: 1472ms, lr: 1.1424165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:15,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.43475 samples/s/p 0:15:59 } +2024-07-26 00:58:18,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 975/ 1625], loss: 1.173, per_step_time: 1470ms, lr: 1.1415462e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:58:18,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.44084 samples/s/p 0:15:55 } +2024-07-26 00:58:21,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 977/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 1.1406785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:21,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.43295 samples/s/p 0:15:54 } +2024-07-26 00:58:24,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 979/ 1625], loss: 1.317, per_step_time: 1470ms, lr: 1.1398151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:24,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.44084 samples/s/p 0:15:49 } +2024-07-26 00:58:26,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 981/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 1.1389534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:26,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.43826 samples/s/p 0:15:47 } +2024-07-26 00:58:29,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 983/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.1380953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:29,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.43376 samples/s/p 0:15:45 } +2024-07-26 00:58:32,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 985/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 1.1372379e-06, overflow 
cond: False, loss_scale: 1.0 +2024-07-26 00:58:32,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43742 samples/s/p 0:15:41 } +2024-07-26 00:58:35,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 987/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 1.1363849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:35,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43407 samples/s/p 0:15:39 } +2024-07-26 00:58:38,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 989/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.1355327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:38,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43442 samples/s/p 0:15:36 } +2024-07-26 00:58:41,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 991/ 1625], loss: 1.498, per_step_time: 1470ms, lr: 1.1346857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:41,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43949 samples/s/p 0:15:32 } +2024-07-26 00:58:44,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 993/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 1.1338395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:44,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.44132 samples/s/p 0:15:29 } +2024-07-26 00:58:47,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 995/ 1625], loss: 1.396, per_step_time: 1470ms, lr: 1.1329969e-06, 
overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:47,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43887 samples/s/p 0:15:26 } +2024-07-26 00:58:50,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 997/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 1.1321551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:50,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43653 samples/s/p 0:15:24 } +2024-07-26 00:58:53,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 999/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 1.1313176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:53,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43731 samples/s/p 0:15:21 } +2024-07-26 00:58:56,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1001/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 1.1304828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:56,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.42762 samples/s/p 0:15:19 } +2024-07-26 00:58:59,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1003/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.1296487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:59,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43543 samples/s/p 0:15:15 } +2024-07-26 00:59:02,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1005/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 
1.1288207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:02,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43542 samples/s/p 0:15:12 } +2024-07-26 00:59:05,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1007/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 1.1279928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:05,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43460 samples/s/p 0:15:09 } +2024-07-26 00:59:08,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1009/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 1.1271692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:08,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43734 samples/s/p 0:15:06 } +2024-07-26 00:59:11,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1011/ 1625], loss: 1.373, per_step_time: 1474ms, lr: 1.1263472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:11,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.42514 samples/s/p 0:15:05 } +2024-07-26 00:59:14,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1013/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.1255271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:14,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43261 samples/s/p 0:15:01 } +2024-07-26 00:59:17,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1015/ 1625], loss: 1.164, per_step_time: 
1471ms, lr: 1.1247112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:17,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43521 samples/s/p 0:14:57 } +2024-07-26 00:59:20,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1017/ 1625], loss: 1.015, per_step_time: 1470ms, lr: 1.1238961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:20,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.44124 samples/s/p 0:14:53 } +2024-07-26 00:59:23,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1019/ 1625], loss: 0.968, per_step_time: 1470ms, lr: 1.1230854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:23,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.43875 samples/s/p 0:14:51 } +2024-07-26 00:59:25,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1021/ 1625], loss: 1.212, per_step_time: 1473ms, lr: 1.1222766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:25,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.42796 samples/s/p 0:14:50 } +2024-07-26 00:59:28,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1023/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 1.1214719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:28,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.42866 samples/s/p 0:14:47 } +2024-07-26 00:59:31,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1025/ 1625], loss: 1.134, 
per_step_time: 1470ms, lr: 1.1206673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:31,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.44041 samples/s/p 0:14:42 } +2024-07-26 00:59:34,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1027/ 1625], loss: 0.967, per_step_time: 1471ms, lr: 1.119867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:34,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.43654 samples/s/p 0:14:39 } +2024-07-26 00:59:37,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1029/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 1.1190692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:37,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.43479 samples/s/p 0:14:37 } +2024-07-26 00:59:40,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1031/ 1625], loss: 1.034, per_step_time: 1470ms, lr: 1.1182733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:40,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.44017 samples/s/p 0:14:33 } +2024-07-26 00:59:43,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1033/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 1.1174816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:43,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.43477 samples/s/p 0:14:31 } +2024-07-26 00:59:46,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1035/ 1625], 
loss: 1.089, per_step_time: 1469ms, lr: 1.1166908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:46,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.44477 samples/s/p 0:14:26 } +2024-07-26 00:59:49,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1037/ 1625], loss: 0.916, per_step_time: 1470ms, lr: 1.1159034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:49,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.44120 samples/s/p 0:14:24 } +2024-07-26 00:59:52,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1039/ 1625], loss: 0.982, per_step_time: 1470ms, lr: 1.1151195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:52,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.44178 samples/s/p 0:14:21 } +2024-07-26 00:59:55,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1041/ 1625], loss: 0.996, per_step_time: 1470ms, lr: 1.1143366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:55,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.44049 samples/s/p 0:14:18 } +2024-07-26 00:59:58,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1043/ 1625], loss: 1.281, per_step_time: 1473ms, lr: 1.1135578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:58,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.43020 samples/s/p 0:14:17 } +2024-07-26 01:00:01,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 
1045/ 1625], loss: 1.054, per_step_time: 1474ms, lr: 1.11278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:01,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.42646 samples/s/p 0:14:15 } +2024-07-26 01:00:04,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1047/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 1.1120056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:04,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.43336 samples/s/p 0:14:11 } +2024-07-26 01:00:07,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1049/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 1.1112346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:07,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.44177 samples/s/p 0:14:06 } +2024-07-26 01:00:10,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1051/ 1625], loss: 1.026, per_step_time: 1472ms, lr: 1.1104663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:10,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43159 samples/s/p 0:14:05 } +2024-07-26 01:00:13,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1053/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 1.1096997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:13,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43563 samples/s/p 0:14:01 } +2024-07-26 01:00:16,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 
10], step:[ 1055/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.1089375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:16,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43329 samples/s/p 0:13:59 } +2024-07-26 01:00:19,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1057/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.108176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:19,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43556 samples/s/p 0:13:55 } +2024-07-26 01:00:22,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1059/ 1625], loss: 1.398, per_step_time: 1474ms, lr: 1.1074172e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:22,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.42645 samples/s/p 0:13:54 } +2024-07-26 01:00:24,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1061/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 1.1066627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:24,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43459 samples/s/p 0:13:50 } +2024-07-26 01:00:27,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1063/ 1625], loss: 1.295, per_step_time: 1472ms, lr: 1.1059082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:27,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43353 samples/s/p 0:13:47 } +2024-07-26 01:00:30,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 10/ 10], step:[ 1065/ 1625], loss: 1.138, per_step_time: 1473ms, lr: 1.1051579e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:30,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.42953 samples/s/p 0:13:45 } +2024-07-26 01:00:33,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1067/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 1.1044121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:33,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.42924 samples/s/p 0:13:42 } +2024-07-26 01:00:36,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1069/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 1.1036655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:36,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.43558 samples/s/p 0:13:38 } +2024-07-26 01:00:39,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1071/ 1625], loss: 0.999, per_step_time: 1472ms, lr: 1.1029247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:39,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.43474 samples/s/p 0:13:35 } +2024-07-26 01:00:42,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1073/ 1625], loss: 1.262, per_step_time: 1473ms, lr: 1.1021832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:42,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.42869 samples/s/p 0:13:33 } +2024-07-26 01:00:45,661 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 10/ 10], step:[ 1075/ 1625], loss: 1.200, per_step_time: 1473ms, lr: 1.1014486e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:45,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.42992 samples/s/p 0:13:30 } +2024-07-26 01:00:48,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1077/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 1.1007139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:48,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.43553 samples/s/p 0:13:26 } +2024-07-26 01:00:51,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1079/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.0999811e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:51,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.43526 samples/s/p 0:13:23 } +2024-07-26 01:00:54,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1081/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.0992525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:54,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43712 samples/s/p 0:13:20 } +2024-07-26 01:00:57,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1083/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.0985265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:57,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43304 samples/s/p 0:13:18 } +2024-07-26 01:01:00,414 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1085/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 1.0978031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:00,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43850 samples/s/p 0:13:14 } +2024-07-26 01:01:03,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1087/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 1.0970814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:03,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43585 samples/s/p 0:13:11 } +2024-07-26 01:01:06,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1089/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.0963632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:06,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43301 samples/s/p 0:13:09 } +2024-07-26 01:01:09,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1091/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 1.0956476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:09,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43812 samples/s/p 0:13:05 } +2024-07-26 01:01:12,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1093/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 1.0949345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:12,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43302 samples/s/p 0:13:03 } +2024-07-26 
01:01:15,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1095/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 1.094225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:15,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43188 samples/s/p 0:13:00 } +2024-07-26 01:01:18,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1097/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 1.0935163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:18,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43332 samples/s/p 0:12:57 } +2024-07-26 01:01:21,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1099/ 1625], loss: 1.011, per_step_time: 1471ms, lr: 1.0928111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:21,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43640 samples/s/p 0:12:54 } +2024-07-26 01:01:24,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1101/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 1.0921093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:24,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43423 samples/s/p 0:12:51 } +2024-07-26 01:01:26,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1103/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 1.0914084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:26,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43800 samples/s/p 0:12:47 } 
+2024-07-26 01:01:29,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1105/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 1.0907135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:29,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43792 samples/s/p 0:12:44 } +2024-07-26 01:01:32,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1107/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 1.0900178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:32,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43984 samples/s/p 0:12:41 } +2024-07-26 01:01:35,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1109/ 1625], loss: 1.027, per_step_time: 1470ms, lr: 1.0893273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:35,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43966 samples/s/p 0:12:38 } +2024-07-26 01:01:38,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1111/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 1.0886375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:38,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43464 samples/s/p 0:12:36 } +2024-07-26 01:01:41,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1113/ 1625], loss: 1.007, per_step_time: 1470ms, lr: 1.0879496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:41,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.44145 samples/s/p 
0:12:32 } +2024-07-26 01:01:44,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1115/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 1.0872668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:44,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43817 samples/s/p 0:12:30 } +2024-07-26 01:01:47,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1117/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.0865875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:47,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43547 samples/s/p 0:12:27 } +2024-07-26 01:01:50,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1119/ 1625], loss: 1.302, per_step_time: 1472ms, lr: 1.0859081e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:50,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43140 samples/s/p 0:12:25 } +2024-07-26 01:01:53,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1121/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 1.0852315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:53,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.44138 samples/s/p 0:12:20 } +2024-07-26 01:01:56,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1123/ 1625], loss: 0.982, per_step_time: 1472ms, lr: 1.084559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:56,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43423 
samples/s/p 0:12:19 } +2024-07-26 01:01:59,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1125/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.0838884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:59,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43124 samples/s/p 0:12:16 } +2024-07-26 01:02:02,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1127/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.0832194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:02,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43608 samples/s/p 0:12:12 } +2024-07-26 01:02:05,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1129/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.0825556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:05,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43531 samples/s/p 0:12:10 } +2024-07-26 01:02:08,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1131/ 1625], loss: 1.022, per_step_time: 1471ms, lr: 1.0818919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:08,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43518 samples/s/p 0:12:07 } +2024-07-26 01:02:11,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1133/ 1625], loss: 1.336, per_step_time: 1472ms, lr: 1.0812325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:11,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ 
| 5.43353 samples/s/p 0:12:04 } +2024-07-26 01:02:14,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1135/ 1625], loss: 1.187, per_step_time: 1470ms, lr: 1.0805747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:14,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43997 samples/s/p 0:12:00 } +2024-07-26 01:02:17,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1137/ 1625], loss: 1.188, per_step_time: 1470ms, lr: 1.0799223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:17,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.44005 samples/s/p 0:11:57 } +2024-07-26 01:02:20,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1139/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 1.0792688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:20,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43508 samples/s/p 0:11:55 } +2024-07-26 01:02:23,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1141/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.0786198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:23,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43715 samples/s/p 0:11:52 } +2024-07-26 01:02:25,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1143/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 1.0779751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:25,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% 
|████████████████████████████████████████████████ | 5.43433 samples/s/p 0:11:49 } +2024-07-26 01:02:28,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1145/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 1.0773304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:28,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43793 samples/s/p 0:11:46 } +2024-07-26 01:02:31,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1147/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.076689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:31,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43739 samples/s/p 0:11:43 } +2024-07-26 01:02:34,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1149/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 1.0760511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:34,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43435 samples/s/p 0:11:40 } +2024-07-26 01:02:37,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1151/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 1.0754143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:37,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43399 samples/s/p 0:11:37 } +2024-07-26 01:02:40,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1153/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 1.0747824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:40,722 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 97.1% |████████████████████████████████████████████████ | 5.43966 samples/s/p 0:11:34 } +2024-07-26 01:02:43,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1155/ 1625], loss: 1.252, per_step_time: 1469ms, lr: 1.0741506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:43,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.44259 samples/s/p 0:11:30 } +2024-07-26 01:02:46,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1157/ 1625], loss: 1.315, per_step_time: 1471ms, lr: 1.0735232e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:46,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43549 samples/s/p 0:11:28 } +2024-07-26 01:02:49,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1159/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.0728984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:49,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43505 samples/s/p 0:11:25 } +2024-07-26 01:02:52,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1161/ 1625], loss: 0.912, per_step_time: 1471ms, lr: 1.0722744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:52,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43560 samples/s/p 0:11:22 } +2024-07-26 01:02:55,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1163/ 1625], loss: 0.951, per_step_time: 1471ms, lr: 1.0716547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:55,471 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43610 samples/s/p 0:11:19 } +2024-07-26 01:02:58,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1165/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 1.0710376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:58,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.42997 samples/s/p 0:11:17 } +2024-07-26 01:03:01,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1167/ 1625], loss: 1.370, per_step_time: 1472ms, lr: 1.070424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:01,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43112 samples/s/p 0:11:14 } +2024-07-26 01:03:04,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1169/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 1.0698112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:04,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43743 samples/s/p 0:11:10 } +2024-07-26 01:03:07,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1171/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 1.0692028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:07,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43798 samples/s/p 0:11:07 } +2024-07-26 01:03:10,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1173/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 1.0685951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 
01:03:10,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43283 samples/s/p 0:11:05 } +2024-07-26 01:03:13,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1175/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.0679919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:13,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43572 samples/s/p 0:11:02 } +2024-07-26 01:03:16,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1177/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 1.0673913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:16,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43576 samples/s/p 0:10:59 } +2024-07-26 01:03:19,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1179/ 1625], loss: 1.011, per_step_time: 1472ms, lr: 1.0667932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:19,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43154 samples/s/p 0:10:56 } +2024-07-26 01:03:22,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1181/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 1.0661968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:22,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43544 samples/s/p 0:10:53 } +2024-07-26 01:03:24,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1183/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 1.0656022e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-26 01:03:24,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43981 samples/s/p 0:10:50 } +2024-07-26 01:03:27,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1185/ 1625], loss: 1.198, per_step_time: 1473ms, lr: 1.0650127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:27,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.42788 samples/s/p 0:10:48 } +2024-07-26 01:03:30,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1187/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 1.0644251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:30,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43139 samples/s/p 0:10:45 } +2024-07-26 01:03:33,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1189/ 1625], loss: 1.031, per_step_time: 1474ms, lr: 1.0638399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:33,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.42720 samples/s/p 0:10:42 } +2024-07-26 01:03:36,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1191/ 1625], loss: 0.941, per_step_time: 1473ms, lr: 1.0632566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:36,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.42933 samples/s/p 0:10:39 } +2024-07-26 01:03:39,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1193/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 1.0626775e-06, overflow cond: False, 
loss_scale: 1.0 +2024-07-26 01:03:39,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43820 samples/s/p 0:10:35 } +2024-07-26 01:03:42,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1195/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 1.0621011e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:42,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43377 samples/s/p 0:10:33 } +2024-07-26 01:03:45,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1197/ 1625], loss: 1.254, per_step_time: 1470ms, lr: 1.0615246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:45,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.44036 samples/s/p 0:10:29 } +2024-07-26 01:03:48,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1199/ 1625], loss: 1.116, per_step_time: 1473ms, lr: 1.0609533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:48,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43050 samples/s/p 0:10:27 } +2024-07-26 01:03:51,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1201/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 1.0603829e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:51,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43153 samples/s/p 0:10:24 } +2024-07-26 01:03:54,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1203/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 1.0598177e-06, overflow 
cond: False, loss_scale: 1.0 +2024-07-26 01:03:54,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43405 samples/s/p 0:10:21 } +2024-07-26 01:03:57,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1205/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 1.0592541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:57,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43565 samples/s/p 0:10:18 } +2024-07-26 01:04:00,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1207/ 1625], loss: 0.954, per_step_time: 1471ms, lr: 1.0586924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:00,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43509 samples/s/p 0:10:15 } +2024-07-26 01:04:03,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1209/ 1625], loss: 0.949, per_step_time: 1471ms, lr: 1.0581332e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:03,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43778 samples/s/p 0:10:12 } +2024-07-26 01:04:06,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1211/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 1.0575784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:06,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43091 samples/s/p 0:10:09 } +2024-07-26 01:04:09,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1213/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 
1.0570244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:09,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43320 samples/s/p 0:10:06 } +2024-07-26 01:04:12,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1215/ 1625], loss: 1.362, per_step_time: 1470ms, lr: 1.0564738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:12,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43999 samples/s/p 0:10:02 } +2024-07-26 01:04:15,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1217/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 1.0559268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:15,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.42976 samples/s/p 0:10:01 } +2024-07-26 01:04:18,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1219/ 1625], loss: 1.181, per_step_time: 1473ms, lr: 1.0553805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:18,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43027 samples/s/p 0:09:58 } +2024-07-26 01:04:21,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1221/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 1.0548387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:21,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43207 samples/s/p 0:09:54 } +2024-07-26 01:04:24,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1223/ 1625], loss: 1.189, per_step_time: 
1470ms, lr: 1.0542967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:24,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.44133 samples/s/p 0:09:51 } +2024-07-26 01:04:26,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1225/ 1625], loss: 1.046, per_step_time: 1472ms, lr: 1.0537617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:26,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43461 samples/s/p 0:09:48 } +2024-07-26 01:04:29,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1227/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.0532268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:29,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43600 samples/s/p 0:09:45 } +2024-07-26 01:04:32,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1229/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 1.0526935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:32,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43702 samples/s/p 0:09:42 } +2024-07-26 01:04:35,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1231/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 1.0521646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:35,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43329 samples/s/p 0:09:40 } +2024-07-26 01:04:38,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1233/ 1625], loss: 1.109, 
per_step_time: 1472ms, lr: 1.0516374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:38,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43148 samples/s/p 0:09:37 } +2024-07-26 01:04:41,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1235/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 1.0511145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:41,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43365 samples/s/p 0:09:34 } +2024-07-26 01:04:44,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1237/ 1625], loss: 1.166, per_step_time: 1470ms, lr: 1.0505934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:44,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.44194 samples/s/p 0:09:30 } +2024-07-26 01:04:47,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1239/ 1625], loss: 1.200, per_step_time: 1475ms, lr: 1.0500747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:47,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.42055 samples/s/p 0:09:29 } +2024-07-26 01:04:50,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1241/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.0495597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:50,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43319 samples/s/p 0:09:25 } +2024-07-26 01:04:53,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1243/ 1625], 
loss: 1.115, per_step_time: 1471ms, lr: 1.0490463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:53,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43717 samples/s/p 0:09:22 } +2024-07-26 01:04:56,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1245/ 1625], loss: 1.024, per_step_time: 1470ms, lr: 1.0485355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:56,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.44080 samples/s/p 0:09:18 } +2024-07-26 01:04:59,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1247/ 1625], loss: 1.284, per_step_time: 1471ms, lr: 1.0480273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:59,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43611 samples/s/p 0:09:16 } +2024-07-26 01:05:02,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1249/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 1.0475218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:02,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43234 samples/s/p 0:09:13 } +2024-07-26 01:05:05,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1251/ 1625], loss: 1.355, per_step_time: 1472ms, lr: 1.0470196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:05,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43418 samples/s/p 0:09:10 } +2024-07-26 01:05:08,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 
1253/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.0465192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:08,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43631 samples/s/p 0:09:07 } +2024-07-26 01:05:11,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1255/ 1625], loss: 1.096, per_step_time: 1474ms, lr: 1.0460213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:11,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.42645 samples/s/p 0:09:05 } +2024-07-26 01:05:14,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1257/ 1625], loss: 1.218, per_step_time: 1470ms, lr: 1.0455278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:14,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.44117 samples/s/p 0:09:01 } +2024-07-26 01:05:17,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1259/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.0450344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:17,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43731 samples/s/p 0:08:58 } +2024-07-26 01:05:20,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1261/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 1.044546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:20,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43696 samples/s/p 0:08:55 } +2024-07-26 01:05:23,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 
10], step:[ 1263/ 1625], loss: 1.073, per_step_time: 1472ms, lr: 1.0440604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:23,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43148 samples/s/p 0:08:53 } +2024-07-26 01:05:25,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1265/ 1625], loss: 0.953, per_step_time: 1471ms, lr: 1.0435755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:25,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43729 samples/s/p 0:08:49 } +2024-07-26 01:05:28,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1267/ 1625], loss: 1.072, per_step_time: 1470ms, lr: 1.0430958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:28,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.44047 samples/s/p 0:08:46 } +2024-07-26 01:05:31,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1269/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 1.0426162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:31,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43825 samples/s/p 0:08:43 } +2024-07-26 01:05:34,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1271/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 1.042139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:34,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43705 samples/s/p 0:08:40 } +2024-07-26 01:05:37,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 10/ 10], step:[ 1273/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 1.0416654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:37,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43178 samples/s/p 0:08:38 } +2024-07-26 01:05:40,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1275/ 1625], loss: 0.948, per_step_time: 1470ms, lr: 1.0411961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:40,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43990 samples/s/p 0:08:34 } +2024-07-26 01:05:43,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1277/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 1.0407277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:43,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.44172 samples/s/p 0:08:31 } +2024-07-26 01:05:46,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1279/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 1.0402645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:46,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43173 samples/s/p 0:08:29 } +2024-07-26 01:05:49,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1281/ 1625], loss: 1.083, per_step_time: 1470ms, lr: 1.0398012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:49,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.44012 samples/s/p 0:08:25 } +2024-07-26 01:05:52,535 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 10/ 10], step:[ 1283/ 1625], loss: 1.330, per_step_time: 1472ms, lr: 1.0393405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:52,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43447 samples/s/p 0:08:23 } +2024-07-26 01:05:55,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1285/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 1.0388834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:55,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43263 samples/s/p 0:08:20 } +2024-07-26 01:05:58,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1287/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.0384288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:58,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43303 samples/s/p 0:08:17 } +2024-07-26 01:06:01,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1289/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.0379767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:01,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43376 samples/s/p 0:08:14 } +2024-07-26 01:06:04,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1291/ 1625], loss: 1.036, per_step_time: 1472ms, lr: 1.0375273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:04,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43476 samples/s/p 0:08:11 } +2024-07-26 01:06:07,296 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1293/ 1625], loss: 1.026, per_step_time: 1473ms, lr: 1.0370796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:07,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.42864 samples/s/p 0:08:09 } +2024-07-26 01:06:10,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1295/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.0366372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:10,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.43263 samples/s/p 0:08:05 } +2024-07-26 01:06:13,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1297/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 1.0361964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:13,200 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.43495 samples/s/p 0:08:02 } +2024-07-26 01:06:16,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1299/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 1.0357581e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:16,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.43961 samples/s/p 0:07:59 } +2024-07-26 01:06:19,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1301/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 1.0353217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:19,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.43756 samples/s/p 0:07:56 } +2024-07-26 
01:06:22,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1303/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 1.034887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:22,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.43696 samples/s/p 0:07:53 } +2024-07-26 01:06:24,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1305/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 1.0344575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:24,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.43950 samples/s/p 0:07:50 } +2024-07-26 01:06:27,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1307/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 1.0340297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:27,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.43334 samples/s/p 0:07:48 } +2024-07-26 01:06:30,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1309/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 1.0336053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:30,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43093 samples/s/p 0:07:45 } +2024-07-26 01:06:33,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1311/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 1.0331818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:33,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43459 samples/s/p 0:07:42 
} +2024-07-26 01:06:36,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1313/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 1.0327626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:36,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43063 samples/s/p 0:07:39 } +2024-07-26 01:06:39,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1315/ 1625], loss: 1.175, per_step_time: 1470ms, lr: 1.0323444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:39,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.44201 samples/s/p 0:07:35 } +2024-07-26 01:06:42,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1317/ 1625], loss: 1.289, per_step_time: 1469ms, lr: 1.0319303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:42,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.44221 samples/s/p 0:07:32 } +2024-07-26 01:06:45,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1319/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 1.0315181e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:45,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43432 samples/s/p 0:07:30 } +2024-07-26 01:06:48,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1321/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 1.0311085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:48,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.44062 
samples/s/p 0:07:27 } +2024-07-26 01:06:51,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1323/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 1.0307023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:51,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43555 samples/s/p 0:07:24 } +2024-07-26 01:06:54,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1325/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 1.0302995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:54,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43228 samples/s/p 0:07:21 } +2024-07-26 01:06:57,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1327/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.0298976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:57,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43682 samples/s/p 0:07:18 } +2024-07-26 01:07:00,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1329/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 1.0295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:00,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43754 samples/s/p 0:07:15 } +2024-07-26 01:07:03,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1331/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 1.0291034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:03,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% 
|█████████████████████████████████████████████████ | 5.43252 samples/s/p 0:07:12 } +2024-07-26 01:07:06,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1333/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 1.0287101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:06,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43321 samples/s/p 0:07:09 } +2024-07-26 01:07:09,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1335/ 1625], loss: 1.321, per_step_time: 1472ms, lr: 1.0283194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:09,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43430 samples/s/p 0:07:06 } +2024-07-26 01:07:12,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1337/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 1.0279323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:12,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43276 samples/s/p 0:07:04 } +2024-07-26 01:07:15,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1339/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 1.0275477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:15,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43685 samples/s/p 0:07:00 } +2024-07-26 01:07:18,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1341/ 1625], loss: 1.299, per_step_time: 1473ms, lr: 1.0271639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:18,114 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 98.3% |█████████████████████████████████████████████████ | 5.42790 samples/s/p 0:06:58 } +2024-07-26 01:07:21,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1343/ 1625], loss: 1.197, per_step_time: 1473ms, lr: 1.0267854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:21,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.43087 samples/s/p 0:06:55 } +2024-07-26 01:07:24,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1345/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 1.0264085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:24,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.43248 samples/s/p 0:06:52 } +2024-07-26 01:07:26,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1347/ 1625], loss: 1.188, per_step_time: 1470ms, lr: 1.0260335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:26,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.44045 samples/s/p 0:06:48 } +2024-07-26 01:07:29,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1349/ 1625], loss: 1.021, per_step_time: 1473ms, lr: 1.0256618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:29,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.42877 samples/s/p 0:06:46 } +2024-07-26 01:07:32,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1351/ 1625], loss: 1.010, per_step_time: 1472ms, lr: 1.025291e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:32,874 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.43136 samples/s/p 0:06:43 } +2024-07-26 01:07:35,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1353/ 1625], loss: 1.098, per_step_time: 1479ms, lr: 1.0249263e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:35,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.40716 samples/s/p 0:06:42 } +2024-07-26 01:07:38,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1355/ 1625], loss: 1.032, per_step_time: 1473ms, lr: 1.0245616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:38,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.42759 samples/s/p 0:06:37 } +2024-07-26 01:07:41,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1357/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 1.0242012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:41,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43179 samples/s/p 0:06:34 } +2024-07-26 01:07:44,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1359/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 1.0238425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:44,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43469 samples/s/p 0:06:31 } +2024-07-26 01:07:47,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1361/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 1.0234857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 
01:07:47,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43956 samples/s/p 0:06:28 } +2024-07-26 01:07:50,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1363/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 1.023133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:50,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43393 samples/s/p 0:06:25 } +2024-07-26 01:07:53,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1365/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 1.022783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:53,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43604 samples/s/p 0:06:22 } +2024-07-26 01:07:56,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1367/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 1.0224346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:56,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43233 samples/s/p 0:06:19 } +2024-07-26 01:07:59,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1369/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.0220889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:59,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43389 samples/s/p 0:06:16 } +2024-07-26 01:08:02,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1371/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 1.0217484e-06, overflow cond: False, loss_scale: 
1.0 +2024-07-26 01:08:02,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43889 samples/s/p 0:06:13 } +2024-07-26 01:08:05,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1373/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 1.0214079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:05,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43286 samples/s/p 0:06:11 } +2024-07-26 01:08:08,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1375/ 1625], loss: 1.065, per_step_time: 1469ms, lr: 1.0210725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:08,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.44287 samples/s/p 0:06:07 } +2024-07-26 01:08:11,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1377/ 1625], loss: 0.925, per_step_time: 1470ms, lr: 1.0207364e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:11,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.44079 samples/s/p 0:06:04 } +2024-07-26 01:08:14,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1379/ 1625], loss: 1.088, per_step_time: 1471ms, lr: 1.0204053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:14,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.43528 samples/s/p 0:06:02 } +2024-07-26 01:08:17,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1381/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 1.0200761e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 01:08:17,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.42758 samples/s/p 0:05:59 } +2024-07-26 01:08:20,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1383/ 1625], loss: 1.464, per_step_time: 1473ms, lr: 1.0197493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:20,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.42801 samples/s/p 0:05:56 } +2024-07-26 01:08:23,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1385/ 1625], loss: 1.312, per_step_time: 1471ms, lr: 1.0194253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:23,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.43816 samples/s/p 0:05:53 } +2024-07-26 01:08:26,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1387/ 1625], loss: 1.335, per_step_time: 1473ms, lr: 1.0191037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:26,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.43069 samples/s/p 0:05:50 } +2024-07-26 01:08:28,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1389/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 1.0187874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:28,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.42957 samples/s/p 0:05:47 } +2024-07-26 01:08:31,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1391/ 1625], loss: 1.022, per_step_time: 1469ms, lr: 1.0184702e-06, 
overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:31,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.44252 samples/s/p 0:05:43 } +2024-07-26 01:08:34,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1393/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 1.0181583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:34,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.42950 samples/s/p 0:05:41 } +2024-07-26 01:08:37,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1395/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 1.017848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:37,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.44096 samples/s/p 0:05:38 } +2024-07-26 01:08:40,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1397/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.0175395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:40,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43561 samples/s/p 0:05:35 } +2024-07-26 01:08:43,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1399/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.0172334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:43,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43622 samples/s/p 0:05:32 } +2024-07-26 01:08:46,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1401/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 
1.0169335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:46,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43273 samples/s/p 0:05:29 } +2024-07-26 01:08:49,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1403/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 1.0166336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:49,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43546 samples/s/p 0:05:26 } +2024-07-26 01:08:52,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1405/ 1625], loss: 1.306, per_step_time: 1471ms, lr: 1.0163363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:52,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43479 samples/s/p 0:05:23 } +2024-07-26 01:08:55,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1407/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 1.0160417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:55,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43829 samples/s/p 0:05:20 } +2024-07-26 01:08:58,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1409/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 1.0157504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:58,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43801 samples/s/p 0:05:17 } +2024-07-26 01:09:01,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1411/ 1625], loss: 1.178, 
per_step_time: 1471ms, lr: 1.0154608e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:01,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43546 samples/s/p 0:05:14 } +2024-07-26 01:09:04,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1413/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 1.0151748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:04,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43171 samples/s/p 0:05:12 } +2024-07-26 01:09:07,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1415/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 1.0148922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:07,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43559 samples/s/p 0:05:09 } +2024-07-26 01:09:10,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1417/ 1625], loss: 1.266, per_step_time: 1474ms, lr: 1.0146105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:10,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.42494 samples/s/p 0:05:06 } +2024-07-26 01:09:13,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1419/ 1625], loss: 1.294, per_step_time: 1471ms, lr: 1.0143322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:13,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43713 samples/s/p 0:05:03 } +2024-07-26 01:09:16,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1421/ 
1625], loss: 1.016, per_step_time: 1470ms, lr: 1.0140565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:16,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.44055 samples/s/p 0:04:59 } +2024-07-26 01:09:19,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1423/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 1.0137842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:19,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.44085 samples/s/p 0:04:57 } +2024-07-26 01:09:22,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1425/ 1625], loss: 1.024, per_step_time: 1469ms, lr: 1.0135137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:22,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.44339 samples/s/p 0:04:53 } +2024-07-26 01:09:25,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1427/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 1.0132458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:25,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43502 samples/s/p 0:04:51 } +2024-07-26 01:09:27,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1429/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 1.0129821e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:27,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43604 samples/s/p 0:04:48 } +2024-07-26 01:09:30,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 
10], step:[ 1431/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 1.0127186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:30,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43002 samples/s/p 0:04:45 } +2024-07-26 01:09:33,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1433/ 1625], loss: 1.240, per_step_time: 1470ms, lr: 1.0124593e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:33,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43992 samples/s/p 0:04:42 } +2024-07-26 01:09:36,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1435/ 1625], loss: 1.151, per_step_time: 1470ms, lr: 1.0122026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43869 samples/s/p 0:04:39 } +2024-07-26 01:09:39,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1437/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 1.0119476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:39,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43647 samples/s/p 0:04:36 } +2024-07-26 01:09:42,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1439/ 1625], loss: 1.149, per_step_time: 1473ms, lr: 1.0116961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:42,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.42992 samples/s/p 0:04:34 } +2024-07-26 01:09:45,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 10/ 10], step:[ 1441/ 1625], loss: 1.391, per_step_time: 1471ms, lr: 1.0114472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:45,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43698 samples/s/p 0:04:30 } +2024-07-26 01:09:48,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1443/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 1.0112018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:48,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43687 samples/s/p 0:04:27 } +2024-07-26 01:09:51,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1445/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 1.010958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:51,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43397 samples/s/p 0:04:24 } +2024-07-26 01:09:54,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1447/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 1.0107178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:54,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43695 samples/s/p 0:04:21 } +2024-07-26 01:09:57,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1449/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 1.0104792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:57,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43146 samples/s/p 0:04:19 } +2024-07-26 01:10:00,429 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1451/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 1.0102442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:00,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43238 samples/s/p 0:04:16 } +2024-07-26 01:10:03,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1453/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 1.0100108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:03,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43564 samples/s/p 0:04:13 } +2024-07-26 01:10:06,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1455/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 1.0097809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:06,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43870 samples/s/p 0:04:10 } +2024-07-26 01:10:09,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1457/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 1.0095536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:09,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43411 samples/s/p 0:04:07 } +2024-07-26 01:10:12,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1459/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 1.0093289e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:12,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43265 samples/s/p 0:04:04 } +2024-07-26 
01:10:15,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1461/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 1.0091077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:15,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43813 samples/s/p 0:04:01 } +2024-07-26 01:10:18,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1463/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 1.0088872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:18,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43446 samples/s/p 0:03:58 } +2024-07-26 01:10:21,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1465/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.008672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:21,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43715 samples/s/p 0:03:55 } +2024-07-26 01:10:24,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1467/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 1.008456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:24,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43295 samples/s/p 0:03:52 } +2024-07-26 01:10:26,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1469/ 1625], loss: 1.197, per_step_time: 1469ms, lr: 1.0082451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:26,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.44370 samples/s/p 0:03:49 
} +2024-07-26 01:10:29,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1471/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 1.0080369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:29,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43282 samples/s/p 0:03:46 } +2024-07-26 01:10:32,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1473/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 1.0078303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:32,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43487 samples/s/p 0:03:43 } +2024-07-26 01:10:35,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1475/ 1625], loss: 1.106, per_step_time: 1470ms, lr: 1.007628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:35,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.44169 samples/s/p 0:03:40 } +2024-07-26 01:10:38,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1477/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 1.0074266e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:38,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43794 samples/s/p 0:03:37 } +2024-07-26 01:10:41,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1479/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.0072288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:41,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43122 
samples/s/p 0:03:35 } +2024-07-26 01:10:44,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1481/ 1625], loss: 1.242, per_step_time: 1473ms, lr: 1.0070335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:44,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43092 samples/s/p 0:03:32 } +2024-07-26 01:10:47,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1483/ 1625], loss: 1.175, per_step_time: 1473ms, lr: 1.0068399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:47,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43070 samples/s/p 0:03:29 } +2024-07-26 01:10:50,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1485/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 1.0066514e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:50,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43310 samples/s/p 0:03:26 } +2024-07-26 01:10:53,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1487/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 1.0064639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:53,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43171 samples/s/p 0:03:23 } +2024-07-26 01:10:56,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1489/ 1625], loss: 1.146, per_step_time: 1470ms, lr: 1.0062789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:56,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% 
|█████████████████████████████████████████████████ | 5.43979 samples/s/p 0:03:20 } +2024-07-26 01:10:59,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1491/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 1.0060966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:59,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43779 samples/s/p 0:03:17 } +2024-07-26 01:11:02,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1493/ 1625], loss: 1.116, per_step_time: 1470ms, lr: 1.0059176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:02,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.44156 samples/s/p 0:03:14 } +2024-07-26 01:11:05,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1495/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 1.0057405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:05,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43162 samples/s/p 0:03:11 } +2024-07-26 01:11:08,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1497/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 1.0055668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:08,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43482 samples/s/p 0:03:08 } +2024-07-26 01:11:11,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1499/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 1.0053948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:11,244 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 99.2% |█████████████████████████████████████████████████ | 5.43466 samples/s/p 0:03:05 } +2024-07-26 01:11:14,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1501/ 1625], loss: 1.007, per_step_time: 1470ms, lr: 1.0052271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:14,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43907 samples/s/p 0:03:02 } +2024-07-26 01:11:17,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1503/ 1625], loss: 1.278, per_step_time: 1474ms, lr: 1.0050603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:17,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.42607 samples/s/p 0:02:59 } +2024-07-26 01:11:20,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1505/ 1625], loss: 1.297, per_step_time: 1474ms, lr: 1.0048986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:20,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.42681 samples/s/p 0:02:56 } +2024-07-26 01:11:23,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1507/ 1625], loss: 1.339, per_step_time: 1471ms, lr: 1.0047371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:23,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43697 samples/s/p 0:02:53 } +2024-07-26 01:11:26,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1509/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 1.0045788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:26,009 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.42902 samples/s/p 0:02:50 } +2024-07-26 01:11:28,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1511/ 1625], loss: 1.417, per_step_time: 1471ms, lr: 1.0044242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:28,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43512 samples/s/p 0:02:47 } +2024-07-26 01:11:31,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1513/ 1625], loss: 1.030, per_step_time: 1470ms, lr: 1.0042712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:31,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.44057 samples/s/p 0:02:44 } +2024-07-26 01:11:34,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1515/ 1625], loss: 1.305, per_step_time: 1471ms, lr: 1.00412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:34,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43745 samples/s/p 0:02:41 } +2024-07-26 01:11:37,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1517/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 1.0039756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:37,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43783 samples/s/p 0:02:38 } +2024-07-26 01:11:40,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1519/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.0038295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 
01:11:40,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43719 samples/s/p 0:02:35 } +2024-07-26 01:11:43,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1521/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 1.0036896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:43,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43719 samples/s/p 0:02:33 } +2024-07-26 01:11:46,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1523/ 1625], loss: 1.315, per_step_time: 1470ms, lr: 1.0035478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:46,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.44052 samples/s/p 0:02:29 } +2024-07-26 01:11:49,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1525/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 1.0034121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:49,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43363 samples/s/p 0:02:27 } +2024-07-26 01:11:52,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1527/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.0032782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:52,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43414 samples/s/p 0:02:24 } +2024-07-26 01:11:55,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1529/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 1.0031486e-06, overflow cond: False, loss_scale: 
1.0 +2024-07-26 01:11:55,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43541 samples/s/p 0:02:21 } +2024-07-26 01:11:58,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1531/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 1.0030188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:58,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43703 samples/s/p 0:02:18 } +2024-07-26 01:12:01,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1533/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.0028936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:01,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43525 samples/s/p 0:02:15 } +2024-07-26 01:12:04,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1535/ 1625], loss: 1.300, per_step_time: 1472ms, lr: 1.0027709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:04,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43439 samples/s/p 0:02:12 } +2024-07-26 01:12:07,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1537/ 1625], loss: 1.136, per_step_time: 1474ms, lr: 1.0026498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:07,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.42418 samples/s/p 0:02:09 } +2024-07-26 01:12:10,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1539/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 1.0025315e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 01:12:10,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43827 samples/s/p 0:02:06 } +2024-07-26 01:12:13,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1541/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 1.0024182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:13,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43754 samples/s/p 0:02:03 } +2024-07-26 01:12:16,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1543/ 1625], loss: 1.210, per_step_time: 1475ms, lr: 1.0023033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:16,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.42263 samples/s/p 0:02:00 } +2024-07-26 01:12:19,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1545/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.0021944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:19,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43556 samples/s/p 0:01:57 } +2024-07-26 01:12:22,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1547/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 1.0020872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:22,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43310 samples/s/p 0:01:54 } +2024-07-26 01:12:25,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1549/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 1.0019844e-06, 
overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:25,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43368 samples/s/p 0:01:51 } +2024-07-26 01:12:27,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1551/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 1.0018815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:27,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43439 samples/s/p 0:01:48 } +2024-07-26 01:12:30,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1553/ 1625], loss: 1.234, per_step_time: 1470ms, lr: 1.0017839e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:30,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43957 samples/s/p 0:01:45 } +2024-07-26 01:12:33,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1555/ 1625], loss: 1.012, per_step_time: 1470ms, lr: 1.0016853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:33,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43971 samples/s/p 0:01:42 } +2024-07-26 01:12:36,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1557/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.0015929e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:36,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43307 samples/s/p 0:01:40 } +2024-07-26 01:12:39,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1559/ 1625], loss: 1.304, per_step_time: 1473ms, lr: 
1.0015021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:39,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43105 samples/s/p 0:01:37 } +2024-07-26 01:12:42,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1561/ 1625], loss: 1.253, per_step_time: 1469ms, lr: 1.0014131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:42,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.44245 samples/s/p 0:01:34 } +2024-07-26 01:12:45,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1563/ 1625], loss: 1.060, per_step_time: 1471ms, lr: 1.0013284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:45,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43505 samples/s/p 0:01:31 } +2024-07-26 01:12:48,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1565/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 1.0012462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:48,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43571 samples/s/p 0:01:28 } +2024-07-26 01:12:51,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1567/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 1.0011634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:51,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43688 samples/s/p 0:01:25 } +2024-07-26 01:12:54,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1569/ 1625], loss: 1.271, 
per_step_time: 1472ms, lr: 1.0010881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:54,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43434 samples/s/p 0:01:22 } +2024-07-26 01:12:57,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1571/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.001012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:57,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43602 samples/s/p 0:01:19 } +2024-07-26 01:13:00,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1573/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 1.0009412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:00,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43909 samples/s/p 0:01:16 } +2024-07-26 01:13:03,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1575/ 1625], loss: 1.268, per_step_time: 1472ms, lr: 1.0008712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:03,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43190 samples/s/p 0:01:13 } +2024-07-26 01:13:06,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1577/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 1.0008029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:06,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43688 samples/s/p 0:01:10 } +2024-07-26 01:13:09,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1579/ 
1625], loss: 1.054, per_step_time: 1472ms, lr: 1.000738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:09,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43453 samples/s/p 0:01:07 } +2024-07-26 01:13:12,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1581/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 1.0006768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:12,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43453 samples/s/p 0:01:04 } +2024-07-26 01:13:15,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1583/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.000618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:15,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43352 samples/s/p 0:01:01 } +2024-07-26 01:13:18,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1585/ 1625], loss: 1.182, per_step_time: 1470ms, lr: 1.0005626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:18,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43963 samples/s/p 0:00:58 } +2024-07-26 01:13:21,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1587/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 1.0005091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:21,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43292 samples/s/p 0:00:55 } +2024-07-26 01:13:24,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], 
step:[ 1589/ 1625], loss: 1.180, per_step_time: 1470ms, lr: 1.000458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:24,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.44155 samples/s/p 0:00:52 } +2024-07-26 01:13:26,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1591/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 1.0004088e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:26,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43685 samples/s/p 0:00:50 } +2024-07-26 01:13:29,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1593/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 1.0003639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:29,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43568 samples/s/p 0:00:47 } +2024-07-26 01:13:32,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1595/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 1.0003206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:32,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43312 samples/s/p 0:00:44 } +2024-07-26 01:13:35,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1597/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 1.0002809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:35,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43656 samples/s/p 0:00:41 } +2024-07-26 01:13:38,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 10/ 10], step:[ 1599/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.0002437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:38,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43594 samples/s/p 0:00:38 } +2024-07-26 01:13:41,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1601/ 1625], loss: 1.187, per_step_time: 1473ms, lr: 1.0002083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:41,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.42829 samples/s/p 0:00:35 } +2024-07-26 01:13:44,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1603/ 1625], loss: 1.037, per_step_time: 1471ms, lr: 1.0001771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:44,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43740 samples/s/p 0:00:32 } +2024-07-26 01:13:47,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1605/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 1.0001469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:47,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43515 samples/s/p 0:00:29 } +2024-07-26 01:13:50,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1607/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 1.0001202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:50,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43280 samples/s/p 0:00:26 } +2024-07-26 01:13:53,545 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1609/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 1.0000967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:53,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43474 samples/s/p 0:00:23 } +2024-07-26 01:13:56,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1611/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.0000743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:56,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43599 samples/s/p 0:00:20 } +2024-07-26 01:13:59,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1613/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.0000579e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:59,448 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43377 samples/s/p 0:00:17 } +2024-07-26 01:14:02,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1615/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 1.0000398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:02,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.42836 samples/s/p 0:00:14 } +2024-07-26 01:14:05,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1617/ 1625], loss: 0.922, per_step_time: 1471ms, lr: 1.0000276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:05,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.43544 samples/s/p 0:00:11 } 
+2024-07-26 01:14:08,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1619/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 1.0000164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:08,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.43417 samples/s/p 0:00:08 } +2024-07-26 01:14:11,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1621/ 1625], loss: 1.082, per_step_time: 1473ms, lr: 1.0000086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:11,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.42850 samples/s/p 0:00:05 } +2024-07-26 01:14:14,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1623/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.0000026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:14,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.43313 samples/s/p 0:00:02 } +2024-07-26 01:14:17,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1625/ 1625], loss: 1.078, per_step_time: 1473ms, lr: 1.0000009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:17,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |██████████████████████████████████████████████████| 5.43075 samples/s/p 0:00:00 } +2024-07-26 01:14:17,187 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-26 01:14:48,629 - mindformers[mindformers/trainer/base_trainer.py:779] - INFO - .........Training Over!............. 
diff --git "a/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\346\227\245\345\277\227\346\226\207\344\273\266/worker_1.log" "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\346\227\245\345\277\227\346\226\207\344\273\266/worker_1.log" new file mode 100644 index 00000000..0c5bba57 --- /dev/null +++ "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\346\227\245\345\277\227\346\226\207\344\273\266/worker_1.log" @@ -0,0 +1,16898 @@ +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. + return self._float_to_str(self.smallest_subnormal) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. 
+ return self._float_to_str(self.smallest_subnormal) +[WARNING] DISTRIBUTED(62193,ffff990a5010,python):2024-07-25-18:09:19.659.051 [mindspore/ccsrc/distributed/rpc/tcp/tcp_comm.cc:464] Connect] Waiting for the state of the connection to 127.0.0.1:8118 to be connected...Retry number: 1 +[WARNING] DISTRIBUTED(62193,ffff990a5010,python):2024-07-25-18:09:20.659.923 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:194] BuildCluster] Topology build timed out., retry(1/200). +[WARNING] DISTRIBUTED(62193,ffff990a5010,python):2024-07-25-18:09:23.660.145 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:194] BuildCluster] Topology build timed out., retry(2/200). +[WARNING] DISTRIBUTED(62193,ffff990a5010,python):2024-07-25-18:09:26.660.347 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:196] BuildCluster] Cluster is successfully initialized. +[WARNING] DISTRIBUTED(62193,ffff990a5010,python):2024-07-25-18:09:26.660.671 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:260] PostProcess] This node 1 rank id: 1 +[WARNING] DISTRIBUTED(62193,ffff990a5010,python):2024-07-25-18:09:52.264.488 [mindspore/ccsrc/distributed/collective/collective_manager.cc:259] CreateCommunicationGroup] Start to create communication group: hccl_world_group [const vector]{0, 1, 2, 3} +[WARNING] DISTRIBUTED(62193,ffff990a5010,python):2024-07-25-18:09:52.265.090 [mindspore/ccsrc/distributed/collective/collective_manager.cc:335] CreateCommunicationGroup] Begin initialize communication group on the device side: hccl_world_group +[WARNING] DISTRIBUTED(62193,ffff990a5010,python):2024-07-25-18:09:53.345.503 [mindspore/ccsrc/distributed/collective/collective_manager.cc:345] CreateCommunicationGroup] End initialize communication group on the device side: hccl_world_group +2024-07-25 18:09:53,349 - mindformers[mindformers/tools/utils.py:168] - INFO - set strategy path to './output/strategy/ckpt_strategy_rank_1.ckpt' +2024-07-25 18:09:53,386 - 
mindformers[mindformers/trainer/trainer.py:919] - INFO - Load configs in /home/ma-user/work/MindFormers/mindformers/configs/gpt2/run_gpt2.yaml to build trainer. +2024-07-25 18:09:53,386 - mindformers[mindformers/trainer/trainer.py:949] - INFO - ..........Init Config.......... +2024-07-25 18:09:53,386 - mindformers[mindformers/core/parallel_config.py:45] - INFO - initial recompute_config from dict: {'recompute': True, 'select_recompute': False, 'parallel_optimizer_comm_recompute': False, 'mp_comm_recompute': True, 'recompute_slice_activation': True} +2024-07-25 18:09:53,387 - mindformers[mindformers/core/parallel_config.py:51] - INFO - initial parallel_config from dict: {'data_parallel': 1, 'model_parallel': 4, 'pipeline_stage': 1, 'use_seq_parallel': False, 'micro_batch_num': 1, 'vocab_emb_dp': True, 'gradient_aggregation_group': 4} +2024-07-25 18:09:53,388 - mindformers[mindformers/tools/utils.py:153] - INFO - set output path to '/home/ma-user/work/MindFormers/mindformers/research/output' +2024-07-25 18:09:53,388 - mindformers[mindformers/trainer/base_trainer.py:85] - INFO - Now Running Task is: text_generation, Model is: llama3_8b +2024-07-25 18:09:53,388 - mindformers[mindformers/trainer/base_trainer.py:111] - WARNING - Input model name is not in the supported list or unspecified. 
+2024-07-25 18:09:53,389 - mindformers[mindformers/trainer/base_trainer.py:112] - WARNING - See the list of supported task and model name: ['baichuan2_13b', 'baichuan2_7b', 'baichuan_7b', 'bloom_176b', 'bloom_560m', 'bloom_65b', 'bloom_7.1b', 'codegeex2_6b', 'codellama_34b', 'common', 'deepseek_33b', 'glm2_6b', 'glm2_6b_lora', 'glm2_6b_ptuning2', 'glm3_6b', 'glm_6b', 'glm_6b_chat', 'glm_6b_lora', 'glm_6b_lora_chat', 'gpt2', 'gpt2_13b', 'gpt2_52b', 'gpt2_lora', 'gpt2_xl', 'gpt2_xl_lora', 'internlm_7b', 'internlm_7b_lora', 'llama2_13b', 'llama2_70b', 'llama2_7b', 'llama_13b', 'llama_65b', 'llama_7b', 'llama_7b_lora', 'pangualpha_13b', 'pangualpha_2_6b', 'qwen_7b', 'qwen_7b_lora', 'skywork_13b', 'yi_34b', 'yi_6b', 'ziya_13b'] +2024-07-25 18:09:53,389 - mindformers[mindformers/trainer/base_trainer.py:113] - WARNING - The default model config: /home/ma-user/work/MindFormers/mindformers/configs/gpt2/run_gpt2.yaml will now be used for the text_generation task +2024-07-25 18:09:53,389 - mindformers[mindformers/trainer/trainer.py:1004] - INFO - ..........Init Model.......... +2024-07-25 18:09:53,390 - mindformers[mindformers/trainer/trainer.py:1027] - INFO - ..........Init Train Dataset.......... +2024-07-25 18:09:53,390 - mindformers[mindformers/trainer/trainer.py:335] - INFO - ==========Trainer Init Success!========== +2024-07-25 18:09:53,390 - mindformers[mindformers/trainer/trainer.py:476] - WARNING - The `finetune_checkpoint` will be deprecated. Please use `resume_from_checkpoint` instead. +2024-07-25 18:09:53,390 - mindformers[mindformers/trainer/trainer.py:1004] - INFO - ..........Init Model.......... 
+2024-07-25 18:09:53,391 - mindformers[mindformers/trainer/base_trainer.py:176] - INFO - The current parallel mode is semi_auto_parallel, full batch is True,so global batch size will be changed: global_batch_size = batch_size * data_parallel * micro_batch_interleave_num * gradient_accumulation_steps = 32 = 32 * 1 * 1 * 1 +2024-07-25 18:09:53,391 - mindformers[mindformers/trainer/base_trainer.py:624] - INFO - .........Build Dataset For Train.......... +2024-07-25 18:09:53,391 - mindformers[mindformers/trainer/base_trainer.py:353] - INFO - .........Build Dataset From Config.......... +2024-07-25 18:09:53,391 - mindformers[mindformers/dataset/causal_language_model_dataset.py:166] - INFO - Now Create Causal Language Model Dataset. +2024-07-25 18:09:53,399 - mindformers[mindformers/trainer/base_trainer.py:626] - INFO - Create train dataset finish, dataset size:1625 +2024-07-25 18:09:53,400 - mindformers[mindformers/trainer/utils.py:171] - INFO - Will be Training epochs:10, sink_size:2 +2024-07-25 18:09:53,400 - mindformers[mindformers/trainer/utils.py:173] - INFO - Create training dataset finish, dataset size:1625 +2024-07-25 18:09:53,400 - mindformers[mindformers/trainer/base_trainer.py:656] - INFO - .........Build Net For Train.......... +2024-07-25 18:09:53,400 - mindformers[mindformers/trainer/base_trainer.py:387] - INFO - .........Build Network From Config.......... +2024-07-25 18:09:53,401 - mindformers[mindformers/version_control.py:61] - INFO - The Cell Reuse compilation acceleration feature is not supported when the environment variable ENABLE_CELL_REUSE is 0 or MindSpore version is earlier than 2.1.0 or stand_alone mode or pipeline_stages <= 1 +2024-07-25 18:09:53,402 - mindformers[mindformers/version_control.py:65] - INFO - +The current ENABLE_CELL_REUSE=0, please set the environment variable as follows: +export ENABLE_CELL_REUSE=1 to enable the Cell Reuse compilation acceleration feature. 
+2024-07-25 18:09:53,402 - mindformers[mindformers/version_control.py:74] - INFO - The Cell Reuse compilation acceleration feature only works in pipeline parallel mode(pipeline_stage>1).Current pipeline stage=1, the feature is disabled by default. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:09:53.404.314 [/home/ma-user/work/MindFormers/mindformers/mindformers/modules/transformer/op_parallel_config.py:244] The optimizer shard True in auto_parallel_context is not equal to the optimizer_shard None in the OpParallelConfig. Please check the optimizer_shard to make them consistent. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:09:53.407.147 [/home/ma-user/work/MindFormers/mindformers/mindformers/modules/transformer/op_parallel_config.py:244] The optimizer shard True in auto_parallel_context is not equal to the optimizer_shard None in the OpParallelConfig. Please check the optimizer_shard to make them consistent. +2024-07-25 18:09:53,521 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:09:53.522.768 [mindspore/common/_decorator.py:40] 'Parameter' is deprecated from version 2.3 and will be removed in a future version, use 'add_pipeline_stage' instead. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:09:53.522.909 [mindspore/common/parameter.py:806] This interface may be deleted in the future. 
+2024-07-25 18:09:53,542 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,563 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,585 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,607 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,628 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,649 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,670 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,691 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,711 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:54,194 - mindformers[mindformers/models/modeling_utils.py:1438] - INFO - model built, but weights is unloaded, since the config has no checkpoint_name_or_path attribute or checkpoint_name_or_path is None. +2024-07-25 18:09:54,393 - mindformers[mindformers/models/modeling_utils.py:1438] - INFO - model built, but weights is unloaded, since the config has no checkpoint_name_or_path attribute or checkpoint_name_or_path is None. +2024-07-25 18:09:54,416 - mindformers[mindformers/trainer/base_trainer.py:543] - INFO - Network Parameters: 3407872. +2024-07-25 18:09:54,416 - mindformers[mindformers/trainer/base_trainer.py:678] - INFO - .........Build Optimizer For Train.......... 
+2024-07-25 18:09:54,416 - mindformers[mindformers/trainer/base_trainer.py:426] - INFO - .........Build Optimizer From Config.......... +2024-07-25 18:09:54,416 - mindformers[mindformers/trainer/base_trainer.py:459] - INFO - .........Build LR Schedule From Config.......... +2024-07-25 18:09:54,422 - mindformers[mindformers/trainer/optimizer_grouped_parameters.py:74] - WARNING - dynamic_lr_schedule will be reset and invalid when layer_scale is False. +2024-07-25 18:09:54,426 - mindformers[mindformers/trainer/optimizer_grouped_parameters.py:113] - INFO - Param groups = { + "decay": { + "weight_decay": 0.0, + "params": [ + "model.layers.0.attention.wq.mindpet_delta_lora_a", + "model.layers.0.attention.wq.mindpet_delta_lora_b", + "model.layers.0.attention.wv.mindpet_delta_lora_a", + "model.layers.0.attention.wv.mindpet_delta_lora_b", + "model.layers.1.attention.wq.mindpet_delta_lora_a", + "model.layers.1.attention.wq.mindpet_delta_lora_b", + "model.layers.1.attention.wv.mindpet_delta_lora_a", + "model.layers.1.attention.wv.mindpet_delta_lora_b", + "model.layers.2.attention.wq.mindpet_delta_lora_a", + "model.layers.2.attention.wq.mindpet_delta_lora_b", + "model.layers.2.attention.wv.mindpet_delta_lora_a", + "model.layers.2.attention.wv.mindpet_delta_lora_b", + "model.layers.3.attention.wq.mindpet_delta_lora_a", + "model.layers.3.attention.wq.mindpet_delta_lora_b", + "model.layers.3.attention.wv.mindpet_delta_lora_a", + "model.layers.3.attention.wv.mindpet_delta_lora_b", + "model.layers.4.attention.wq.mindpet_delta_lora_a", + "model.layers.4.attention.wq.mindpet_delta_lora_b", + "model.layers.4.attention.wv.mindpet_delta_lora_a", + "model.layers.4.attention.wv.mindpet_delta_lora_b", + "model.layers.5.attention.wq.mindpet_delta_lora_a", + "model.layers.5.attention.wq.mindpet_delta_lora_b", + "model.layers.5.attention.wv.mindpet_delta_lora_a", + "model.layers.5.attention.wv.mindpet_delta_lora_b", + "model.layers.6.attention.wq.mindpet_delta_lora_a", + 
"model.layers.6.attention.wq.mindpet_delta_lora_b", + "model.layers.6.attention.wv.mindpet_delta_lora_a", + "model.layers.6.attention.wv.mindpet_delta_lora_b", + "model.layers.7.attention.wq.mindpet_delta_lora_a", + "model.layers.7.attention.wq.mindpet_delta_lora_b", + "model.layers.7.attention.wv.mindpet_delta_lora_a", + "model.layers.7.attention.wv.mindpet_delta_lora_b", + "model.layers.8.attention.wq.mindpet_delta_lora_a", + "model.layers.8.attention.wq.mindpet_delta_lora_b", + "model.layers.8.attention.wv.mindpet_delta_lora_a", + "model.layers.8.attention.wv.mindpet_delta_lora_b", + "model.layers.9.attention.wq.mindpet_delta_lora_a", + "model.layers.9.attention.wq.mindpet_delta_lora_b", + "model.layers.9.attention.wv.mindpet_delta_lora_a", + "model.layers.9.attention.wv.mindpet_delta_lora_b", + "model.layers.10.attention.wq.mindpet_delta_lora_a", + "model.layers.10.attention.wq.mindpet_delta_lora_b", + "model.layers.10.attention.wv.mindpet_delta_lora_a", + "model.layers.10.attention.wv.mindpet_delta_lora_b", + "model.layers.11.attention.wq.mindpet_delta_lora_a", + "model.layers.11.attention.wq.mindpet_delta_lora_b", + "model.layers.11.attention.wv.mindpet_delta_lora_a", + "model.layers.11.attention.wv.mindpet_delta_lora_b", + "model.layers.12.attention.wq.mindpet_delta_lora_a", + "model.layers.12.attention.wq.mindpet_delta_lora_b", + "model.layers.12.attention.wv.mindpet_delta_lora_a", + "model.layers.12.attention.wv.mindpet_delta_lora_b", + "model.layers.13.attention.wq.mindpet_delta_lora_a", + "model.layers.13.attention.wq.mindpet_delta_lora_b", + "model.layers.13.attention.wv.mindpet_delta_lora_a", + "model.layers.13.attention.wv.mindpet_delta_lora_b", + "model.layers.14.attention.wq.mindpet_delta_lora_a", + "model.layers.14.attention.wq.mindpet_delta_lora_b", + "model.layers.14.attention.wv.mindpet_delta_lora_a", + "model.layers.14.attention.wv.mindpet_delta_lora_b", + "model.layers.15.attention.wq.mindpet_delta_lora_a", + 
"model.layers.15.attention.wq.mindpet_delta_lora_b", + "model.layers.15.attention.wv.mindpet_delta_lora_a", + "model.layers.15.attention.wv.mindpet_delta_lora_b", + "model.layers.16.attention.wq.mindpet_delta_lora_a", + "model.layers.16.attention.wq.mindpet_delta_lora_b", + "model.layers.16.attention.wv.mindpet_delta_lora_a", + "model.layers.16.attention.wv.mindpet_delta_lora_b", + "model.layers.17.attention.wq.mindpet_delta_lora_a", + "model.layers.17.attention.wq.mindpet_delta_lora_b", + "model.layers.17.attention.wv.mindpet_delta_lora_a", + "model.layers.17.attention.wv.mindpet_delta_lora_b", + "model.layers.18.attention.wq.mindpet_delta_lora_a", + "model.layers.18.attention.wq.mindpet_delta_lora_b", + "model.layers.18.attention.wv.mindpet_delta_lora_a", + "model.layers.18.attention.wv.mindpet_delta_lora_b", + "model.layers.19.attention.wq.mindpet_delta_lora_a", + "model.layers.19.attention.wq.mindpet_delta_lora_b", + "model.layers.19.attention.wv.mindpet_delta_lora_a", + "model.layers.19.attention.wv.mindpet_delta_lora_b", + "model.layers.20.attention.wq.mindpet_delta_lora_a", + "model.layers.20.attention.wq.mindpet_delta_lora_b", + "model.layers.20.attention.wv.mindpet_delta_lora_a", + "model.layers.20.attention.wv.mindpet_delta_lora_b", + "model.layers.21.attention.wq.mindpet_delta_lora_a", + "model.layers.21.attention.wq.mindpet_delta_lora_b", + "model.layers.21.attention.wv.mindpet_delta_lora_a", + "model.layers.21.attention.wv.mindpet_delta_lora_b", + "model.layers.22.attention.wq.mindpet_delta_lora_a", + "model.layers.22.attention.wq.mindpet_delta_lora_b", + "model.layers.22.attention.wv.mindpet_delta_lora_a", + "model.layers.22.attention.wv.mindpet_delta_lora_b", + "model.layers.23.attention.wq.mindpet_delta_lora_a", + "model.layers.23.attention.wq.mindpet_delta_lora_b", + "model.layers.23.attention.wv.mindpet_delta_lora_a", + "model.layers.23.attention.wv.mindpet_delta_lora_b", + "model.layers.24.attention.wq.mindpet_delta_lora_a", + 
"model.layers.24.attention.wq.mindpet_delta_lora_b", + "model.layers.24.attention.wv.mindpet_delta_lora_a", + "model.layers.24.attention.wv.mindpet_delta_lora_b", + "model.layers.25.attention.wq.mindpet_delta_lora_a", + "model.layers.25.attention.wq.mindpet_delta_lora_b", + "model.layers.25.attention.wv.mindpet_delta_lora_a", + "model.layers.25.attention.wv.mindpet_delta_lora_b", + "model.layers.26.attention.wq.mindpet_delta_lora_a", + "model.layers.26.attention.wq.mindpet_delta_lora_b", + "model.layers.26.attention.wv.mindpet_delta_lora_a", + "model.layers.26.attention.wv.mindpet_delta_lora_b", + "model.layers.27.attention.wq.mindpet_delta_lora_a", + "model.layers.27.attention.wq.mindpet_delta_lora_b", + "model.layers.27.attention.wv.mindpet_delta_lora_a", + "model.layers.27.attention.wv.mindpet_delta_lora_b", + "model.layers.28.attention.wq.mindpet_delta_lora_a", + "model.layers.28.attention.wq.mindpet_delta_lora_b", + "model.layers.28.attention.wv.mindpet_delta_lora_a", + "model.layers.28.attention.wv.mindpet_delta_lora_b", + "model.layers.29.attention.wq.mindpet_delta_lora_a", + "model.layers.29.attention.wq.mindpet_delta_lora_b", + "model.layers.29.attention.wv.mindpet_delta_lora_a", + "model.layers.29.attention.wv.mindpet_delta_lora_b", + "model.layers.30.attention.wq.mindpet_delta_lora_a", + "model.layers.30.attention.wq.mindpet_delta_lora_b", + "model.layers.30.attention.wv.mindpet_delta_lora_a", + "model.layers.30.attention.wv.mindpet_delta_lora_b", + "model.layers.31.attention.wq.mindpet_delta_lora_a", + "model.layers.31.attention.wq.mindpet_delta_lora_b", + "model.layers.31.attention.wv.mindpet_delta_lora_a", + "model.layers.31.attention.wv.mindpet_delta_lora_b" + ] + } +} +2024-07-25 18:09:54,527 - mindformers[mindformers/trainer/base_trainer.py:683] - INFO - .........Build Running Wrapper From Config For Train.......... 
+2024-07-25 18:09:54,527 - mindformers[mindformers/trainer/base_trainer.py:496] - INFO - .........Build Model Wrapper for Train From Config.......... +2024-07-25 18:09:54,534 - mindformers[mindformers/trainer/base_trainer.py:687] - INFO - .........Build Callbacks For Train.......... +2024-07-25 18:09:54,536 - mindformers[mindformers/core/callback/callback.py:533] - INFO - Integrated_save is changed to False when using auto_parallel. +2024-07-25 18:09:54,537 - mindformers[mindformers/trainer/base_trainer.py:721] - INFO - .........Starting Init Train Model.......... +2024-07-25 18:09:54,538 - mindformers[mindformers/trainer/utils.py:736] - INFO - ............Start load checkpoint from checkpoint............ +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:37.429.10 [mindspore/train/serialization.py:1369] model.tok_embeddings.embedding_weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:42.182.92 [mindspore/train/serialization.py:1369] model.layers.0.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:42.190.44 [mindspore/train/serialization.py:1369] model.layers.0.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:42.195.00 [mindspore/train/serialization.py:1369] model.layers.0.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:42.158.196 [mindspore/train/serialization.py:1369] model.layers.0.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:42.205.166 [mindspore/train/serialization.py:1369] model.layers.0.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:42.248.018 [mindspore/train/serialization.py:1369] model.layers.0.attention.wo.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:42.398.538 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:42.980.328 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:43.564.941 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:44.145.208 [mindspore/train/serialization.py:1369] model.layers.1.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:44.146.173 [mindspore/train/serialization.py:1369] model.layers.1.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:44.146.616 [mindspore/train/serialization.py:1369] model.layers.1.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:44.286.137 [mindspore/train/serialization.py:1369] model.layers.1.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:44.324.032 [mindspore/train/serialization.py:1369] model.layers.1.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:44.367.161 [mindspore/train/serialization.py:1369] model.layers.1.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:44.531.174 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w1.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:45.116.020 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:45.702.129 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:46.282.448 [mindspore/train/serialization.py:1369] model.layers.2.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:46.283.347 [mindspore/train/serialization.py:1369] model.layers.2.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:46.283.791 [mindspore/train/serialization.py:1369] model.layers.2.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:46.431.821 [mindspore/train/serialization.py:1369] model.layers.2.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:46.471.293 [mindspore/train/serialization.py:1369] model.layers.2.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:46.513.446 [mindspore/train/serialization.py:1369] model.layers.2.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:46.651.578 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:47.234.143 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w2.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:47.818.354 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:48.386.328 [mindspore/train/serialization.py:1369] model.layers.3.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:48.387.191 [mindspore/train/serialization.py:1369] model.layers.3.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:48.387.619 [mindspore/train/serialization.py:1369] model.layers.3.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:48.552.910 [mindspore/train/serialization.py:1369] model.layers.3.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:48.592.449 [mindspore/train/serialization.py:1369] model.layers.3.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:48.631.263 [mindspore/train/serialization.py:1369] model.layers.3.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:48.810.674 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:49.447.476 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:50.327.73 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:50.605.765 [mindspore/train/serialization.py:1369] model.layers.4.ffn_norm.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:50.606.584 [mindspore/train/serialization.py:1369] model.layers.4.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:50.607.037 [mindspore/train/serialization.py:1369] model.layers.4.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:50.765.199 [mindspore/train/serialization.py:1369] model.layers.4.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:50.805.765 [mindspore/train/serialization.py:1369] model.layers.4.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:50.847.583 [mindspore/train/serialization.py:1369] model.layers.4.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:51.226.12 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:51.665.216 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:52.271.568 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:52.854.610 [mindspore/train/serialization.py:1369] model.layers.5.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:52.855.519 [mindspore/train/serialization.py:1369] model.layers.5.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:52.856.047 [mindspore/train/serialization.py:1369] model.layers.5.attention.wq.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:53.290.44 [mindspore/train/serialization.py:1369] model.layers.5.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:53.714.07 [mindspore/train/serialization.py:1369] model.layers.5.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:53.111.666 [mindspore/train/serialization.py:1369] model.layers.5.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:53.286.724 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:53.924.160 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:54.529.883 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:55.125.066 [mindspore/train/serialization.py:1369] model.layers.6.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:55.126.087 [mindspore/train/serialization.py:1369] model.layers.6.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:55.126.564 [mindspore/train/serialization.py:1369] model.layers.6.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:55.334.957 [mindspore/train/serialization.py:1369] model.layers.6.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:55.377.320 [mindspore/train/serialization.py:1369] model.layers.6.attention.wv.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:55.418.152 [mindspore/train/serialization.py:1369] model.layers.6.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:55.592.342 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:56.187.653 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:56.782.915 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:57.374.493 [mindspore/train/serialization.py:1369] model.layers.7.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:57.375.364 [mindspore/train/serialization.py:1369] model.layers.7.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:57.375.803 [mindspore/train/serialization.py:1369] model.layers.7.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:57.547.403 [mindspore/train/serialization.py:1369] model.layers.7.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:57.591.756 [mindspore/train/serialization.py:1369] model.layers.7.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:57.647.076 [mindspore/train/serialization.py:1369] model.layers.7.attention.wo.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:57.830.899 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:58.429.278 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:59.256.97 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:59.618.082 [mindspore/train/serialization.py:1369] model.layers.8.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:59.619.013 [mindspore/train/serialization.py:1369] model.layers.8.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:59.619.468 [mindspore/train/serialization.py:1369] model.layers.8.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:59.798.847 [mindspore/train/serialization.py:1369] model.layers.8.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:59.855.599 [mindspore/train/serialization.py:1369] model.layers.8.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:11:59.911.774 [mindspore/train/serialization.py:1369] model.layers.8.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:00.108.707 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w1.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:00.713.788 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:01.302.079 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:01.886.144 [mindspore/train/serialization.py:1369] model.layers.9.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:01.887.093 [mindspore/train/serialization.py:1369] model.layers.9.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:01.887.525 [mindspore/train/serialization.py:1369] model.layers.9.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:02.613.96 [mindspore/train/serialization.py:1369] model.layers.9.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:02.113.884 [mindspore/train/serialization.py:1369] model.layers.9.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:02.165.175 [mindspore/train/serialization.py:1369] model.layers.9.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:02.340.584 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:02.922.908 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w2.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:03.499.771 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:04.706.31 [mindspore/train/serialization.py:1369] model.layers.10.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:04.715.90 [mindspore/train/serialization.py:1369] model.layers.10.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:04.720.33 [mindspore/train/serialization.py:1369] model.layers.10.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:04.249.306 [mindspore/train/serialization.py:1369] model.layers.10.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:04.303.593 [mindspore/train/serialization.py:1369] model.layers.10.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:04.354.591 [mindspore/train/serialization.py:1369] model.layers.10.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:04.529.999 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:05.102.915 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:05.683.181 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w3.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:06.255.959 [mindspore/train/serialization.py:1369] model.layers.11.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:06.256.909 [mindspore/train/serialization.py:1369] model.layers.11.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:06.257.426 [mindspore/train/serialization.py:1369] model.layers.11.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:06.430.246 [mindspore/train/serialization.py:1369] model.layers.11.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:06.478.236 [mindspore/train/serialization.py:1369] model.layers.11.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:06.525.298 [mindspore/train/serialization.py:1369] model.layers.11.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:06.713.017 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:07.285.800 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:07.850.617 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:08.429.091 [mindspore/train/serialization.py:1369] model.layers.12.ffn_norm.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:08.430.053 [mindspore/train/serialization.py:1369] model.layers.12.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:08.430.553 [mindspore/train/serialization.py:1369] model.layers.12.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:08.600.711 [mindspore/train/serialization.py:1369] model.layers.12.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:08.655.258 [mindspore/train/serialization.py:1369] model.layers.12.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:08.698.440 [mindspore/train/serialization.py:1369] model.layers.12.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:08.872.770 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:09.483.047 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:10.774.55 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:10.685.892 [mindspore/train/serialization.py:1369] model.layers.13.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:10.686.804 [mindspore/train/serialization.py:1369] model.layers.13.attention_norm.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:10.687.263 [mindspore/train/serialization.py:1369] model.layers.13.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:10.872.581 [mindspore/train/serialization.py:1369] model.layers.13.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:10.921.694 [mindspore/train/serialization.py:1369] model.layers.13.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:10.970.078 [mindspore/train/serialization.py:1369] model.layers.13.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:11.141.632 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:11.756.077 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:12.349.128 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:12.924.781 [mindspore/train/serialization.py:1369] model.layers.14.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:12.925.699 [mindspore/train/serialization.py:1369] model.layers.14.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:12.926.140 [mindspore/train/serialization.py:1369] model.layers.14.attention.wq.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:13.107.257 [mindspore/train/serialization.py:1369] model.layers.14.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:13.158.564 [mindspore/train/serialization.py:1369] model.layers.14.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:13.209.701 [mindspore/train/serialization.py:1369] model.layers.14.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:13.384.918 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:13.981.234 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:14.561.507 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:15.151.601 [mindspore/train/serialization.py:1369] model.layers.15.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:15.152.502 [mindspore/train/serialization.py:1369] model.layers.15.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:15.152.947 [mindspore/train/serialization.py:1369] model.layers.15.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:15.327.646 [mindspore/train/serialization.py:1369] model.layers.15.attention.wk.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:15.378.212 [mindspore/train/serialization.py:1369] model.layers.15.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:15.436.265 [mindspore/train/serialization.py:1369] model.layers.15.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:15.622.030 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:16.241.500 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:16.830.281 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:17.425.310 [mindspore/train/serialization.py:1369] model.layers.16.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:17.426.174 [mindspore/train/serialization.py:1369] model.layers.16.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:17.426.607 [mindspore/train/serialization.py:1369] model.layers.16.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:17.591.840 [mindspore/train/serialization.py:1369] model.layers.16.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:17.661.151 [mindspore/train/serialization.py:1369] model.layers.16.attention.wv.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:17.706.859 [mindspore/train/serialization.py:1369] model.layers.16.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:17.885.141 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:18.486.870 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:19.819.49 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:19.659.428 [mindspore/train/serialization.py:1369] model.layers.17.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:19.660.324 [mindspore/train/serialization.py:1369] model.layers.17.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:19.660.764 [mindspore/train/serialization.py:1369] model.layers.17.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:19.828.202 [mindspore/train/serialization.py:1369] model.layers.17.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:19.878.227 [mindspore/train/serialization.py:1369] model.layers.17.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:19.923.120 [mindspore/train/serialization.py:1369] model.layers.17.attention.wo.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:20.972.67 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:20.687.600 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:21.266.974 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:21.849.806 [mindspore/train/serialization.py:1369] model.layers.18.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:21.850.723 [mindspore/train/serialization.py:1369] model.layers.18.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:21.851.170 [mindspore/train/serialization.py:1369] model.layers.18.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:22.244.39 [mindspore/train/serialization.py:1369] model.layers.18.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:22.798.57 [mindspore/train/serialization.py:1369] model.layers.18.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:22.134.776 [mindspore/train/serialization.py:1369] model.layers.18.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:22.317.861 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w1.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:22.915.407 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:23.500.759 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:24.925.07 [mindspore/train/serialization.py:1369] model.layers.19.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:24.933.98 [mindspore/train/serialization.py:1369] model.layers.19.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:24.938.26 [mindspore/train/serialization.py:1369] model.layers.19.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:24.263.128 [mindspore/train/serialization.py:1369] model.layers.19.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:24.325.144 [mindspore/train/serialization.py:1369] model.layers.19.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:24.375.009 [mindspore/train/serialization.py:1369] model.layers.19.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:24.560.076 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:25.184.648 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w2.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:25.786.703 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:26.396.732 [mindspore/train/serialization.py:1369] model.layers.20.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:26.397.638 [mindspore/train/serialization.py:1369] model.layers.20.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:26.398.080 [mindspore/train/serialization.py:1369] model.layers.20.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:26.576.707 [mindspore/train/serialization.py:1369] model.layers.20.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:26.629.232 [mindspore/train/serialization.py:1369] model.layers.20.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:26.705.857 [mindspore/train/serialization.py:1369] model.layers.20.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:26.896.699 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:27.512.005 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:28.168.843 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w3.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:28.777.364 [mindspore/train/serialization.py:1369] model.layers.21.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:28.778.309 [mindspore/train/serialization.py:1369] model.layers.21.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:28.778.754 [mindspore/train/serialization.py:1369] model.layers.21.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:28.984.640 [mindspore/train/serialization.py:1369] model.layers.21.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:29.381.72 [mindspore/train/serialization.py:1369] model.layers.21.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:29.929.55 [mindspore/train/serialization.py:1369] model.layers.21.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:29.285.405 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:29.897.193 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:30.510.711 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:31.119.020 [mindspore/train/serialization.py:1369] model.layers.22.ffn_norm.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:31.119.950 [mindspore/train/serialization.py:1369] model.layers.22.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:31.120.411 [mindspore/train/serialization.py:1369] model.layers.22.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:31.298.352 [mindspore/train/serialization.py:1369] model.layers.22.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:31.355.342 [mindspore/train/serialization.py:1369] model.layers.22.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:31.433.376 [mindspore/train/serialization.py:1369] model.layers.22.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:31.616.943 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:32.218.324 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:32.831.436 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:33.442.126 [mindspore/train/serialization.py:1369] model.layers.23.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:33.443.054 [mindspore/train/serialization.py:1369] model.layers.23.attention_norm.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:33.443.505 [mindspore/train/serialization.py:1369] model.layers.23.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:33.647.426 [mindspore/train/serialization.py:1369] model.layers.23.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:33.704.147 [mindspore/train/serialization.py:1369] model.layers.23.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:33.755.430 [mindspore/train/serialization.py:1369] model.layers.23.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:33.945.494 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:34.555.636 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:35.163.550 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:35.770.545 [mindspore/train/serialization.py:1369] model.layers.24.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:35.771.407 [mindspore/train/serialization.py:1369] model.layers.24.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:35.771.843 [mindspore/train/serialization.py:1369] model.layers.24.attention.wq.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:35.957.685 [mindspore/train/serialization.py:1369] model.layers.24.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:36.129.90 [mindspore/train/serialization.py:1369] model.layers.24.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:36.654.49 [mindspore/train/serialization.py:1369] model.layers.24.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:36.332.854 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:36.945.564 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:37.540.884 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:38.180.433 [mindspore/train/serialization.py:1369] model.layers.25.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:38.181.369 [mindspore/train/serialization.py:1369] model.layers.25.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:38.181.819 [mindspore/train/serialization.py:1369] model.layers.25.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:38.414.659 [mindspore/train/serialization.py:1369] model.layers.25.attention.wk.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:38.472.612 [mindspore/train/serialization.py:1369] model.layers.25.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:38.522.640 [mindspore/train/serialization.py:1369] model.layers.25.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:38.736.544 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:39.327.214 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:39.972.016 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:40.597.960 [mindspore/train/serialization.py:1369] model.layers.26.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:40.599.158 [mindspore/train/serialization.py:1369] model.layers.26.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:40.599.613 [mindspore/train/serialization.py:1369] model.layers.26.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:40.772.908 [mindspore/train/serialization.py:1369] model.layers.26.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:40.824.750 [mindspore/train/serialization.py:1369] model.layers.26.attention.wv.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:40.876.134 [mindspore/train/serialization.py:1369] model.layers.26.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:41.561.92 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:41.659.602 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:42.273.267 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:42.889.471 [mindspore/train/serialization.py:1369] model.layers.27.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:42.890.395 [mindspore/train/serialization.py:1369] model.layers.27.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:42.890.846 [mindspore/train/serialization.py:1369] model.layers.27.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:43.646.31 [mindspore/train/serialization.py:1369] model.layers.27.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:43.130.851 [mindspore/train/serialization.py:1369] model.layers.27.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:43.182.449 [mindspore/train/serialization.py:1369] model.layers.27.attention.wo.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:43.353.791 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:43.959.697 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:44.553.330 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:45.180.660 [mindspore/train/serialization.py:1369] model.layers.28.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:45.181.592 [mindspore/train/serialization.py:1369] model.layers.28.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:45.182.050 [mindspore/train/serialization.py:1369] model.layers.28.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:45.357.711 [mindspore/train/serialization.py:1369] model.layers.28.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:45.418.879 [mindspore/train/serialization.py:1369] model.layers.28.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:45.467.484 [mindspore/train/serialization.py:1369] model.layers.28.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:45.665.496 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w1.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:46.253.260 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:46.836.740 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:47.433.213 [mindspore/train/serialization.py:1369] model.layers.29.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:47.434.157 [mindspore/train/serialization.py:1369] model.layers.29.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:47.434.604 [mindspore/train/serialization.py:1369] model.layers.29.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:47.611.603 [mindspore/train/serialization.py:1369] model.layers.29.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:47.663.378 [mindspore/train/serialization.py:1369] model.layers.29.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:47.714.613 [mindspore/train/serialization.py:1369] model.layers.29.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:47.913.061 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:48.531.130 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w2.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:49.115.619 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:49.746.818 [mindspore/train/serialization.py:1369] model.layers.30.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:49.747.699 [mindspore/train/serialization.py:1369] model.layers.30.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:49.748.129 [mindspore/train/serialization.py:1369] model.layers.30.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:49.940.044 [mindspore/train/serialization.py:1369] model.layers.30.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:50.482.79 [mindspore/train/serialization.py:1369] model.layers.30.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:50.982.86 [mindspore/train/serialization.py:1369] model.layers.30.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:50.319.447 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:50.921.991 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:51.577.124 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w3.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:52.372.995 [mindspore/train/serialization.py:1369] model.layers.31.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:52.374.223 [mindspore/train/serialization.py:1369] model.layers.31.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:52.374.679 [mindspore/train/serialization.py:1369] model.layers.31.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:52.552.961 [mindspore/train/serialization.py:1369] model.layers.31.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:52.601.803 [mindspore/train/serialization.py:1369] model.layers.31.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:52.651.373 [mindspore/train/serialization.py:1369] model.layers.31.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:52.833.362 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:53.434.113 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:54.392.74 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:54.642.240 [mindspore/train/serialization.py:1369] model.norm_out.weight is not init while load ckpt. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:12:54.643.168 [mindspore/train/serialization.py:1369] lm_head.weight is not init while load ckpt. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:13:27.448.179 [mindspore/train/serialization.py:195] The type of model.layers.0.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:13:27.452.663 [mindspore/train/serialization.py:195] The type of model.layers.0.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:13:37.860.325 [mindspore/train/serialization.py:195] The type of model.layers.1.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:13:37.864.524 [mindspore/train/serialization.py:195] The type of model.layers.1.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:13:48.229.730 [mindspore/train/serialization.py:195] The type of model.layers.2.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:13:48.233.862 [mindspore/train/serialization.py:195] The type of model.layers.2.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:13:58.509.954 [mindspore/train/serialization.py:195] The type of model.layers.3.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:13:58.514.284 [mindspore/train/serialization.py:195] The type of model.layers.3.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:14:08.835.753 [mindspore/train/serialization.py:195] The type of model.layers.4.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:14:08.839.924 [mindspore/train/serialization.py:195] The type of model.layers.4.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:14:19.101.570 [mindspore/train/serialization.py:195] The type of model.layers.5.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:14:19.105.922 [mindspore/train/serialization.py:195] The type of model.layers.5.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:14:29.432.081 [mindspore/train/serialization.py:195] The type of model.layers.6.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:14:29.436.559 [mindspore/train/serialization.py:195] The type of model.layers.6.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:14:39.750.067 [mindspore/train/serialization.py:195] The type of model.layers.7.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:14:39.754.217 [mindspore/train/serialization.py:195] The type of model.layers.7.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:14:50.286.41 [mindspore/train/serialization.py:195] The type of model.layers.8.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:14:50.330.42 [mindspore/train/serialization.py:195] The type of model.layers.8.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:15:00.341.852 [mindspore/train/serialization.py:195] The type of model.layers.9.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:15:00.346.082 [mindspore/train/serialization.py:195] The type of model.layers.9.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:15:10.584.267 [mindspore/train/serialization.py:195] The type of model.layers.10.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:15:10.588.582 [mindspore/train/serialization.py:195] The type of model.layers.10.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:15:20.931.161 [mindspore/train/serialization.py:195] The type of model.layers.11.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:15:20.935.327 [mindspore/train/serialization.py:195] The type of model.layers.11.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:15:31.243.944 [mindspore/train/serialization.py:195] The type of model.layers.12.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:15:31.248.276 [mindspore/train/serialization.py:195] The type of model.layers.12.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:15:41.580.200 [mindspore/train/serialization.py:195] The type of model.layers.13.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:15:41.584.560 [mindspore/train/serialization.py:195] The type of model.layers.13.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:15:51.853.948 [mindspore/train/serialization.py:195] The type of model.layers.14.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:15:51.858.129 [mindspore/train/serialization.py:195] The type of model.layers.14.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:16:02.169.491 [mindspore/train/serialization.py:195] The type of model.layers.15.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:16:02.173.842 [mindspore/train/serialization.py:195] The type of model.layers.15.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:16:12.533.548 [mindspore/train/serialization.py:195] The type of model.layers.16.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:16:12.537.771 [mindspore/train/serialization.py:195] The type of model.layers.16.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:16:22.837.291 [mindspore/train/serialization.py:195] The type of model.layers.17.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:16:22.841.672 [mindspore/train/serialization.py:195] The type of model.layers.17.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:16:33.181.055 [mindspore/train/serialization.py:195] The type of model.layers.18.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:16:33.185.296 [mindspore/train/serialization.py:195] The type of model.layers.18.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:16:43.510.484 [mindspore/train/serialization.py:195] The type of model.layers.19.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:16:43.514.713 [mindspore/train/serialization.py:195] The type of model.layers.19.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:16:53.845.127 [mindspore/train/serialization.py:195] The type of model.layers.20.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:16:53.849.525 [mindspore/train/serialization.py:195] The type of model.layers.20.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:17:04.171.540 [mindspore/train/serialization.py:195] The type of model.layers.21.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:17:04.175.764 [mindspore/train/serialization.py:195] The type of model.layers.21.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:17:14.439.414 [mindspore/train/serialization.py:195] The type of model.layers.22.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:17:14.443.737 [mindspore/train/serialization.py:195] The type of model.layers.22.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:17:24.793.044 [mindspore/train/serialization.py:195] The type of model.layers.23.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:17:24.797.326 [mindspore/train/serialization.py:195] The type of model.layers.23.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:17:35.130.532 [mindspore/train/serialization.py:195] The type of model.layers.24.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:17:35.134.771 [mindspore/train/serialization.py:195] The type of model.layers.24.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:17:45.414.241 [mindspore/train/serialization.py:195] The type of model.layers.25.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:17:45.418.633 [mindspore/train/serialization.py:195] The type of model.layers.25.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:17:55.707.324 [mindspore/train/serialization.py:195] The type of model.layers.26.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:17:55.711.550 [mindspore/train/serialization.py:195] The type of model.layers.26.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:18:05.967.954 [mindspore/train/serialization.py:195] The type of model.layers.27.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:18:05.972.320 [mindspore/train/serialization.py:195] The type of model.layers.27.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:18:16.264.569 [mindspore/train/serialization.py:195] The type of model.layers.28.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:18:16.268.968 [mindspore/train/serialization.py:195] The type of model.layers.28.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:18:26.528.924 [mindspore/train/serialization.py:195] The type of model.layers.29.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:18:26.533.187 [mindspore/train/serialization.py:195] The type of model.layers.29.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:18:36.854.892 [mindspore/train/serialization.py:195] The type of model.layers.30.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:18:36.859.288 [mindspore/train/serialization.py:195] The type of model.layers.30.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:18:47.119.625 [mindspore/train/serialization.py:195] The type of model.layers.31.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:18:47.123.917 [mindspore/train/serialization.py:195] The type of model.layers.31.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:18:57.372.551 [mindspore/train/serialization.py:195] The type of model.norm_out.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:19:22.394.196 [mindspore/train/serialization.py:1456] For 'load_param_into_net', 128 parameters in the 'net' are not loaded, because they are not in the 'parameter_dict', please check whether the network structure is consistent when training and loading checkpoint. 
+[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:19:22.394.745 [mindspore/train/serialization.py:1460] ['model.layers.0.attention.wq.mindpet_delta_lora_a', 'model.layers.0.attention.wq.mindpet_delta_lora_b', 'model.layers.0.attention.wv.mindpet_delta_lora_a', 'model.layers.0.attention.wv.mindpet_delta_lora_b', 'model.layers.1.attention.wq.mindpet_delta_lora_a', 'model.layers.1.attention.wq.mindpet_delta_lora_b', 'model.layers.1.attention.wv.mindpet_delta_lora_a', 'model.layers.1.attention.wv.mindpet_delta_lora_b', 'model.layers.2.attention.wq.mindpet_delta_lora_a', 'model.layers.2.attention.wq.mindpet_delta_lora_b', 'model.layers.2.attention.wv.mindpet_delta_lora_a', 'model.layers.2.attention.wv.mindpet_delta_lora_b', 'model.layers.3.attention.wq.mindpet_delta_lora_a', 'model.layers.3.attention.wq.mindpet_delta_lora_b', 'model.layers.3.attention.wv.mindpet_delta_lora_a', 'model.layers.3.attention.wv.mindpet_delta_lora_b', 'model.layers.4.attention.wq.mindpet_delta_lora_a', 'model.layers.4.attention.wq.mindpet_delta_lora_b', 'model.layers.4.attention.wv.mindpet_delta_lora_a', 'model.layers.4.attention.wv.mindpet_delta_lora_b', 'model.layers.5.attention.wq.mindpet_delta_lora_a', 'model.layers.5.attention.wq.mindpet_delta_lora_b', 'model.layers.5.attention.wv.mindpet_delta_lora_a', 'model.layers.5.attention.wv.mindpet_delta_lora_b', 'model.layers.6.attention.wq.mindpet_delta_lora_a', 'model.layers.6.attention.wq.mindpet_delta_lora_b', 'model.layers.6.attention.wv.mindpet_delta_lora_a', 'model.layers.6.attention.wv.mindpet_delta_lora_b', 'model.layers.7.attention.wq.mindpet_delta_lora_a', 'model.layers.7.attention.wq.mindpet_delta_lora_b', 'model.layers.7.attention.wv.mindpet_delta_lora_a', 'model.layers.7.attention.wv.mindpet_delta_lora_b', 'model.layers.8.attention.wq.mindpet_delta_lora_a', 'model.layers.8.attention.wq.mindpet_delta_lora_b', 'model.layers.8.attention.wv.mindpet_delta_lora_a', 'model.layers.8.attention.wv.mindpet_delta_lora_b', 
'model.layers.9.attention.wq.mindpet_delta_lora_a', 'model.layers.9.attention.wq.mindpet_delta_lora_b', 'model.layers.9.attention.wv.mindpet_delta_lora_a', 'model.layers.9.attention.wv.mindpet_delta_lora_b', 'model.layers.10.attention.wq.mindpet_delta_lora_a', 'model.layers.10.attention.wq.mindpet_delta_lora_b', 'model.layers.10.attention.wv.mindpet_delta_lora_a', 'model.layers.10.attention.wv.mindpet_delta_lora_b', 'model.layers.11.attention.wq.mindpet_delta_lora_a', 'model.layers.11.attention.wq.mindpet_delta_lora_b', 'model.layers.11.attention.wv.mindpet_delta_lora_a', 'model.layers.11.attention.wv.mindpet_delta_lora_b', 'model.layers.12.attention.wq.mindpet_delta_lora_a', 'model.layers.12.attention.wq.mindpet_delta_lora_b', 'model.layers.12.attention.wv.mindpet_delta_lora_a', 'model.layers.12.attention.wv.mindpet_delta_lora_b', 'model.layers.13.attention.wq.mindpet_delta_lora_a', 'model.layers.13.attention.wq.mindpet_delta_lora_b', 'model.layers.13.attention.wv.mindpet_delta_lora_a', 'model.layers.13.attention.wv.mindpet_delta_lora_b', 'model.layers.14.attention.wq.mindpet_delta_lora_a', 'model.layers.14.attention.wq.mindpet_delta_lora_b', 'model.layers.14.attention.wv.mindpet_delta_lora_a', 'model.layers.14.attention.wv.mindpet_delta_lora_b', 'model.layers.15.attention.wq.mindpet_delta_lora_a', 'model.layers.15.attention.wq.mindpet_delta_lora_b', 'model.layers.15.attention.wv.mindpet_delta_lora_a', 'model.layers.15.attention.wv.mindpet_delta_lora_b', 'model.layers.16.attention.wq.mindpet_delta_lora_a', 'model.layers.16.attention.wq.mindpet_delta_lora_b', 'model.layers.16.attention.wv.mindpet_delta_lora_a', 'model.layers.16.attention.wv.mindpet_delta_lora_b', 'model.layers.17.attention.wq.mindpet_delta_lora_a', 'model.layers.17.attention.wq.mindpet_delta_lora_b', 'model.layers.17.attention.wv.mindpet_delta_lora_a', 'model.layers.17.attention.wv.mindpet_delta_lora_b', 'model.layers.18.attention.wq.mindpet_delta_lora_a', 
'model.layers.18.attention.wq.mindpet_delta_lora_b', 'model.layers.18.attention.wv.mindpet_delta_lora_a', 'model.layers.18.attention.wv.mindpet_delta_lora_b', 'model.layers.19.attention.wq.mindpet_delta_lora_a', 'model.layers.19.attention.wq.mindpet_delta_lora_b', 'model.layers.19.attention.wv.mindpet_delta_lora_a', 'model.layers.19.attention.wv.mindpet_delta_lora_b', 'model.layers.20.attention.wq.mindpet_delta_lora_a', 'model.layers.20.attention.wq.mindpet_delta_lora_b', 'model.layers.20.attention.wv.mindpet_delta_lora_a', 'model.layers.20.attention.wv.mindpet_delta_lora_b', 'model.layers.21.attention.wq.mindpet_delta_lora_a', 'model.layers.21.attention.wq.mindpet_delta_lora_b', 'model.layers.21.attention.wv.mindpet_delta_lora_a', 'model.layers.21.attention.wv.mindpet_delta_lora_b', 'model.layers.22.attention.wq.mindpet_delta_lora_a', 'model.layers.22.attention.wq.mindpet_delta_lora_b', 'model.layers.22.attention.wv.mindpet_delta_lora_a', 'model.layers.22.attention.wv.mindpet_delta_lora_b', 'model.layers.23.attention.wq.mindpet_delta_lora_a', 'model.layers.23.attention.wq.mindpet_delta_lora_b', 'model.layers.23.attention.wv.mindpet_delta_lora_a', 'model.layers.23.attention.wv.mindpet_delta_lora_b', 'model.layers.24.attention.wq.mindpet_delta_lora_a', 'model.layers.24.attention.wq.mindpet_delta_lora_b', 'model.layers.24.attention.wv.mindpet_delta_lora_a', 'model.layers.24.attention.wv.mindpet_delta_lora_b', 'model.layers.25.attention.wq.mindpet_delta_lora_a', 'model.layers.25.attention.wq.mindpet_delta_lora_b', 'model.layers.25.attention.wv.mindpet_delta_lora_a', 'model.layers.25.attention.wv.mindpet_delta_lora_b', 'model.layers.26.attention.wq.mindpet_delta_lora_a', 'model.layers.26.attention.wq.mindpet_delta_lora_b', 'model.layers.26.attention.wv.mindpet_delta_lora_a', 'model.layers.26.attention.wv.mindpet_delta_lora_b', 'model.layers.27.attention.wq.mindpet_delta_lora_a', 'model.layers.27.attention.wq.mindpet_delta_lora_b', 
'model.layers.27.attention.wv.mindpet_delta_lora_a', 'model.layers.27.attention.wv.mindpet_delta_lora_b', 'model.layers.28.attention.wq.mindpet_delta_lora_a', 'model.layers.28.attention.wq.mindpet_delta_lora_b', 'model.layers.28.attention.wv.mindpet_delta_lora_a', 'model.layers.28.attention.wv.mindpet_delta_lora_b', 'model.layers.29.attention.wq.mindpet_delta_lora_a', 'model.layers.29.attention.wq.mindpet_delta_lora_b', 'model.layers.29.attention.wv.mindpet_delta_lora_a', 'model.layers.29.attention.wv.mindpet_delta_lora_b', 'model.layers.30.attention.wq.mindpet_delta_lora_a', 'model.layers.30.attention.wq.mindpet_delta_lora_b', 'model.layers.30.attention.wv.mindpet_delta_lora_a', 'model.layers.30.attention.wv.mindpet_delta_lora_b', 'model.layers.31.attention.wq.mindpet_delta_lora_a', 'model.layers.31.attention.wq.mindpet_delta_lora_b', 'model.layers.31.attention.wv.mindpet_delta_lora_a', 'model.layers.31.attention.wv.mindpet_delta_lora_b'] are not loaded. +2024-07-25 18:19:22,395 - mindformers[mindformers/trainer/utils.py:767] - INFO - Network parameters are not loaded: (['model.layers.0.attention.wq.mindpet_delta_lora_a', 'model.layers.0.attention.wq.mindpet_delta_lora_b', 'model.layers.0.attention.wv.mindpet_delta_lora_a', 'model.layers.0.attention.wv.mindpet_delta_lora_b', 'model.layers.1.attention.wq.mindpet_delta_lora_a', 'model.layers.1.attention.wq.mindpet_delta_lora_b', 'model.layers.1.attention.wv.mindpet_delta_lora_a', 'model.layers.1.attention.wv.mindpet_delta_lora_b', 'model.layers.2.attention.wq.mindpet_delta_lora_a', 'model.layers.2.attention.wq.mindpet_delta_lora_b', 'model.layers.2.attention.wv.mindpet_delta_lora_a', 'model.layers.2.attention.wv.mindpet_delta_lora_b', 'model.layers.3.attention.wq.mindpet_delta_lora_a', 'model.layers.3.attention.wq.mindpet_delta_lora_b', 'model.layers.3.attention.wv.mindpet_delta_lora_a', 'model.layers.3.attention.wv.mindpet_delta_lora_b', 'model.layers.4.attention.wq.mindpet_delta_lora_a', 
'model.layers.4.attention.wq.mindpet_delta_lora_b', 'model.layers.4.attention.wv.mindpet_delta_lora_a', 'model.layers.4.attention.wv.mindpet_delta_lora_b', 'model.layers.5.attention.wq.mindpet_delta_lora_a', 'model.layers.5.attention.wq.mindpet_delta_lora_b', 'model.layers.5.attention.wv.mindpet_delta_lora_a', 'model.layers.5.attention.wv.mindpet_delta_lora_b', 'model.layers.6.attention.wq.mindpet_delta_lora_a', 'model.layers.6.attention.wq.mindpet_delta_lora_b', 'model.layers.6.attention.wv.mindpet_delta_lora_a', 'model.layers.6.attention.wv.mindpet_delta_lora_b', 'model.layers.7.attention.wq.mindpet_delta_lora_a', 'model.layers.7.attention.wq.mindpet_delta_lora_b', 'model.layers.7.attention.wv.mindpet_delta_lora_a', 'model.layers.7.attention.wv.mindpet_delta_lora_b', 'model.layers.8.attention.wq.mindpet_delta_lora_a', 'model.layers.8.attention.wq.mindpet_delta_lora_b', 'model.layers.8.attention.wv.mindpet_delta_lora_a', 'model.layers.8.attention.wv.mindpet_delta_lora_b', 'model.layers.9.attention.wq.mindpet_delta_lora_a', 'model.layers.9.attention.wq.mindpet_delta_lora_b', 'model.layers.9.attention.wv.mindpet_delta_lora_a', 'model.layers.9.attention.wv.mindpet_delta_lora_b', 'model.layers.10.attention.wq.mindpet_delta_lora_a', 'model.layers.10.attention.wq.mindpet_delta_lora_b', 'model.layers.10.attention.wv.mindpet_delta_lora_a', 'model.layers.10.attention.wv.mindpet_delta_lora_b', 'model.layers.11.attention.wq.mindpet_delta_lora_a', 'model.layers.11.attention.wq.mindpet_delta_lora_b', 'model.layers.11.attention.wv.mindpet_delta_lora_a', 'model.layers.11.attention.wv.mindpet_delta_lora_b', 'model.layers.12.attention.wq.mindpet_delta_lora_a', 'model.layers.12.attention.wq.mindpet_delta_lora_b', 'model.layers.12.attention.wv.mindpet_delta_lora_a', 'model.layers.12.attention.wv.mindpet_delta_lora_b', 'model.layers.13.attention.wq.mindpet_delta_lora_a', 'model.layers.13.attention.wq.mindpet_delta_lora_b', 'model.layers.13.attention.wv.mindpet_delta_lora_a', 
'model.layers.13.attention.wv.mindpet_delta_lora_b', 'model.layers.14.attention.wq.mindpet_delta_lora_a', 'model.layers.14.attention.wq.mindpet_delta_lora_b', 'model.layers.14.attention.wv.mindpet_delta_lora_a', 'model.layers.14.attention.wv.mindpet_delta_lora_b', 'model.layers.15.attention.wq.mindpet_delta_lora_a', 'model.layers.15.attention.wq.mindpet_delta_lora_b', 'model.layers.15.attention.wv.mindpet_delta_lora_a', 'model.layers.15.attention.wv.mindpet_delta_lora_b', 'model.layers.16.attention.wq.mindpet_delta_lora_a', 'model.layers.16.attention.wq.mindpet_delta_lora_b', 'model.layers.16.attention.wv.mindpet_delta_lora_a', 'model.layers.16.attention.wv.mindpet_delta_lora_b', 'model.layers.17.attention.wq.mindpet_delta_lora_a', 'model.layers.17.attention.wq.mindpet_delta_lora_b', 'model.layers.17.attention.wv.mindpet_delta_lora_a', 'model.layers.17.attention.wv.mindpet_delta_lora_b', 'model.layers.18.attention.wq.mindpet_delta_lora_a', 'model.layers.18.attention.wq.mindpet_delta_lora_b', 'model.layers.18.attention.wv.mindpet_delta_lora_a', 'model.layers.18.attention.wv.mindpet_delta_lora_b', 'model.layers.19.attention.wq.mindpet_delta_lora_a', 'model.layers.19.attention.wq.mindpet_delta_lora_b', 'model.layers.19.attention.wv.mindpet_delta_lora_a', 'model.layers.19.attention.wv.mindpet_delta_lora_b', 'model.layers.20.attention.wq.mindpet_delta_lora_a', 'model.layers.20.attention.wq.mindpet_delta_lora_b', 'model.layers.20.attention.wv.mindpet_delta_lora_a', 'model.layers.20.attention.wv.mindpet_delta_lora_b', 'model.layers.21.attention.wq.mindpet_delta_lora_a', 'model.layers.21.attention.wq.mindpet_delta_lora_b', 'model.layers.21.attention.wv.mindpet_delta_lora_a', 'model.layers.21.attention.wv.mindpet_delta_lora_b', 'model.layers.22.attention.wq.mindpet_delta_lora_a', 'model.layers.22.attention.wq.mindpet_delta_lora_b', 'model.layers.22.attention.wv.mindpet_delta_lora_a', 'model.layers.22.attention.wv.mindpet_delta_lora_b', 
'model.layers.23.attention.wq.mindpet_delta_lora_a', 'model.layers.23.attention.wq.mindpet_delta_lora_b', 'model.layers.23.attention.wv.mindpet_delta_lora_a', 'model.layers.23.attention.wv.mindpet_delta_lora_b', 'model.layers.24.attention.wq.mindpet_delta_lora_a', 'model.layers.24.attention.wq.mindpet_delta_lora_b', 'model.layers.24.attention.wv.mindpet_delta_lora_a', 'model.layers.24.attention.wv.mindpet_delta_lora_b', 'model.layers.25.attention.wq.mindpet_delta_lora_a', 'model.layers.25.attention.wq.mindpet_delta_lora_b', 'model.layers.25.attention.wv.mindpet_delta_lora_a', 'model.layers.25.attention.wv.mindpet_delta_lora_b', 'model.layers.26.attention.wq.mindpet_delta_lora_a', 'model.layers.26.attention.wq.mindpet_delta_lora_b', 'model.layers.26.attention.wv.mindpet_delta_lora_a', 'model.layers.26.attention.wv.mindpet_delta_lora_b', 'model.layers.27.attention.wq.mindpet_delta_lora_a', 'model.layers.27.attention.wq.mindpet_delta_lora_b', 'model.layers.27.attention.wv.mindpet_delta_lora_a', 'model.layers.27.attention.wv.mindpet_delta_lora_b', 'model.layers.28.attention.wq.mindpet_delta_lora_a', 'model.layers.28.attention.wq.mindpet_delta_lora_b', 'model.layers.28.attention.wv.mindpet_delta_lora_a', 'model.layers.28.attention.wv.mindpet_delta_lora_b', 'model.layers.29.attention.wq.mindpet_delta_lora_a', 'model.layers.29.attention.wq.mindpet_delta_lora_b', 'model.layers.29.attention.wv.mindpet_delta_lora_a', 'model.layers.29.attention.wv.mindpet_delta_lora_b', 'model.layers.30.attention.wq.mindpet_delta_lora_a', 'model.layers.30.attention.wq.mindpet_delta_lora_b', 'model.layers.30.attention.wv.mindpet_delta_lora_a', 'model.layers.30.attention.wv.mindpet_delta_lora_b', 'model.layers.31.attention.wq.mindpet_delta_lora_a', 'model.layers.31.attention.wq.mindpet_delta_lora_b', 'model.layers.31.attention.wv.mindpet_delta_lora_a', 'model.layers.31.attention.wv.mindpet_delta_lora_b'], []) +2024-07-25 18:19:22,397 - mindformers[mindformers/trainer/base_trainer.py:770] - INFO 
- .........Starting Training Model.......... +2024-07-25 18:19:22,397 - mindformers[mindformers/trainer/base_trainer.py:773] - INFO - .........Model Compiling, Please Wait a Moment........... +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:19:22.398.797 [mindspore/train/model.py:1120] For MFLossMonitor callback, {'epoch_end', 'epoch_begin', 'step_begin', 'step_end'} methods may not be supported in later version, Use methods prefixed with 'on_train' or 'on_eval' instead when using customized callbacks. +[WARNING] ME(62193:281473249333264,MainProcess):2024-07-25-18:19:22.398.954 [mindspore/train/model.py:1120] For Local2ObsMonitor callback, {'epoch_end', 'step_end'} methods may not be supported in later version, Use methods prefixed with 'on_train' or 'on_eval' instead when using customized callbacks. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.586.591 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/31-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.587.423 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/30-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.588.105 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/29-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.588.785 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/28-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.589.492 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/27-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.590.174 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/26-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.590.884 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/25-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.591.552 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/24-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.592.214 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/23-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.592.868 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/22-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.593.559 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/21-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.594.249 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/20-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.594.939 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/19-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.595.603 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/18-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.596.275 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/17-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.596.927 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/16-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.597.606 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/15-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.598.259 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/14-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.598.901 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/13-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.599.546 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/12-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.600.196 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/11-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.600.852 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/10-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.601.542 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/9-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.602.203 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/8-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.602.874 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/7-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.603.533 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/6-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.604.188 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/5-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.604.836 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/4-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.605.500 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/3-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.606.141 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/2-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.606.810 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/1-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.607.461 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/0-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.607.917 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/0-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.608.638 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/1-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.609.401 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/2-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.610.145 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/3-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.610.888 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/4-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.611.630 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/5-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.612.398 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/6-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.613.136 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/7-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.613.901 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/8-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.614.645 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/9-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.615.389 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/10-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.616.129 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/11-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.616.879 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/12-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.617.657 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/13-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.618.413 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/14-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.619.145 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/15-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.619.859 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/16-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.620.602 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/17-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.621.333 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/18-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.622.047 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/19-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.622.747 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/20-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.623.445 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/21-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.624.151 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/22-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.624.835 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/23-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.625.543 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/24-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.626.182 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/25-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.626.795 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/26-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.627.410 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/27-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.628.030 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/28-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.628.649 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/29-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.629.307 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/30-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:50.629.931 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/31-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62193,ffff990a5010,python):2024-07-25-18:19:53.308.256 [mindspore/ccsrc/frontend/parallel/graph_util/graph_utils.cc:68] GetTensorRedistributionFromCNode] Default/network-MFTrainOneStepCell/clip_grad_norm-ClipGradNorm/Sqrt-op0 has no OperatorInfo. 
+- \ | / 2024-07-25 18:28:34,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 2/ 1625], loss: 1.518, per_step_time: 275416ms, lr: 1.8461538e-08, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:34,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 0.02905 samples/s/p 51 days, 19:02:48 } +2024-07-25 18:28:38,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 4/ 1625], loss: 1.444, per_step_time: 1637ms, lr: 5.538461e-08, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:38,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 4.88473 samples/s/p 7:23:27 } +2024-07-25 18:28:41,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 6/ 1625], loss: 1.332, per_step_time: 1473ms, lr: 9.230769e-08, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:41,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 5.42973 samples/s/p 6:38:53 } +2024-07-25 18:28:44,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 8/ 1625], loss: 1.351, per_step_time: 1479ms, lr: 1.2923077e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:44,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 5.40719 samples/s/p 6:40:30 } +2024-07-25 18:28:47,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 10/ 1625], loss: 1.390, per_step_time: 1470ms, lr: 1.6615384e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:47,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.44181 samples/s/p 6:37:54 } +2024-07-25 18:28:50,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 12/ 1625], loss: 1.383, per_step_time: 1472ms, lr: 2.0307691e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 
18:28:50,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43361 samples/s/p 6:38:27 } +2024-07-25 18:28:52,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 14/ 1625], loss: 1.447, per_step_time: 1471ms, lr: 2.4e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:52,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43800 samples/s/p 6:38:05 } +2024-07-25 18:28:55,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 16/ 1625], loss: 1.293, per_step_time: 1472ms, lr: 2.7692306e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:55,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43287 samples/s/p 6:38:24 } +2024-07-25 18:28:58,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 18/ 1625], loss: 1.406, per_step_time: 1474ms, lr: 3.1384613e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:58,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.42720 samples/s/p 6:38:46 } +2024-07-25 18:29:01,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 20/ 1625], loss: 1.348, per_step_time: 1472ms, lr: 3.5076923e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:01,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43465 samples/s/p 6:38:11 } +2024-07-25 18:29:04,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 22/ 1625], loss: 1.420, per_step_time: 1473ms, lr: 3.876923e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:04,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.42816 samples/s/p 6:38:36 } +2024-07-25 18:29:07,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 24/ 1625], loss: 
1.562, per_step_time: 1471ms, lr: 4.2461537e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:07,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43605 samples/s/p 6:37:59 } +2024-07-25 18:29:10,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 26/ 1625], loss: 1.360, per_step_time: 1471ms, lr: 4.6153846e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:10,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43697 samples/s/p 6:37:52 } +2024-07-25 18:29:13,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 28/ 1625], loss: 1.523, per_step_time: 1471ms, lr: 4.9846153e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:13,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43669 samples/s/p 6:37:50 } +2024-07-25 18:29:16,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 30/ 1625], loss: 1.471, per_step_time: 1473ms, lr: 5.3538463e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:16,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.42989 samples/s/p 6:38:17 } +2024-07-25 18:29:19,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 32/ 1625], loss: 1.504, per_step_time: 1471ms, lr: 5.7230767e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:19,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43645 samples/s/p 6:37:45 } +2024-07-25 18:29:22,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 34/ 1625], loss: 1.483, per_step_time: 1471ms, lr: 6.092307e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:22,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43728 samples/s/p 6:37:38 } +2024-07-25 18:29:25,452 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 36/ 1625], loss: 1.478, per_step_time: 1472ms, lr: 6.461538e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:25,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43337 samples/s/p 6:37:53 } +2024-07-25 18:29:28,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 38/ 1625], loss: 1.330, per_step_time: 1474ms, lr: 6.8307685e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:28,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.42700 samples/s/p 6:38:18 } +2024-07-25 18:29:31,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 40/ 1625], loss: 1.169, per_step_time: 1474ms, lr: 7.2e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:31,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.42667 samples/s/p 6:38:16 } +2024-07-25 18:29:34,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 42/ 1625], loss: 1.627, per_step_time: 1473ms, lr: 7.5692304e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:34,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.42959 samples/s/p 6:38:00 } +2024-07-25 18:29:37,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 44/ 1625], loss: 1.519, per_step_time: 1471ms, lr: 7.9384614e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:37,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.43812 samples/s/p 6:37:20 } +2024-07-25 18:29:40,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 46/ 1625], loss: 1.278, per_step_time: 1473ms, lr: 8.307692e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:40,220 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.42953 samples/s/p 6:37:55 } +2024-07-25 18:29:43,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 48/ 1625], loss: 1.576, per_step_time: 1472ms, lr: 8.676922e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:43,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.43436 samples/s/p 6:37:31 } +2024-07-25 18:29:46,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 50/ 1625], loss: 1.361, per_step_time: 1473ms, lr: 9.046154e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:46,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.42782 samples/s/p 6:37:56 } +2024-07-25 18:29:49,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 52/ 1625], loss: 1.520, per_step_time: 1472ms, lr: 9.4153836e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:49,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.43202 samples/s/p 6:37:35 } +2024-07-25 18:29:52,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 54/ 1625], loss: 1.476, per_step_time: 1473ms, lr: 9.784615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:52,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.42964 samples/s/p 6:37:43 } +2024-07-25 18:29:54,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 56/ 1625], loss: 1.118, per_step_time: 1473ms, lr: 1.0153847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:54,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.43012 samples/s/p 6:37:38 } +2024-07-25 18:29:57,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 58/ 1625], loss: 1.420, 
per_step_time: 1473ms, lr: 1.0523077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:57,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.42757 samples/s/p 6:37:46 } +2024-07-25 18:30:00,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 60/ 1625], loss: 1.523, per_step_time: 1473ms, lr: 1.0892308e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:00,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.42805 samples/s/p 6:37:41 } +2024-07-25 18:30:03,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 62/ 1625], loss: 1.416, per_step_time: 1473ms, lr: 1.1261538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:03,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43027 samples/s/p 6:37:28 } +2024-07-25 18:30:06,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 64/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 1.1630768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:06,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43161 samples/s/p 6:37:19 } +2024-07-25 18:30:09,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 66/ 1625], loss: 1.349, per_step_time: 1472ms, lr: 1.1999999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:09,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43315 samples/s/p 6:37:09 } +2024-07-25 18:30:12,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 68/ 1625], loss: 1.436, per_step_time: 1471ms, lr: 1.236923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:12,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43823 samples/s/p 6:36:44 } +2024-07-25 18:30:15,654 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 70/ 1625], loss: 1.423, per_step_time: 1471ms, lr: 1.2738461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:15,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43795 samples/s/p 6:36:43 } +2024-07-25 18:30:18,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 72/ 1625], loss: 1.402, per_step_time: 1471ms, lr: 1.3107691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:18,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43692 samples/s/p 6:36:44 } +2024-07-25 18:30:21,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 74/ 1625], loss: 1.433, per_step_time: 1475ms, lr: 1.3476922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:21,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.42306 samples/s/p 6:37:42 } +2024-07-25 18:30:24,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 76/ 1625], loss: 1.482, per_step_time: 1472ms, lr: 1.3846154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:24,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.43364 samples/s/p 6:36:53 } +2024-07-25 18:30:27,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 78/ 1625], loss: 1.335, per_step_time: 1473ms, lr: 1.4215384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:27,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.42838 samples/s/p 6:37:13 } +2024-07-25 18:30:30,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 80/ 1625], loss: 1.323, per_step_time: 1473ms, lr: 1.4584615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:30,424 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.42933 samples/s/p 6:37:06 } +2024-07-25 18:30:33,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 82/ 1625], loss: 1.471, per_step_time: 1474ms, lr: 1.4953846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:33,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.42444 samples/s/p 6:37:24 } +2024-07-25 18:30:36,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 84/ 1625], loss: 1.493, per_step_time: 1472ms, lr: 1.5323077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:36,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.43412 samples/s/p 6:36:39 } +2024-07-25 18:30:39,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 86/ 1625], loss: 1.431, per_step_time: 1473ms, lr: 1.5692307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:39,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.42802 samples/s/p 6:37:03 } +2024-07-25 18:30:42,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 88/ 1625], loss: 1.613, per_step_time: 1471ms, lr: 1.6061538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:42,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.43705 samples/s/p 6:36:20 } +2024-07-25 18:30:45,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 90/ 1625], loss: 1.673, per_step_time: 1483ms, lr: 1.6430769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:45,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.39384 samples/s/p 6:39:28 } +2024-07-25 18:30:48,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 92/ 1625], loss: 1.348, 
per_step_time: 1471ms, lr: 1.6799999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:48,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43722 samples/s/p 6:36:13 } +2024-07-25 18:30:51,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 94/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 1.716923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:51,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43501 samples/s/p 6:36:20 } +2024-07-25 18:30:54,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 96/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 1.753846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:54,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43663 samples/s/p 6:36:10 } +2024-07-25 18:30:57,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 98/ 1625], loss: 1.372, per_step_time: 1470ms, lr: 1.7907691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:57,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.44021 samples/s/p 6:35:52 } +2024-07-25 18:30:59,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 100/ 1625], loss: 1.329, per_step_time: 1471ms, lr: 1.8276922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:59,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43828 samples/s/p 6:35:57 } +2024-07-25 18:31:02,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 102/ 1625], loss: 1.413, per_step_time: 1472ms, lr: 1.8646153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:02,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43292 samples/s/p 6:36:18 } +2024-07-25 18:31:05,862 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 104/ 1625], loss: 1.332, per_step_time: 1472ms, lr: 1.9015384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:05,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43256 samples/s/p 6:36:16 } +2024-07-25 18:31:08,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 106/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 1.9384615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:08,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.42885 samples/s/p 6:36:29 } +2024-07-25 18:31:11,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 108/ 1625], loss: 1.504, per_step_time: 1471ms, lr: 1.9753845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:11,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43515 samples/s/p 6:35:59 } +2024-07-25 18:31:14,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 110/ 1625], loss: 1.302, per_step_time: 1471ms, lr: 2.0123075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:14,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43736 samples/s/p 6:35:46 } +2024-07-25 18:31:17,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 112/ 1625], loss: 1.379, per_step_time: 1471ms, lr: 2.0492307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:17,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43757 samples/s/p 6:35:42 } +2024-07-25 18:31:20,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 114/ 1625], loss: 1.391, per_step_time: 1470ms, lr: 2.0861537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:20,616 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43955 samples/s/p 6:35:31 } +2024-07-25 18:31:23,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 116/ 1625], loss: 1.443, per_step_time: 1471ms, lr: 2.1230767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:23,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43565 samples/s/p 6:35:45 } +2024-07-25 18:31:26,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 118/ 1625], loss: 1.047, per_step_time: 1471ms, lr: 2.16e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:26,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43801 samples/s/p 6:35:32 } +2024-07-25 18:31:29,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 120/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.1969229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:29,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43155 samples/s/p 6:35:57 } +2024-07-25 18:31:32,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 122/ 1625], loss: 1.398, per_step_time: 1472ms, lr: 2.233846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:32,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43315 samples/s/p 6:35:47 } +2024-07-25 18:31:35,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 124/ 1625], loss: 1.370, per_step_time: 1471ms, lr: 2.270769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:35,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43599 samples/s/p 6:35:32 } +2024-07-25 18:31:38,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 126/ 1625], loss: 1.199, 
per_step_time: 1475ms, lr: 2.307692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:38,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.42268 samples/s/p 6:36:27 } +2024-07-25 18:31:41,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 128/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.3446153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:41,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43588 samples/s/p 6:35:26 } +2024-07-25 18:31:44,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 130/ 1625], loss: 1.262, per_step_time: 1474ms, lr: 2.3815385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:44,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.42486 samples/s/p 6:36:12 } +2024-07-25 18:31:47,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 132/ 1625], loss: 1.332, per_step_time: 1472ms, lr: 2.4184615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:47,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43478 samples/s/p 6:35:25 } +2024-07-25 18:31:50,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 134/ 1625], loss: 1.484, per_step_time: 1472ms, lr: 2.4553847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:50,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43456 samples/s/p 6:35:23 } +2024-07-25 18:31:53,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 136/ 1625], loss: 1.322, per_step_time: 1473ms, lr: 2.4923077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:53,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.42841 samples/s/p 6:35:47 } +2024-07-25 18:31:56,044 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 138/ 1625], loss: 1.332, per_step_time: 1471ms, lr: 2.5292306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:56,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43479 samples/s/p 6:35:16 } +2024-07-25 18:31:58,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 140/ 1625], loss: 1.388, per_step_time: 1472ms, lr: 2.5661539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:58,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43381 samples/s/p 6:35:18 } +2024-07-25 18:32:01,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 142/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 2.6030768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:01,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43225 samples/s/p 6:35:22 } +2024-07-25 18:32:04,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 144/ 1625], loss: 1.342, per_step_time: 1472ms, lr: 2.6399998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:04,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43338 samples/s/p 6:35:14 } +2024-07-25 18:32:07,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 146/ 1625], loss: 1.334, per_step_time: 1472ms, lr: 2.676923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:07,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43322 samples/s/p 6:35:11 } +2024-07-25 18:32:10,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 148/ 1625], loss: 1.377, per_step_time: 1472ms, lr: 2.713846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:10,805 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43263 samples/s/p 6:35:11 } +2024-07-25 18:32:13,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 150/ 1625], loss: 1.384, per_step_time: 1470ms, lr: 2.7507692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:13,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43962 samples/s/p 6:34:38 } +2024-07-25 18:32:16,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 152/ 1625], loss: 1.442, per_step_time: 1471ms, lr: 2.7876922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:16,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43628 samples/s/p 6:34:49 } +2024-07-25 18:32:19,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 154/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 2.8246152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:19,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43469 samples/s/p 6:34:53 } +2024-07-25 18:32:22,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 156/ 1625], loss: 1.473, per_step_time: 1471ms, lr: 2.8615384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:22,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43800 samples/s/p 6:34:36 } +2024-07-25 18:32:25,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 158/ 1625], loss: 1.352, per_step_time: 1471ms, lr: 2.8984614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:25,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43586 samples/s/p 6:34:42 } +2024-07-25 18:32:28,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 160/ 1625], loss: 1.335, 
per_step_time: 1474ms, lr: 2.9353844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:28,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.42735 samples/s/p 6:35:16 } +2024-07-25 18:32:31,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 162/ 1625], loss: 1.487, per_step_time: 1471ms, lr: 2.9723076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:31,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43537 samples/s/p 6:34:38 } +2024-07-25 18:32:34,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 164/ 1625], loss: 1.285, per_step_time: 1470ms, lr: 3.0092306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:34,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43940 samples/s/p 6:34:18 } +2024-07-25 18:32:37,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 166/ 1625], loss: 1.387, per_step_time: 1472ms, lr: 3.0461536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:37,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43298 samples/s/p 6:34:43 } +2024-07-25 18:32:40,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 168/ 1625], loss: 1.343, per_step_time: 1471ms, lr: 3.0830768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:40,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43725 samples/s/p 6:34:21 } +2024-07-25 18:32:43,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 170/ 1625], loss: 1.357, per_step_time: 1472ms, lr: 3.1199997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:43,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43234 samples/s/p 6:34:40 } +2024-07-25 18:32:46,217 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 172/ 1625], loss: 1.297, per_step_time: 1472ms, lr: 3.156923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:46,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43322 samples/s/p 6:34:33 } +2024-07-25 18:32:49,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 174/ 1625], loss: 1.353, per_step_time: 1472ms, lr: 3.1938462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:49,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43261 samples/s/p 6:34:33 } +2024-07-25 18:32:52,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 176/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 3.2307692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:52,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43346 samples/s/p 6:34:26 } +2024-07-25 18:32:55,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 178/ 1625], loss: 1.353, per_step_time: 1472ms, lr: 3.2676921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:55,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43459 samples/s/p 6:34:18 } +2024-07-25 18:32:58,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 180/ 1625], loss: 1.463, per_step_time: 1472ms, lr: 3.3046153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:58,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43403 samples/s/p 6:34:18 } +2024-07-25 18:33:00,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 182/ 1625], loss: 1.410, per_step_time: 1473ms, lr: 3.3415383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:00,978 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.42961 samples/s/p 6:34:34 } +2024-07-25 18:33:03,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 184/ 1625], loss: 1.516, per_step_time: 1471ms, lr: 3.3784615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:03,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43830 samples/s/p 6:33:53 } +2024-07-25 18:33:06,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 186/ 1625], loss: 1.353, per_step_time: 1473ms, lr: 3.4153845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:06,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.42932 samples/s/p 6:34:30 } +2024-07-25 18:33:09,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 188/ 1625], loss: 1.366, per_step_time: 1472ms, lr: 3.4523075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:09,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43458 samples/s/p 6:34:04 } +2024-07-25 18:33:12,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 190/ 1625], loss: 1.327, per_step_time: 1473ms, lr: 3.4892307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:12,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43083 samples/s/p 6:34:17 } +2024-07-25 18:33:15,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 192/ 1625], loss: 1.355, per_step_time: 1473ms, lr: 3.5261537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:15,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43006 samples/s/p 6:34:17 } +2024-07-25 18:33:18,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 194/ 1625], loss: 1.304, 
per_step_time: 1472ms, lr: 3.5630767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:18,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43267 samples/s/p 6:34:03 } +2024-07-25 18:33:21,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 196/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 3.6e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:21,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43539 samples/s/p 6:33:48 } +2024-07-25 18:33:24,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 198/ 1625], loss: 1.411, per_step_time: 1473ms, lr: 3.6369229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:24,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43077 samples/s/p 6:34:06 } +2024-07-25 18:33:27,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 200/ 1625], loss: 1.502, per_step_time: 1472ms, lr: 3.6738459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:27,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43448 samples/s/p 6:33:46 } +2024-07-25 18:33:30,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 202/ 1625], loss: 1.411, per_step_time: 1471ms, lr: 3.710769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:30,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43742 samples/s/p 6:33:31 } +2024-07-25 18:33:33,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 204/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 3.747692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:33,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.43398 samples/s/p 6:33:43 } +2024-07-25 18:33:36,403 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 206/ 1625], loss: 1.352, per_step_time: 1473ms, lr: 3.784615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:36,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.42830 samples/s/p 6:34:04 } +2024-07-25 18:33:39,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 208/ 1625], loss: 1.262, per_step_time: 1472ms, lr: 3.8215385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:39,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.43325 samples/s/p 6:33:40 } +2024-07-25 18:33:42,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 210/ 1625], loss: 1.391, per_step_time: 1472ms, lr: 3.8584612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:42,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.43201 samples/s/p 6:33:42 } +2024-07-25 18:33:45,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 212/ 1625], loss: 1.315, per_step_time: 1470ms, lr: 3.8953845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:45,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.43854 samples/s/p 6:33:11 } +2024-07-25 18:33:48,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 214/ 1625], loss: 1.257, per_step_time: 1474ms, lr: 3.932307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:48,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.42629 samples/s/p 6:34:01 } +2024-07-25 18:33:51,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 216/ 1625], loss: 1.471, per_step_time: 1470ms, lr: 3.969231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:51,161 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.44098 samples/s/p 6:32:55 } +2024-07-25 18:33:54,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 218/ 1625], loss: 1.347, per_step_time: 1473ms, lr: 4.0061536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:54,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.42791 samples/s/p 6:33:48 } +2024-07-25 18:33:57,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 220/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 4.043077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:57,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43729 samples/s/p 6:33:05 } +2024-07-25 18:34:00,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 222/ 1625], loss: 1.240, per_step_time: 1474ms, lr: 4.0799996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:00,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.42673 samples/s/p 6:33:48 } +2024-07-25 18:34:02,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 224/ 1625], loss: 1.427, per_step_time: 1471ms, lr: 4.116923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:02,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43645 samples/s/p 6:33:03 } +2024-07-25 18:34:05,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 226/ 1625], loss: 1.358, per_step_time: 1470ms, lr: 4.153846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:05,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43922 samples/s/p 6:32:48 } +2024-07-25 18:34:08,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 228/ 1625], loss: 1.477, 
per_step_time: 1472ms, lr: 4.1907692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:08,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43402 samples/s/p 6:33:07 } +2024-07-25 18:34:11,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 230/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 4.227692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:11,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.42789 samples/s/p 6:33:31 } +2024-07-25 18:34:14,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 232/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 4.264615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:14,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43140 samples/s/p 6:33:13 } +2024-07-25 18:34:17,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 234/ 1625], loss: 1.391, per_step_time: 1472ms, lr: 4.301538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:17,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43282 samples/s/p 6:33:04 } +2024-07-25 18:34:20,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 236/ 1625], loss: 1.328, per_step_time: 1473ms, lr: 4.338461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:20,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43052 samples/s/p 6:33:11 } +2024-07-25 18:34:23,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 238/ 1625], loss: 1.468, per_step_time: 1472ms, lr: 4.375385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:23,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43449 samples/s/p 6:32:50 } +2024-07-25 18:34:26,592 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 240/ 1625], loss: 1.321, per_step_time: 1472ms, lr: 4.4123076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:26,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43415 samples/s/p 6:32:49 } +2024-07-25 18:34:29,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 242/ 1625], loss: 1.520, per_step_time: 1475ms, lr: 4.449231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:29,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.42216 samples/s/p 6:33:38 } +2024-07-25 18:34:32,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 244/ 1625], loss: 1.365, per_step_time: 1473ms, lr: 4.4861536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:32,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.42943 samples/s/p 6:33:04 } +2024-07-25 18:34:35,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 246/ 1625], loss: 1.449, per_step_time: 1473ms, lr: 4.5230768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:35,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43055 samples/s/p 6:32:56 } +2024-07-25 18:34:38,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 248/ 1625], loss: 1.269, per_step_time: 1471ms, lr: 4.5599995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:38,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43831 samples/s/p 6:32:19 } +2024-07-25 18:34:41,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 250/ 1625], loss: 1.362, per_step_time: 1473ms, lr: 4.596923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:41,361 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43013 samples/s/p 6:32:52 } +2024-07-25 18:34:44,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 252/ 1625], loss: 1.268, per_step_time: 1471ms, lr: 4.633846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:44,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43542 samples/s/p 6:32:26 } +2024-07-25 18:34:47,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 254/ 1625], loss: 1.380, per_step_time: 1472ms, lr: 4.670769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:47,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43215 samples/s/p 6:32:37 } +2024-07-25 18:34:50,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 256/ 1625], loss: 1.206, per_step_time: 1469ms, lr: 4.707692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:50,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.44297 samples/s/p 6:31:47 } +2024-07-25 18:34:53,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 258/ 1625], loss: 1.435, per_step_time: 1472ms, lr: 4.744615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:53,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43454 samples/s/p 6:32:21 } +2024-07-25 18:34:56,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 260/ 1625], loss: 1.525, per_step_time: 1471ms, lr: 4.7815383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:56,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43793 samples/s/p 6:32:03 } +2024-07-25 18:34:59,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 262/ 1625], loss: 1.477, 
per_step_time: 1472ms, lr: 4.8184615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:59,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43154 samples/s/p 6:32:28 } +2024-07-25 18:35:02,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 264/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 4.8553843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:02,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43308 samples/s/p 6:32:18 } +2024-07-25 18:35:04,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 266/ 1625], loss: 1.357, per_step_time: 1472ms, lr: 4.8923075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:04,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43305 samples/s/p 6:32:15 } +2024-07-25 18:35:07,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 268/ 1625], loss: 1.425, per_step_time: 1472ms, lr: 4.9292303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:07,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43124 samples/s/p 6:32:20 } +2024-07-25 18:35:10,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 270/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 4.9661535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:10,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43682 samples/s/p 6:31:53 } +2024-07-25 18:35:13,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 272/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 5.0030767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:13,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43482 samples/s/p 6:31:59 } +2024-07-25 18:35:16,776 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 274/ 1625], loss: 1.197, per_step_time: 1473ms, lr: 5.04e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:16,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43001 samples/s/p 6:32:17 } +2024-07-25 18:35:19,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 276/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 5.0769227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:19,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43537 samples/s/p 6:31:51 } +2024-07-25 18:35:22,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 278/ 1625], loss: 1.270, per_step_time: 1474ms, lr: 5.113846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:22,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.42382 samples/s/p 6:32:38 } +2024-07-25 18:35:25,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 280/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 5.150769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:25,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43646 samples/s/p 6:31:40 } +2024-07-25 18:35:28,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 282/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 5.187692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:28,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43507 samples/s/p 6:31:43 } +2024-07-25 18:35:31,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 284/ 1625], loss: 1.393, per_step_time: 1471ms, lr: 5.2246155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:31,538 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43483 samples/s/p 6:31:41 } +2024-07-25 18:35:34,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 286/ 1625], loss: 1.344, per_step_time: 1471ms, lr: 5.2615383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:34,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43700 samples/s/p 6:31:29 } +2024-07-25 18:35:37,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 288/ 1625], loss: 1.358, per_step_time: 1471ms, lr: 5.2984615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:37,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43590 samples/s/p 6:31:31 } +2024-07-25 18:35:40,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 290/ 1625], loss: 1.326, per_step_time: 1471ms, lr: 5.3353842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:40,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43561 samples/s/p 6:31:29 } +2024-07-25 18:35:43,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 292/ 1625], loss: 1.333, per_step_time: 1473ms, lr: 5.3723074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:43,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.42782 samples/s/p 6:32:00 } +2024-07-25 18:35:46,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 294/ 1625], loss: 1.196, per_step_time: 1474ms, lr: 5.4092307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:46,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.42658 samples/s/p 6:32:02 } +2024-07-25 18:35:49,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 296/ 1625], loss: 1.371, 
per_step_time: 1472ms, lr: 5.446154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:49,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43379 samples/s/p 6:31:28 } +2024-07-25 18:35:52,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 298/ 1625], loss: 1.318, per_step_time: 1472ms, lr: 5.4830766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:52,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43324 samples/s/p 6:31:27 } +2024-07-25 18:35:55,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 300/ 1625], loss: 1.461, per_step_time: 1473ms, lr: 5.52e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:55,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.42892 samples/s/p 6:31:43 } +2024-07-25 18:35:58,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 302/ 1625], loss: 1.233, per_step_time: 1470ms, lr: 5.5569226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:58,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.44009 samples/s/p 6:30:52 } +2024-07-25 18:36:01,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 304/ 1625], loss: 1.507, per_step_time: 1472ms, lr: 5.593846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:01,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43339 samples/s/p 6:31:18 } +2024-07-25 18:36:04,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 306/ 1625], loss: 1.281, per_step_time: 1470ms, lr: 5.630769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:04,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43872 samples/s/p 6:30:52 } +2024-07-25 18:36:06,956 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 308/ 1625], loss: 1.269, per_step_time: 1471ms, lr: 5.667692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:06,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43741 samples/s/p 6:30:55 } +2024-07-25 18:36:09,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 310/ 1625], loss: 1.369, per_step_time: 1471ms, lr: 5.704615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:09,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43624 samples/s/p 6:30:57 } +2024-07-25 18:36:12,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 312/ 1625], loss: 1.359, per_step_time: 1473ms, lr: 5.741538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:12,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43094 samples/s/p 6:31:17 } +2024-07-25 18:36:15,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 314/ 1625], loss: 1.310, per_step_time: 1470ms, lr: 5.778461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:15,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43924 samples/s/p 6:30:38 } +2024-07-25 18:36:18,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 316/ 1625], loss: 1.264, per_step_time: 1471ms, lr: 5.8153846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:18,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43798 samples/s/p 6:30:41 } +2024-07-25 18:36:21,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 318/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 5.8523074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:21,709 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.43752 samples/s/p 6:30:40 } +2024-07-25 18:36:24,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 320/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 5.8892306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:24,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.43271 samples/s/p 6:30:57 } +2024-07-25 18:36:27,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 322/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 5.926154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:27,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.43215 samples/s/p 6:30:57 } +2024-07-25 18:36:30,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 324/ 1625], loss: 1.425, per_step_time: 1470ms, lr: 5.9630765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:30,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.43986 samples/s/p 6:30:21 } +2024-07-25 18:36:33,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 326/ 1625], loss: 1.305, per_step_time: 1470ms, lr: 5.9999998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:33,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.43925 samples/s/p 6:30:20 } +2024-07-25 18:36:36,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 328/ 1625], loss: 1.466, per_step_time: 1472ms, lr: 6.036923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:36,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.43248 samples/s/p 6:30:47 } +2024-07-25 18:36:39,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 330/ 1625], loss: 1.211, 
per_step_time: 1471ms, lr: 6.073846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:39,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.43672 samples/s/p 6:30:25 } +2024-07-25 18:36:42,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 332/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 6.110769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:42,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.43177 samples/s/p 6:30:44 } +2024-07-25 18:36:45,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 334/ 1625], loss: 1.356, per_step_time: 1472ms, lr: 6.147692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:45,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43474 samples/s/p 6:30:28 } +2024-07-25 18:36:48,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 336/ 1625], loss: 1.280, per_step_time: 1472ms, lr: 6.184615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:48,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43146 samples/s/p 6:30:39 } +2024-07-25 18:36:51,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 338/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 6.221538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:51,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43658 samples/s/p 6:30:14 } +2024-07-25 18:36:54,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 340/ 1625], loss: 1.328, per_step_time: 1473ms, lr: 6.2584613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:54,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.42769 samples/s/p 6:30:50 } +2024-07-25 18:36:57,123 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 342/ 1625], loss: 1.366, per_step_time: 1470ms, lr: 6.2953845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:57,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.44054 samples/s/p 6:29:51 } +2024-07-25 18:37:00,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 344/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 6.3323073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:00,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43153 samples/s/p 6:30:27 } +2024-07-25 18:37:03,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 346/ 1625], loss: 1.202, per_step_time: 1473ms, lr: 6.3692305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:03,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43002 samples/s/p 6:30:31 } +2024-07-25 18:37:05,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 348/ 1625], loss: 1.302, per_step_time: 1472ms, lr: 6.4061533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:05,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43319 samples/s/p 6:30:14 } +2024-07-25 18:37:08,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 350/ 1625], loss: 1.340, per_step_time: 1471ms, lr: 6.443077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:08,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43828 samples/s/p 6:29:49 } +2024-07-25 18:37:11,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 352/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 6.4799997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:11,884 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43353 samples/s/p 6:30:07 } +2024-07-25 18:37:14,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 354/ 1625], loss: 1.081, per_step_time: 1473ms, lr: 6.516923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:14,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.42806 samples/s/p 6:30:27 } +2024-07-25 18:37:17,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 356/ 1625], loss: 1.244, per_step_time: 1470ms, lr: 6.5538457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:17,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43890 samples/s/p 6:29:38 } +2024-07-25 18:37:20,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 358/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 6.590769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:20,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43381 samples/s/p 6:29:57 } +2024-07-25 18:37:23,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 360/ 1625], loss: 1.308, per_step_time: 1474ms, lr: 6.6276916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:23,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.42674 samples/s/p 6:30:24 } +2024-07-25 18:37:26,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 362/ 1625], loss: 1.228, per_step_time: 1472ms, lr: 6.6646153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:26,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43442 samples/s/p 6:29:48 } +2024-07-25 18:37:29,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 364/ 1625], loss: 
1.370, per_step_time: 1474ms, lr: 6.7015385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:29,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.42696 samples/s/p 6:30:17 } +2024-07-25 18:37:32,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 366/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 6.7384613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:32,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43815 samples/s/p 6:29:26 } +2024-07-25 18:37:35,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 368/ 1625], loss: 1.162, per_step_time: 1473ms, lr: 6.7753845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:35,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.42755 samples/s/p 6:30:09 } +2024-07-25 18:37:38,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 370/ 1625], loss: 1.162, per_step_time: 1470ms, lr: 6.812307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:38,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43901 samples/s/p 6:29:17 } +2024-07-25 18:37:41,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 372/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 6.8492304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:41,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43742 samples/s/p 6:29:21 } +2024-07-25 18:37:44,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 374/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 6.8861536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:44,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43608 samples/s/p 6:29:23 } +2024-07-25 
18:37:47,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 376/ 1625], loss: 1.060, per_step_time: 1471ms, lr: 6.923077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:47,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43809 samples/s/p 6:29:12 } +2024-07-25 18:37:50,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 378/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 6.9599996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:50,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43566 samples/s/p 6:29:19 } +2024-07-25 18:37:53,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 380/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 6.996923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:53,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43799 samples/s/p 6:29:06 } +2024-07-25 18:37:56,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 382/ 1625], loss: 1.285, per_step_time: 1473ms, lr: 7.0338456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:56,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.42963 samples/s/p 6:29:39 } +2024-07-25 18:37:59,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 384/ 1625], loss: 1.384, per_step_time: 1473ms, lr: 7.0707692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:59,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.42864 samples/s/p 6:29:41 } +2024-07-25 18:38:02,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 386/ 1625], loss: 1.272, per_step_time: 1474ms, lr: 7.107692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:02,069 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.42532 samples/s/p 6:29:52 } +2024-07-25 18:38:05,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 388/ 1625], loss: 1.170, per_step_time: 1483ms, lr: 7.144615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:05,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.39228 samples/s/p 6:32:12 } +2024-07-25 18:38:07,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 390/ 1625], loss: 1.440, per_step_time: 1471ms, lr: 7.181538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:07,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.43656 samples/s/p 6:28:58 } +2024-07-25 18:38:10,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 392/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 7.218461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:10,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.43769 samples/s/p 6:28:50 } +2024-07-25 18:38:13,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 394/ 1625], loss: 1.288, per_step_time: 1473ms, lr: 7.255384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:13,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.42964 samples/s/p 6:29:22 } +2024-07-25 18:38:16,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 396/ 1625], loss: 1.116, per_step_time: 1473ms, lr: 7.2923076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:16,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.43020 samples/s/p 6:29:16 } +2024-07-25 18:38:19,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 398/ 1625], loss: 
1.331, per_step_time: 1470ms, lr: 7.3292304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:19,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.44059 samples/s/p 6:28:29 } +2024-07-25 18:38:22,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 400/ 1625], loss: 1.191, per_step_time: 1473ms, lr: 7.3661536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:22,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43065 samples/s/p 6:29:08 } +2024-07-25 18:38:25,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 402/ 1625], loss: 1.334, per_step_time: 1474ms, lr: 7.4030763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:25,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.42487 samples/s/p 6:29:30 } +2024-07-25 18:38:28,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 404/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 7.4399995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:28,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43585 samples/s/p 6:28:40 } +2024-07-25 18:38:31,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 406/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 7.4769227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:31,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43990 samples/s/p 6:28:20 } +2024-07-25 18:38:34,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 408/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 7.5138464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:34,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43330 samples/s/p 6:28:45 } +2024-07-25 
18:38:37,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 410/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 7.5507687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:37,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43423 samples/s/p 6:28:38 } +2024-07-25 18:38:40,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 412/ 1625], loss: 1.337, per_step_time: 1471ms, lr: 7.587692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:40,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43607 samples/s/p 6:28:28 } +2024-07-25 18:38:43,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 414/ 1625], loss: 1.223, per_step_time: 1470ms, lr: 7.624615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:43,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43909 samples/s/p 6:28:12 } +2024-07-25 18:38:46,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 416/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 7.661539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:46,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.43950 samples/s/p 6:28:07 } +2024-07-25 18:38:49,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 418/ 1625], loss: 1.314, per_step_time: 1470ms, lr: 7.698461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:49,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.44200 samples/s/p 6:27:53 } +2024-07-25 18:38:52,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 420/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 7.735384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:52,256 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.43659 samples/s/p 6:28:14 } +2024-07-25 18:38:55,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 422/ 1625], loss: 1.208, per_step_time: 1470ms, lr: 7.772307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:55,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.43946 samples/s/p 6:27:58 } +2024-07-25 18:38:58,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 424/ 1625], loss: 1.187, per_step_time: 1474ms, lr: 7.809231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:58,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.42668 samples/s/p 6:28:50 } +2024-07-25 18:39:01,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 426/ 1625], loss: 1.136, per_step_time: 1477ms, lr: 7.8461535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:01,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.41433 samples/s/p 6:29:40 } +2024-07-25 18:39:04,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 428/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 7.883076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:04,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.43230 samples/s/p 6:28:20 } +2024-07-25 18:39:07,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 430/ 1625], loss: 1.191, per_step_time: 1469ms, lr: 7.92e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:07,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.44244 samples/s/p 6:27:34 } +2024-07-25 18:39:09,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 432/ 1625], loss: 1.374, 
per_step_time: 1472ms, lr: 7.956923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:09,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43180 samples/s/p 6:28:16 } +2024-07-25 18:39:12,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 434/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 7.993845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:12,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43822 samples/s/p 6:27:46 } +2024-07-25 18:39:15,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 436/ 1625], loss: 1.290, per_step_time: 1469ms, lr: 8.030769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:15,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.44239 samples/s/p 6:27:25 } +2024-07-25 18:39:18,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 438/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 8.067692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:18,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43214 samples/s/p 6:28:06 } +2024-07-25 18:39:21,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 440/ 1625], loss: 1.366, per_step_time: 1471ms, lr: 8.1046155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:21,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43698 samples/s/p 6:27:42 } +2024-07-25 18:39:24,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 442/ 1625], loss: 1.638, per_step_time: 1471ms, lr: 8.141537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:24,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43524 samples/s/p 6:27:47 } +2024-07-25 18:39:27,675 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 444/ 1625], loss: 1.360, per_step_time: 1471ms, lr: 8.178461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:27,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43777 samples/s/p 6:27:33 } +2024-07-25 18:39:30,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 446/ 1625], loss: 1.360, per_step_time: 1471ms, lr: 8.215385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:30,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43740 samples/s/p 6:27:32 } +2024-07-25 18:39:33,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 448/ 1625], loss: 1.467, per_step_time: 1472ms, lr: 8.252307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:33,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.43169 samples/s/p 6:27:53 } +2024-07-25 18:39:36,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 450/ 1625], loss: 1.318, per_step_time: 1473ms, lr: 8.289231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:36,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.42941 samples/s/p 6:28:00 } +2024-07-25 18:39:39,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 452/ 1625], loss: 1.272, per_step_time: 1470ms, lr: 8.326153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:39,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.44094 samples/s/p 6:27:08 } +2024-07-25 18:39:42,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 454/ 1625], loss: 1.189, per_step_time: 1482ms, lr: 8.363077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:42,451 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.39707 samples/s/p 6:30:14 } +2024-07-25 18:39:45,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 456/ 1625], loss: 1.150, per_step_time: 1472ms, lr: 8.399999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:45,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.43317 samples/s/p 6:27:35 } +2024-07-25 18:39:48,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 458/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 8.436923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:48,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.42898 samples/s/p 6:27:50 } +2024-07-25 18:39:51,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 460/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 8.473846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:51,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.43563 samples/s/p 6:27:19 } +2024-07-25 18:39:54,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 462/ 1625], loss: 1.141, per_step_time: 1473ms, lr: 8.510769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:54,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.43036 samples/s/p 6:27:38 } +2024-07-25 18:39:57,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 464/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 8.547692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:57,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43779 samples/s/p 6:27:04 } +2024-07-25 18:40:00,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 466/ 1625], loss: 1.266, 
per_step_time: 1471ms, lr: 8.584615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:00,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43679 samples/s/p 6:27:05 } +2024-07-25 18:40:03,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 468/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 8.621538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:03,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43816 samples/s/p 6:26:56 } +2024-07-25 18:40:06,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 470/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 8.658461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:06,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43690 samples/s/p 6:26:59 } +2024-07-25 18:40:09,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 472/ 1625], loss: 1.276, per_step_time: 1472ms, lr: 8.695384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:09,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43350 samples/s/p 6:27:10 } +2024-07-25 18:40:11,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 474/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 8.732308e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:11,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43560 samples/s/p 6:26:58 } +2024-07-25 18:40:14,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 476/ 1625], loss: 1.107, per_step_time: 1475ms, lr: 8.76923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:14,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.42056 samples/s/p 6:28:00 } +2024-07-25 18:40:17,877 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 478/ 1625], loss: 1.351, per_step_time: 1473ms, lr: 8.806153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:17,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43090 samples/s/p 6:27:12 } +2024-07-25 18:40:20,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 480/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 8.843077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:20,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.44033 samples/s/p 6:26:29 } +2024-07-25 18:40:23,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 482/ 1625], loss: 1.300, per_step_time: 1472ms, lr: 8.88e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:23,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43216 samples/s/p 6:27:01 } +2024-07-25 18:40:26,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 484/ 1625], loss: 1.342, per_step_time: 1476ms, lr: 8.9169225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:26,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.41699 samples/s/p 6:28:03 } +2024-07-25 18:40:29,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 486/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 8.953845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:29,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43783 samples/s/p 6:26:31 } +2024-07-25 18:40:32,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 488/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 8.990769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:32,641 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43171 samples/s/p 6:26:54 } +2024-07-25 18:40:35,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 490/ 1625], loss: 1.332, per_step_time: 1471ms, lr: 9.027692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:35,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43826 samples/s/p 6:26:23 } +2024-07-25 18:40:38,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 492/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 9.064615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:38,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43262 samples/s/p 6:26:44 } +2024-07-25 18:40:41,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 494/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 9.101538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:41,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43524 samples/s/p 6:26:30 } +2024-07-25 18:40:44,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 496/ 1625], loss: 1.359, per_step_time: 1471ms, lr: 9.138461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:44,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43811 samples/s/p 6:26:15 } +2024-07-25 18:40:47,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 498/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 9.175385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:47,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43204 samples/s/p 6:26:38 } +2024-07-25 18:40:50,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 500/ 1625], loss: 1.235, 
per_step_time: 1471ms, lr: 9.212307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:50,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43602 samples/s/p 6:26:18 } +2024-07-25 18:40:53,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 502/ 1625], loss: 1.260, per_step_time: 1473ms, lr: 9.24923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:53,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43096 samples/s/p 6:26:37 } +2024-07-25 18:40:56,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 504/ 1625], loss: 1.320, per_step_time: 1472ms, lr: 9.286154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:56,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43316 samples/s/p 6:26:25 } +2024-07-25 18:40:59,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 506/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 9.3230765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:59,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43354 samples/s/p 6:26:20 } +2024-07-25 18:41:02,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 508/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 9.36e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:02,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43844 samples/s/p 6:25:56 } +2024-07-25 18:41:05,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 510/ 1625], loss: 1.300, per_step_time: 1471ms, lr: 9.396922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:05,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43797 samples/s/p 6:25:55 } +2024-07-25 18:41:08,048 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 512/ 1625], loss: 1.089, per_step_time: 1469ms, lr: 9.433846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:08,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.44262 samples/s/p 6:25:32 } +2024-07-25 18:41:11,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 514/ 1625], loss: 1.214, per_step_time: 1474ms, lr: 9.470769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:11,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.42671 samples/s/p 6:26:37 } +2024-07-25 18:41:13,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 516/ 1625], loss: 1.314, per_step_time: 1480ms, lr: 9.507692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:13,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.40219 samples/s/p 6:28:20 } +2024-07-25 18:41:16,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 518/ 1625], loss: 1.171, per_step_time: 1470ms, lr: 9.544615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:16,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.44009 samples/s/p 6:25:34 } +2024-07-25 18:41:19,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 520/ 1625], loss: 1.191, per_step_time: 1475ms, lr: 9.581538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:19,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.42077 samples/s/p 6:26:54 } +2024-07-25 18:41:22,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 522/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 9.618461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:22,832 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.43417 samples/s/p 6:25:54 } +2024-07-25 18:41:25,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 524/ 1625], loss: 0.990, per_step_time: 1471ms, lr: 9.655385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:25,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.43597 samples/s/p 6:25:43 } +2024-07-25 18:41:28,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 526/ 1625], loss: 1.433, per_step_time: 1471ms, lr: 9.692307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:28,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.43497 samples/s/p 6:25:44 } +2024-07-25 18:41:31,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 528/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 9.72923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:31,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.43938 samples/s/p 6:25:23 } +2024-07-25 18:41:34,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 530/ 1625], loss: 1.409, per_step_time: 1470ms, lr: 9.766153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:34,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43869 samples/s/p 6:25:23 } +2024-07-25 18:41:37,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 532/ 1625], loss: 1.187, per_step_time: 1470ms, lr: 9.803077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:37,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43965 samples/s/p 6:25:16 } +2024-07-25 18:41:40,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 534/ 1625], loss: 1.323, 
per_step_time: 1470ms, lr: 9.839999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:40,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.44168 samples/s/p 6:25:04 } +2024-07-25 18:41:43,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 536/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 9.876922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:43,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43565 samples/s/p 6:25:27 } +2024-07-25 18:41:46,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 538/ 1625], loss: 1.332, per_step_time: 1472ms, lr: 9.913846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:46,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43335 samples/s/p 6:25:34 } +2024-07-25 18:41:49,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 540/ 1625], loss: 1.340, per_step_time: 1471ms, lr: 9.950769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:49,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43844 samples/s/p 6:25:09 } +2024-07-25 18:41:52,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 542/ 1625], loss: 1.315, per_step_time: 1475ms, lr: 9.9876925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:52,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.42166 samples/s/p 6:26:18 } +2024-07-25 18:41:55,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 544/ 1625], loss: 1.386, per_step_time: 1471ms, lr: 1.0024614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:55,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43490 samples/s/p 6:25:18 } +2024-07-25 18:41:58,242 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 546/ 1625], loss: 1.357, per_step_time: 1472ms, lr: 1.0061538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:58,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43186 samples/s/p 6:25:28 } +2024-07-25 18:42:01,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 548/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 1.0098462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:01,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43327 samples/s/p 6:25:19 } +2024-07-25 18:42:04,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 550/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 1.0135384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:04,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43315 samples/s/p 6:25:17 } +2024-07-25 18:42:07,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 552/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 1.0172307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:07,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43784 samples/s/p 6:24:54 } +2024-07-25 18:42:10,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 554/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 1.020923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:10,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43535 samples/s/p 6:25:02 } +2024-07-25 18:42:13,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 556/ 1625], loss: 1.024, per_step_time: 1473ms, lr: 1.0246154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:13,000 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43031 samples/s/p 6:25:20 } +2024-07-25 18:42:15,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 558/ 1625], loss: 1.404, per_step_time: 1472ms, lr: 1.0283077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:15,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43191 samples/s/p 6:25:10 } +2024-07-25 18:42:18,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 560/ 1625], loss: 1.367, per_step_time: 1472ms, lr: 1.0319999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:18,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43184 samples/s/p 6:25:08 } +2024-07-25 18:42:21,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 562/ 1625], loss: 1.342, per_step_time: 1471ms, lr: 1.0356923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:21,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43501 samples/s/p 6:24:51 } +2024-07-25 18:42:24,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 564/ 1625], loss: 1.162, per_step_time: 1470ms, lr: 1.03938455e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:24,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.44064 samples/s/p 6:24:24 } +2024-07-25 18:42:27,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 566/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 1.0430769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:27,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43790 samples/s/p 6:24:33 } +2024-07-25 18:42:30,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 568/ 1625], loss: 
1.177, per_step_time: 1471ms, lr: 1.0467691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:30,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43716 samples/s/p 6:24:33 } +2024-07-25 18:42:33,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 570/ 1625], loss: 1.408, per_step_time: 1472ms, lr: 1.0504615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:33,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43216 samples/s/p 6:24:52 } +2024-07-25 18:42:36,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 572/ 1625], loss: 1.139, per_step_time: 1473ms, lr: 1.0541538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:36,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.42872 samples/s/p 6:25:03 } +2024-07-25 18:42:39,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 574/ 1625], loss: 1.327, per_step_time: 1472ms, lr: 1.0578461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:39,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43203 samples/s/p 6:24:46 } +2024-07-25 18:42:42,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 576/ 1625], loss: 1.260, per_step_time: 1473ms, lr: 1.0615384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:42,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.42743 samples/s/p 6:25:03 } +2024-07-25 18:42:45,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 578/ 1625], loss: 1.248, per_step_time: 1475ms, lr: 1.0652307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:45,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.42075 samples/s/p 6:25:28 } +2024-07-25 
18:42:48,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 580/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.068923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:48,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43452 samples/s/p 6:24:27 } +2024-07-25 18:42:51,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 582/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 1.0726154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:51,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43410 samples/s/p 6:24:26 } +2024-07-25 18:42:54,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 584/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 1.0763077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:54,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43494 samples/s/p 6:24:19 } +2024-07-25 18:42:57,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 586/ 1625], loss: 1.369, per_step_time: 1471ms, lr: 1.07999995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:57,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43827 samples/s/p 6:24:02 } +2024-07-25 18:43:00,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 588/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.0836922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:00,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43645 samples/s/p 6:24:07 } +2024-07-25 18:43:03,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 590/ 1625], loss: 1.279, per_step_time: 1473ms, lr: 1.0873846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:03,184 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.42962 samples/s/p 6:24:33 } +2024-07-25 18:43:06,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 592/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 1.091077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:06,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43610 samples/s/p 6:24:02 } +2024-07-25 18:43:09,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 594/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 1.0947691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:09,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43227 samples/s/p 6:24:16 } +2024-07-25 18:43:12,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 596/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 1.0984615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:12,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43086 samples/s/p 6:24:19 } +2024-07-25 18:43:14,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 598/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 1.1021538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:14,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43473 samples/s/p 6:23:59 } +2024-07-25 18:43:17,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 600/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 1.10584615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:17,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.42938 samples/s/p 6:24:19 } +2024-07-25 18:43:20,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 602/ 1625], loss: 
1.235, per_step_time: 1471ms, lr: 1.1095383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:20,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43519 samples/s/p 6:23:52 } +2024-07-25 18:43:23,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 604/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 1.1132307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:23,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43840 samples/s/p 6:23:35 } +2024-07-25 18:43:26,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 606/ 1625], loss: 1.288, per_step_time: 1471ms, lr: 1.1169231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:26,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43773 samples/s/p 6:23:35 } +2024-07-25 18:43:29,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 608/ 1625], loss: 1.268, per_step_time: 1472ms, lr: 1.1206153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:29,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43446 samples/s/p 6:23:46 } +2024-07-25 18:43:32,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 610/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 1.1243076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:32,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43810 samples/s/p 6:23:28 } +2024-07-25 18:43:35,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 612/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.1279999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:35,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43520 samples/s/p 6:23:37 } +2024-07-25 
18:43:38,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 614/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 1.1316923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:38,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43292 samples/s/p 6:23:44 } +2024-07-25 18:43:41,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 616/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.1353846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:41,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43804 samples/s/p 6:23:19 } +2024-07-25 18:43:44,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 618/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 1.1390768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:44,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43698 samples/s/p 6:23:21 } +2024-07-25 18:43:47,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 620/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 1.1427692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:47,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43286 samples/s/p 6:23:35 } +2024-07-25 18:43:50,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 622/ 1625], loss: 1.363, per_step_time: 1472ms, lr: 1.14646145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:50,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43330 samples/s/p 6:23:30 } +2024-07-25 18:43:53,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 624/ 1625], loss: 1.160, per_step_time: 1474ms, lr: 1.1501538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:53,361 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.42507 samples/s/p 6:24:02 } +2024-07-25 18:43:56,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 626/ 1625], loss: 1.219, per_step_time: 1470ms, lr: 1.1538462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:56,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43967 samples/s/p 6:22:57 } +2024-07-25 18:43:59,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 628/ 1625], loss: 1.308, per_step_time: 1472ms, lr: 1.1575384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:59,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43477 samples/s/p 6:23:15 } +2024-07-25 18:44:02,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 630/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 1.1612307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:02,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43142 samples/s/p 6:23:26 } +2024-07-25 18:44:05,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 632/ 1625], loss: 1.094, per_step_time: 1475ms, lr: 1.164923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:05,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.42082 samples/s/p 6:24:08 } +2024-07-25 18:44:08,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 634/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 1.1686154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:08,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43504 samples/s/p 6:23:05 } +2024-07-25 18:44:11,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 636/ 1625], loss: 
1.196, per_step_time: 1472ms, lr: 1.1723076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:11,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43245 samples/s/p 6:23:13 } +2024-07-25 18:44:14,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 638/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 1.1759999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:14,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43510 samples/s/p 6:22:59 } +2024-07-25 18:44:16,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 640/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 1.1796923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:16,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.44146 samples/s/p 6:22:29 } +2024-07-25 18:44:19,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 642/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 1.1833846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:19,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.43496 samples/s/p 6:22:54 } +2024-07-25 18:44:22,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 644/ 1625], loss: 1.335, per_step_time: 1472ms, lr: 1.18707685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:22,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.43208 samples/s/p 6:23:03 } +2024-07-25 18:44:25,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 646/ 1625], loss: 1.225, per_step_time: 1470ms, lr: 1.1907691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:25,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.44026 samples/s/p 6:22:25 } +2024-07-25 
18:44:28,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 648/ 1625], loss: 1.067, per_step_time: 1471ms, lr: 1.1944615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:28,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.43714 samples/s/p 6:22:36 } +2024-07-25 18:44:31,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 650/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 1.1981539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:31,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43598 samples/s/p 6:22:38 } +2024-07-25 18:44:34,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 652/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 1.201846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:34,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43068 samples/s/p 6:22:57 } +2024-07-25 18:44:37,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 654/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 1.2055384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:37,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43510 samples/s/p 6:22:35 } +2024-07-25 18:44:40,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 656/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 1.2092307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:40,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43576 samples/s/p 6:22:30 } +2024-07-25 18:44:43,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 658/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 1.21292305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:43,533 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43296 samples/s/p 6:22:39 } +2024-07-25 18:44:46,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 660/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 1.2166153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:46,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43908 samples/s/p 6:22:10 } +2024-07-25 18:44:49,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 662/ 1625], loss: 1.351, per_step_time: 1473ms, lr: 1.2203076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:49,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43058 samples/s/p 6:22:43 } +2024-07-25 18:44:52,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 664/ 1625], loss: 1.231, per_step_time: 1469ms, lr: 1.224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:52,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.44228 samples/s/p 6:21:50 } +2024-07-25 18:44:55,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 666/ 1625], loss: 1.153, per_step_time: 1474ms, lr: 1.22769225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:55,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.42535 samples/s/p 6:22:59 } +2024-07-25 18:44:58,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 668/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 1.2313846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:58,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43427 samples/s/p 6:22:18 } +2024-07-25 18:45:01,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 670/ 1625], 
loss: 1.173, per_step_time: 1472ms, lr: 1.2350769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:01,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43469 samples/s/p 6:22:14 } +2024-07-25 18:45:04,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 672/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 1.2387692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:04,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43174 samples/s/p 6:22:23 } +2024-07-25 18:45:07,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 674/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 1.2424615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:07,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43543 samples/s/p 6:22:05 } +2024-07-25 18:45:10,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 676/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 1.2461538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:10,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43187 samples/s/p 6:22:17 } +2024-07-25 18:45:13,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 678/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.2498461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:13,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43282 samples/s/p 6:22:10 } +2024-07-25 18:45:16,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 680/ 1625], loss: 1.174, per_step_time: 1481ms, lr: 1.2535384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:16,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.40139 samples/s/p 6:24:20 } 
+2024-07-25 18:45:18,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 682/ 1625], loss: 1.045, per_step_time: 1471ms, lr: 1.2572307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:18,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43786 samples/s/p 6:21:43 } +2024-07-25 18:45:21,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 684/ 1625], loss: 1.305, per_step_time: 1470ms, lr: 1.2609231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:21,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43974 samples/s/p 6:21:32 } +2024-07-25 18:45:24,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 686/ 1625], loss: 1.252, per_step_time: 1470ms, lr: 1.2646153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:24,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43930 samples/s/p 6:21:31 } +2024-07-25 18:45:27,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 688/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.2683076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:27,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43444 samples/s/p 6:21:48 } +2024-07-25 18:45:30,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 690/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.2719999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:30,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43549 samples/s/p 6:21:41 } +2024-07-25 18:45:33,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 692/ 1625], loss: 1.014, per_step_time: 1470ms, lr: 1.2756923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
18:45:33,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43926 samples/s/p 6:21:22 } +2024-07-25 18:45:36,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 694/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 1.2793846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:36,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.42943 samples/s/p 6:22:01 } +2024-07-25 18:45:39,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 696/ 1625], loss: 1.387, per_step_time: 1471ms, lr: 1.2830768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:39,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43612 samples/s/p 6:21:29 } +2024-07-25 18:45:42,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 698/ 1625], loss: 1.554, per_step_time: 1472ms, lr: 1.2867692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:42,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43140 samples/s/p 6:21:46 } +2024-07-25 18:45:45,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 700/ 1625], loss: 1.227, per_step_time: 1470ms, lr: 1.2904615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:45,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43971 samples/s/p 6:21:08 } +2024-07-25 18:45:48,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 702/ 1625], loss: 1.271, per_step_time: 1470ms, lr: 1.29415375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:48,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.44018 samples/s/p 6:21:03 } +2024-07-25 18:45:51,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 704/ 1625], loss: 1.303, per_step_time: 1472ms, lr: 1.2978461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:51,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43203 samples/s/p 6:21:35 } +2024-07-25 18:45:54,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 706/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 1.3015384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:54,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43604 samples/s/p 6:21:15 } +2024-07-25 18:45:57,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 708/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 1.3052308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:57,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43104 samples/s/p 6:21:33 } +2024-07-25 18:46:00,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 710/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 1.308923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:00,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43326 samples/s/p 6:21:21 } +2024-07-25 18:46:03,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 712/ 1625], loss: 1.294, per_step_time: 1472ms, lr: 1.3126153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:03,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43241 samples/s/p 6:21:21 } +2024-07-25 18:46:06,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 714/ 1625], loss: 1.334, per_step_time: 1472ms, lr: 1.3163076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:06,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43112 samples/s/p 
6:21:24 } +2024-07-25 18:46:09,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 716/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.32e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:09,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43679 samples/s/p 6:20:57 } +2024-07-25 18:46:12,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 718/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.3236923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:12,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43662 samples/s/p 6:20:55 } +2024-07-25 18:46:15,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 720/ 1625], loss: 1.106, per_step_time: 1474ms, lr: 1.3273845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:15,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.42666 samples/s/p 6:21:34 } +2024-07-25 18:46:17,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 722/ 1625], loss: 1.184, per_step_time: 1473ms, lr: 1.3310769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:17,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.42925 samples/s/p 6:21:20 } +2024-07-25 18:46:20,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 724/ 1625], loss: 1.268, per_step_time: 1473ms, lr: 1.33476915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:20,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.42767 samples/s/p 6:21:24 } +2024-07-25 18:46:23,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 726/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 1.3384615e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 18:46:23,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43650 samples/s/p 6:20:44 } +2024-07-25 18:46:26,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 728/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 1.3421538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:26,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43940 samples/s/p 6:20:28 } +2024-07-25 18:46:29,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 730/ 1625], loss: 1.048, per_step_time: 1470ms, lr: 1.3458461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:29,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43873 samples/s/p 6:20:28 } +2024-07-25 18:46:32,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 732/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 1.3495384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:32,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.42898 samples/s/p 6:21:06 } +2024-07-25 18:46:35,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 734/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.3532307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:35,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43563 samples/s/p 6:20:36 } +2024-07-25 18:46:38,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 736/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 1.356923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:38,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43743 samples/s/p 6:20:25 } +2024-07-25 18:46:41,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 
10], step:[ 738/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 1.36061535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:41,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43231 samples/s/p 6:20:44 } +2024-07-25 18:46:44,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 740/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 1.3643076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:44,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43225 samples/s/p 6:20:41 } +2024-07-25 18:46:47,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 742/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 1.368e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:47,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43790 samples/s/p 6:20:14 } +2024-07-25 18:46:50,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 744/ 1625], loss: 1.380, per_step_time: 1472ms, lr: 1.3716922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:50,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43333 samples/s/p 6:20:30 } +2024-07-25 18:46:53,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 746/ 1625], loss: 1.155, per_step_time: 1469ms, lr: 1.3753845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:53,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.44225 samples/s/p 6:19:50 } +2024-07-25 18:46:56,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 748/ 1625], loss: 1.283, per_step_time: 1472ms, lr: 1.3790768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:56,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43305 
samples/s/p 6:20:26 } +2024-07-25 18:46:59,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 750/ 1625], loss: 1.363, per_step_time: 1471ms, lr: 1.3827692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:59,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43617 samples/s/p 6:20:10 } +2024-07-25 18:47:02,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 752/ 1625], loss: 0.935, per_step_time: 1470ms, lr: 1.38646155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:02,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43885 samples/s/p 6:19:56 } +2024-07-25 18:47:05,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 754/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 1.3901537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:05,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43804 samples/s/p 6:19:56 } +2024-07-25 18:47:08,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 756/ 1625], loss: 1.103, per_step_time: 1471ms, lr: 1.3938461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:08,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43747 samples/s/p 6:19:55 } +2024-07-25 18:47:11,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 758/ 1625], loss: 1.241, per_step_time: 1480ms, lr: 1.3975384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:11,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.40310 samples/s/p 6:22:17 } +2024-07-25 18:47:14,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 760/ 1625], loss: 1.270, per_step_time: 1470ms, lr: 1.40123075e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 18:47:14,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.44038 samples/s/p 6:19:37 } +2024-07-25 18:47:17,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 762/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 1.404923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:17,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43293 samples/s/p 6:20:06 } +2024-07-25 18:47:19,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 764/ 1625], loss: 1.331, per_step_time: 1471ms, lr: 1.4086153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:19,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43616 samples/s/p 6:19:49 } +2024-07-25 18:47:22,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 766/ 1625], loss: 1.412, per_step_time: 1472ms, lr: 1.4123077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:22,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43301 samples/s/p 6:19:59 } +2024-07-25 18:47:25,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 768/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.4159999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:25,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43206 samples/s/p 6:20:00 } +2024-07-25 18:47:28,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 770/ 1625], loss: 1.398, per_step_time: 1473ms, lr: 1.4196922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:28,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.42901 samples/s/p 6:20:10 } +2024-07-25 18:47:31,790 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 1/ 10], step:[ 772/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.4233846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:31,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43229 samples/s/p 6:19:54 } +2024-07-25 18:47:34,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 774/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 1.4270769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:34,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43550 samples/s/p 6:19:37 } +2024-07-25 18:47:37,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 776/ 1625], loss: 1.196, per_step_time: 1474ms, lr: 1.4307692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:37,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.42449 samples/s/p 6:20:20 } +2024-07-25 18:47:40,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 778/ 1625], loss: 1.310, per_step_time: 1472ms, lr: 1.4344614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:40,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43273 samples/s/p 6:19:43 } +2024-07-25 18:47:43,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 780/ 1625], loss: 1.282, per_step_time: 1470ms, lr: 1.4381538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:43,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43855 samples/s/p 6:19:16 } +2024-07-25 18:47:46,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 782/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 1.44184605e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:46,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% 
|██ | 5.43400 samples/s/p 6:19:32 } +2024-07-25 18:47:49,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 784/ 1625], loss: 1.322, per_step_time: 1471ms, lr: 1.4455384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:49,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43702 samples/s/p 6:19:16 } +2024-07-25 18:47:52,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 786/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.4492307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:52,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43188 samples/s/p 6:19:35 } +2024-07-25 18:47:55,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 788/ 1625], loss: 1.232, per_step_time: 1477ms, lr: 1.452923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:55,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.41477 samples/s/p 6:20:44 } +2024-07-25 18:47:58,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 790/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 1.4566153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:58,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43246 samples/s/p 6:19:26 } +2024-07-25 18:48:01,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 792/ 1625], loss: 1.109, per_step_time: 1471ms, lr: 1.4603076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:01,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43564 samples/s/p 6:19:10 } +2024-07-25 18:48:04,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 794/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 1.464e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:48:04,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.44107 samples/s/p 6:18:44 } +2024-07-25 18:48:07,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 796/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 1.4676923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:07,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43270 samples/s/p 6:19:16 } +2024-07-25 18:48:10,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 798/ 1625], loss: 1.349, per_step_time: 1473ms, lr: 1.4713845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:10,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43060 samples/s/p 6:19:22 } +2024-07-25 18:48:13,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 800/ 1625], loss: 1.090, per_step_time: 1470ms, lr: 1.4750769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:13,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.44184 samples/s/p 6:18:32 } +2024-07-25 18:48:16,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 802/ 1625], loss: 1.266, per_step_time: 1473ms, lr: 1.4787692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:16,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43101 samples/s/p 6:19:15 } +2024-07-25 18:48:19,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 804/ 1625], loss: 1.271, per_step_time: 1473ms, lr: 1.48246145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:19,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.42841 samples/s/p 6:19:23 } +2024-07-25 18:48:21,977 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 806/ 1625], loss: 1.011, per_step_time: 1470ms, lr: 1.4861538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:21,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43872 samples/s/p 6:18:37 } +2024-07-25 18:48:24,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 808/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.4898461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:24,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43376 samples/s/p 6:18:54 } +2024-07-25 18:48:27,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 810/ 1625], loss: 1.356, per_step_time: 1472ms, lr: 1.4935385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:27,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43316 samples/s/p 6:18:54 } +2024-07-25 18:48:30,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 812/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.4972306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:30,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43530 samples/s/p 6:18:42 } +2024-07-25 18:48:33,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 814/ 1625], loss: 1.210, per_step_time: 1471ms, lr: 1.500923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:33,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43671 samples/s/p 6:18:33 } +2024-07-25 18:48:36,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 816/ 1625], loss: 1.139, per_step_time: 1470ms, lr: 1.5046153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:36,730 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.44077 samples/s/p 6:18:13 } +2024-07-25 18:48:39,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 818/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 1.50830765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:39,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43059 samples/s/p 6:18:53 } +2024-07-25 18:48:42,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 820/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 1.512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:42,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.42855 samples/s/p 6:18:59 } +2024-07-25 18:48:45,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 822/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.5156923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:45,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43520 samples/s/p 6:18:28 } +2024-07-25 18:48:48,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 824/ 1625], loss: 1.263, per_step_time: 1473ms, lr: 1.5193845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:48,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.42910 samples/s/p 6:18:50 } +2024-07-25 18:48:51,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 826/ 1625], loss: 1.060, per_step_time: 1470ms, lr: 1.52307675e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:51,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.44127 samples/s/p 6:17:57 } +2024-07-25 18:48:54,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 828/ 1625], 
loss: 1.136, per_step_time: 1472ms, lr: 1.5267691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:54,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43141 samples/s/p 6:18:35 } +2024-07-25 18:48:57,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 830/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.5304615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:57,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43455 samples/s/p 6:18:19 } +2024-07-25 18:49:00,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 832/ 1625], loss: 1.263, per_step_time: 1473ms, lr: 1.5341539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:00,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43104 samples/s/p 6:18:30 } +2024-07-25 18:49:03,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 834/ 1625], loss: 1.070, per_step_time: 1470ms, lr: 1.537846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:03,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43889 samples/s/p 6:17:55 } +2024-07-25 18:49:06,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 836/ 1625], loss: 1.266, per_step_time: 1473ms, lr: 1.5415384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:06,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43030 samples/s/p 6:18:28 } +2024-07-25 18:49:09,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 838/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 1.5452308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:09,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43654 samples/s/p 6:17:59 } 
+2024-07-25 18:49:12,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 840/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 1.5489231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:12,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43340 samples/s/p 6:18:09 } +2024-07-25 18:49:15,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 842/ 1625], loss: 1.164, per_step_time: 1470ms, lr: 1.5526153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:15,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43876 samples/s/p 6:17:43 } +2024-07-25 18:49:18,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 844/ 1625], loss: 1.305, per_step_time: 1471ms, lr: 1.5563075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:18,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43630 samples/s/p 6:17:51 } +2024-07-25 18:49:21,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 846/ 1625], loss: 1.285, per_step_time: 1471ms, lr: 1.5599999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:21,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43823 samples/s/p 6:17:40 } +2024-07-25 18:49:23,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 848/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 1.5636922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:23,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43737 samples/s/p 6:17:40 } +2024-07-25 18:49:26,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 850/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 1.5673846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
18:49:26,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43404 samples/s/p 6:17:51 } +2024-07-25 18:49:29,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 852/ 1625], loss: 1.398, per_step_time: 1470ms, lr: 1.571077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:29,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.44196 samples/s/p 6:17:15 } +2024-07-25 18:49:32,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 854/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 1.5747692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:32,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.43209 samples/s/p 6:17:54 } +2024-07-25 18:49:35,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 856/ 1625], loss: 1.182, per_step_time: 1474ms, lr: 1.5784615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:35,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.42607 samples/s/p 6:18:16 } +2024-07-25 18:49:38,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 858/ 1625], loss: 1.099, per_step_time: 1470ms, lr: 1.5821537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:38,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.44119 samples/s/p 6:17:10 } +2024-07-25 18:49:41,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 860/ 1625], loss: 1.126, per_step_time: 1469ms, lr: 1.585846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:41,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.44582 samples/s/p 6:16:48 } +2024-07-25 18:49:44,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
862/ 1625], loss: 1.296, per_step_time: 1480ms, lr: 1.5895384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:44,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.40508 samples/s/p 6:19:35 } +2024-07-25 18:49:47,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 864/ 1625], loss: 1.288, per_step_time: 1473ms, lr: 1.5932306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:47,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.42970 samples/s/p 6:17:49 } +2024-07-25 18:49:50,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 866/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 1.596923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:50,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.43356 samples/s/p 6:17:30 } +2024-07-25 18:49:53,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 868/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.6006154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:53,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.43621 samples/s/p 6:17:16 } +2024-07-25 18:49:56,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 870/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 1.6043077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:56,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43950 samples/s/p 6:16:59 } +2024-07-25 18:49:59,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 872/ 1625], loss: 1.030, per_step_time: 1472ms, lr: 1.608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:59,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43392 samples/s/p 6:17:20 } 
+2024-07-25 18:50:02,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 874/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.6116921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:02,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43498 samples/s/p 6:17:12 } +2024-07-25 18:50:05,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 876/ 1625], loss: 1.141, per_step_time: 1470ms, lr: 1.6153845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:05,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.44090 samples/s/p 6:16:45 } +2024-07-25 18:50:08,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 878/ 1625], loss: 1.306, per_step_time: 1473ms, lr: 1.6190768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:08,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.42754 samples/s/p 6:17:37 } +2024-07-25 18:50:11,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 880/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 1.6227692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:11,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43104 samples/s/p 6:17:20 } +2024-07-25 18:50:14,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 882/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 1.6264614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:14,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.44044 samples/s/p 6:16:38 } +2024-07-25 18:50:17,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 884/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 1.6301537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
18:50:17,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43296 samples/s/p 6:17:06 } +2024-07-25 18:50:20,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 886/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 1.6338461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:20,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.44140 samples/s/p 6:16:28 } +2024-07-25 18:50:22,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 888/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 1.6375385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:22,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.42957 samples/s/p 6:17:14 } +2024-07-25 18:50:25,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 890/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 1.6412308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:25,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43461 samples/s/p 6:16:50 } +2024-07-25 18:50:28,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 892/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 1.6449228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:28,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43792 samples/s/p 6:16:33 } +2024-07-25 18:50:31,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 894/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 1.6486152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:31,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43291 samples/s/p 6:16:51 } +2024-07-25 18:50:34,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 896/ 1625], loss: 1.447, per_step_time: 1474ms, lr: 1.6523076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:34,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.42427 samples/s/p 6:17:24 } +2024-07-25 18:50:37,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 898/ 1625], loss: 1.452, per_step_time: 1471ms, lr: 1.656e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:37,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43625 samples/s/p 6:16:32 } +2024-07-25 18:50:40,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 900/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 1.6596923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:40,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43633 samples/s/p 6:16:28 } +2024-07-25 18:50:43,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 902/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 1.6633845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:43,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43422 samples/s/p 6:16:34 } +2024-07-25 18:50:46,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 904/ 1625], loss: 1.327, per_step_time: 1470ms, lr: 1.6670769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:46,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.44037 samples/s/p 6:16:06 } +2024-07-25 18:50:49,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 906/ 1625], loss: 1.376, per_step_time: 1470ms, lr: 1.6707692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:49,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43929 samples/s/p 
6:16:07 } +2024-07-25 18:50:52,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 908/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.6744614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:52,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43836 samples/s/p 6:16:08 } +2024-07-25 18:50:55,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 910/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.6781538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:55,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43435 samples/s/p 6:16:22 } +2024-07-25 18:50:58,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 912/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 1.681846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:58,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43619 samples/s/p 6:16:11 } +2024-07-25 18:51:01,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 914/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 1.6855383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:01,347 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.44019 samples/s/p 6:15:52 } +2024-07-25 18:51:04,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 916/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 1.6892307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:04,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43231 samples/s/p 6:16:21 } +2024-07-25 18:51:07,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 918/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 1.692923e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 18:51:07,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43618 samples/s/p 6:16:02 } +2024-07-25 18:51:10,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 920/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 1.6966154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:10,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43220 samples/s/p 6:16:16 } +2024-07-25 18:51:13,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 922/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 1.7003076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:13,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43487 samples/s/p 6:16:02 } +2024-07-25 18:51:16,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 924/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 1.704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:16,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43125 samples/s/p 6:16:14 } +2024-07-25 18:51:19,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 926/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 1.7076922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:19,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43785 samples/s/p 6:15:44 } +2024-07-25 18:51:22,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 928/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 1.7113845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:22,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43590 samples/s/p 6:15:49 } +2024-07-25 18:51:24,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 
10], step:[ 930/ 1625], loss: 1.207, per_step_time: 1470ms, lr: 1.7150769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:24,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.44017 samples/s/p 6:15:28 } +2024-07-25 18:51:27,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 932/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 1.718769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:27,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43952 samples/s/p 6:15:28 } +2024-07-25 18:51:30,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 934/ 1625], loss: 1.250, per_step_time: 1471ms, lr: 1.7224615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:30,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43652 samples/s/p 6:15:37 } +2024-07-25 18:51:33,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 936/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 1.7261538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:33,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43420 samples/s/p 6:15:44 } +2024-07-25 18:51:36,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 938/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 1.7298462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:36,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43064 samples/s/p 6:15:56 } +2024-07-25 18:51:39,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 940/ 1625], loss: 1.385, per_step_time: 1471ms, lr: 1.7335384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:39,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43511 
samples/s/p 6:15:34 } +2024-07-25 18:51:42,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 942/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.7372306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:42,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43827 samples/s/p 6:15:18 } +2024-07-25 18:51:45,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 944/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 1.740923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:45,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43592 samples/s/p 6:15:25 } +2024-07-25 18:51:48,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 946/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 1.7446153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:48,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43143 samples/s/p 6:15:41 } +2024-07-25 18:51:51,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 948/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 1.7483077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:51,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43416 samples/s/p 6:15:27 } +2024-07-25 18:51:54,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 950/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 1.7519998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:54,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.42783 samples/s/p 6:15:50 } +2024-07-25 18:51:57,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 952/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 1.7556922e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 18:51:57,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.44131 samples/s/p 6:14:51 } +2024-07-25 18:52:00,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 954/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.7593846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:00,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43276 samples/s/p 6:15:24 } +2024-07-25 18:52:03,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 956/ 1625], loss: 1.166, per_step_time: 1470ms, lr: 1.763077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:03,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43892 samples/s/p 6:14:55 } +2024-07-25 18:52:06,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 958/ 1625], loss: 1.321, per_step_time: 1471ms, lr: 1.7667691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:06,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43525 samples/s/p 6:15:07 } +2024-07-25 18:52:09,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 960/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 1.7704613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:09,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43035 samples/s/p 6:15:25 } +2024-07-25 18:52:12,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 962/ 1625], loss: 0.985, per_step_time: 1470ms, lr: 1.7741537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:12,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43964 samples/s/p 6:14:43 } +2024-07-25 18:52:15,123 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 1/ 10], step:[ 964/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 1.777846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:15,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43296 samples/s/p 6:15:08 } +2024-07-25 18:52:18,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 966/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 1.7815384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:18,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43520 samples/s/p 6:14:56 } +2024-07-25 18:52:21,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 968/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 1.7852308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:21,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.43761 samples/s/p 6:14:43 } +2024-07-25 18:52:23,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 970/ 1625], loss: 1.283, per_step_time: 1472ms, lr: 1.788923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:23,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.43205 samples/s/p 6:15:03 } +2024-07-25 18:52:26,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 972/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 1.7926153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:26,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.43149 samples/s/p 6:15:02 } +2024-07-25 18:52:29,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 974/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 1.7963077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:29,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ 
| 5.43045 samples/s/p 6:15:04 } +2024-07-25 18:52:32,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 976/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 1.7999999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:32,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.43118 samples/s/p 6:14:58 } +2024-07-25 18:52:35,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 978/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 1.8036922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:35,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.44207 samples/s/p 6:14:10 } +2024-07-25 18:52:38,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 980/ 1625], loss: 1.142, per_step_time: 1482ms, lr: 1.8073844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:38,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.39657 samples/s/p 6:17:16 } +2024-07-25 18:52:41,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 982/ 1625], loss: 1.345, per_step_time: 1473ms, lr: 1.8110768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:41,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.42876 samples/s/p 6:14:59 } +2024-07-25 18:52:44,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 984/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 1.8147692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:44,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43486 samples/s/p 6:14:31 } +2024-07-25 18:52:47,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 986/ 1625], loss: 1.310, per_step_time: 1470ms, lr: 1.8184615e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:52:47,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.44020 samples/s/p 6:14:06 } +2024-07-25 18:52:50,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 988/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 1.8221539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:50,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43520 samples/s/p 6:14:23 } +2024-07-25 18:52:53,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 990/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 1.825846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:53,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43331 samples/s/p 6:14:28 } +2024-07-25 18:52:56,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 992/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 1.8295383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:56,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43294 samples/s/p 6:14:27 } +2024-07-25 18:52:59,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 994/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.8332306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:59,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43721 samples/s/p 6:14:06 } +2024-07-25 18:53:02,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 996/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 1.836923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:02,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43057 samples/s/p 6:14:31 } +2024-07-25 18:53:05,317 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 998/ 1625], loss: 1.314, per_step_time: 1471ms, lr: 1.8406154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:05,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43557 samples/s/p 6:14:07 } +2024-07-25 18:53:08,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1000/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 1.8443076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:08,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43868 samples/s/p 6:13:51 } +2024-07-25 18:53:11,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1002/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 1.848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:11,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43340 samples/s/p 6:14:10 } +2024-07-25 18:53:14,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1004/ 1625], loss: 1.311, per_step_time: 1474ms, lr: 1.8516923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:14,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.42667 samples/s/p 6:14:35 } +2024-07-25 18:53:17,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1006/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 1.8553847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:17,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43215 samples/s/p 6:14:10 } +2024-07-25 18:53:20,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1008/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 1.859077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:20,077 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43352 samples/s/p 6:14:01 } +2024-07-25 18:53:23,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1010/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 1.862769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:23,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43564 samples/s/p 6:13:49 } +2024-07-25 18:53:25,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1012/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 1.8664614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:25,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43991 samples/s/p 6:13:29 } +2024-07-25 18:53:28,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1014/ 1625], loss: 1.070, per_step_time: 1469ms, lr: 1.8701538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:28,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.44298 samples/s/p 6:13:13 } +2024-07-25 18:53:31,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1016/ 1625], loss: 1.289, per_step_time: 1470ms, lr: 1.8738461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:31,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43906 samples/s/p 6:13:26 } +2024-07-25 18:53:34,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1018/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 1.8775383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:34,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43090 samples/s/p 6:13:57 } +2024-07-25 18:53:37,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1020/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 1.8812307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:37,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43668 samples/s/p 6:13:30 } +2024-07-25 18:53:40,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1022/ 1625], loss: 1.230, per_step_time: 1473ms, lr: 1.884923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:40,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43054 samples/s/p 6:13:53 } +2024-07-25 18:53:43,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1024/ 1625], loss: 1.329, per_step_time: 1472ms, lr: 1.8886154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:43,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43190 samples/s/p 6:13:44 } +2024-07-25 18:53:46,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1026/ 1625], loss: 1.394, per_step_time: 1470ms, lr: 1.8923076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:46,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.44152 samples/s/p 6:13:01 } +2024-07-25 18:53:49,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1028/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.8959998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:49,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43810 samples/s/p 6:13:13 } +2024-07-25 18:53:52,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1030/ 1625], loss: 1.047, per_step_time: 1471ms, lr: 1.8996921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:52,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43538 
samples/s/p 6:13:21 } +2024-07-25 18:53:55,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1032/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.9033845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:55,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.43549 samples/s/p 6:13:17 } +2024-07-25 18:53:58,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1034/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 1.9070769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:58,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.43613 samples/s/p 6:13:12 } +2024-07-25 18:54:01,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1036/ 1625], loss: 1.235, per_step_time: 1476ms, lr: 1.9107692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:01,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.41773 samples/s/p 6:14:25 } +2024-07-25 18:54:04,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1038/ 1625], loss: 1.303, per_step_time: 1474ms, lr: 1.9144614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:04,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.42412 samples/s/p 6:13:56 } +2024-07-25 18:54:07,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1040/ 1625], loss: 1.367, per_step_time: 1473ms, lr: 1.9181538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:07,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.43096 samples/s/p 6:13:24 } +2024-07-25 18:54:10,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1042/ 1625], loss: 1.212, per_step_time: 1473ms, lr: 1.921846e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:54:10,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.43099 samples/s/p 6:13:21 } +2024-07-25 18:54:13,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1044/ 1625], loss: 1.122, per_step_time: 1473ms, lr: 1.9255383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:13,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.42794 samples/s/p 6:13:31 } +2024-07-25 18:54:16,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1046/ 1625], loss: 1.060, per_step_time: 1473ms, lr: 1.9292307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:16,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.42873 samples/s/p 6:13:25 } +2024-07-25 18:54:19,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1048/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.9329229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:19,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.43652 samples/s/p 6:12:50 } +2024-07-25 18:54:22,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1050/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 1.9366153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:22,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.43675 samples/s/p 6:12:46 } +2024-07-25 18:54:25,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1052/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.9403076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:25,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.43539 samples/s/p 6:12:48 } +2024-07-25 18:54:27,969 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1054/ 1625], loss: 1.456, per_step_time: 1473ms, lr: 1.944e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:27,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.43068 samples/s/p 6:13:05 } +2024-07-25 18:54:30,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1056/ 1625], loss: 0.973, per_step_time: 1474ms, lr: 1.9476924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:30,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.42676 samples/s/p 6:13:18 } +2024-07-25 18:54:33,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1058/ 1625], loss: 1.146, per_step_time: 1469ms, lr: 1.9513845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:33,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.44241 samples/s/p 6:12:11 } +2024-07-25 18:54:36,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1060/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 1.9550767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.44091 samples/s/p 6:12:14 } +2024-07-25 18:54:39,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1062/ 1625], loss: 1.185, per_step_time: 1474ms, lr: 1.9587691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:39,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.42647 samples/s/p 6:13:11 } +2024-07-25 18:54:42,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1064/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 1.9624615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:42,726 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.43554 samples/s/p 6:12:30 } +2024-07-25 18:54:45,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1066/ 1625], loss: 1.312, per_step_time: 1470ms, lr: 1.9661538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:45,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43946 samples/s/p 6:12:11 } +2024-07-25 18:54:48,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1068/ 1625], loss: 1.103, per_step_time: 1473ms, lr: 1.969846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:48,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.42902 samples/s/p 6:12:51 } +2024-07-25 18:54:51,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1070/ 1625], loss: 1.237, per_step_time: 1470ms, lr: 1.9735384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:51,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.44174 samples/s/p 6:11:56 } +2024-07-25 18:54:54,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1072/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 1.9772307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:54,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43460 samples/s/p 6:12:22 } +2024-07-25 18:54:57,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1074/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.9809231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:57,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43694 samples/s/p 6:12:10 } +2024-07-25 18:55:00,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1076/ 1625], loss: 1.013, per_step_time: 1471ms, lr: 1.9846153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:00,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43697 samples/s/p 6:12:07 } +2024-07-25 18:55:03,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1078/ 1625], loss: 1.176, per_step_time: 1472ms, lr: 1.9883075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:03,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43266 samples/s/p 6:12:21 } +2024-07-25 18:55:06,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1080/ 1625], loss: 1.101, per_step_time: 1472ms, lr: 1.9919999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:06,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43369 samples/s/p 6:12:14 } +2024-07-25 18:55:09,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1082/ 1625], loss: 1.403, per_step_time: 1472ms, lr: 1.9956922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:09,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43278 samples/s/p 6:12:15 } +2024-07-25 18:55:12,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1084/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 1.9993846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:12,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43357 samples/s/p 6:12:09 } +2024-07-25 18:55:15,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1086/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 2.0030768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:15,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.42902 
samples/s/p 6:12:25 } +2024-07-25 18:55:18,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1088/ 1625], loss: 1.225, per_step_time: 1474ms, lr: 2.0067691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:18,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.42579 samples/s/p 6:12:35 } +2024-07-25 18:55:21,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1090/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.0104615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:21,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43137 samples/s/p 6:12:09 } +2024-07-25 18:55:24,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1092/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 2.0141539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:24,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43815 samples/s/p 6:11:38 } +2024-07-25 18:55:27,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1094/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 2.017846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:27,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43033 samples/s/p 6:12:07 } +2024-07-25 18:55:29,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1096/ 1625], loss: 1.179, per_step_time: 1474ms, lr: 2.0215382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:29,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.42622 samples/s/p 6:12:21 } +2024-07-25 18:55:32,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1098/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.0252306e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:55:32,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43681 samples/s/p 6:11:35 } +2024-07-25 18:55:35,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1100/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 2.028923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:35,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43306 samples/s/p 6:11:47 } +2024-07-25 18:55:38,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1102/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 2.0326153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:38,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43550 samples/s/p 6:11:34 } +2024-07-25 18:55:41,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1104/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 2.0363077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:41,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.44091 samples/s/p 6:11:09 } +2024-07-25 18:55:44,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1106/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 2.0399999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:44,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43392 samples/s/p 6:11:35 } +2024-07-25 18:55:47,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1108/ 1625], loss: 1.259, per_step_time: 1477ms, lr: 2.0436923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:47,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.41541 samples/s/p 6:12:48 } +2024-07-25 18:55:50,626 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1110/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 2.0473844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:50,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43289 samples/s/p 6:11:33 } +2024-07-25 18:55:53,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1112/ 1625], loss: 1.234, per_step_time: 1473ms, lr: 2.0510768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:53,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43061 samples/s/p 6:11:40 } +2024-07-25 18:55:56,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1114/ 1625], loss: 1.048, per_step_time: 1473ms, lr: 2.0547692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:56,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.42799 samples/s/p 6:11:48 } +2024-07-25 18:55:59,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1116/ 1625], loss: 1.025, per_step_time: 1472ms, lr: 2.0584614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:59,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.43378 samples/s/p 6:11:21 } +2024-07-25 18:56:02,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1118/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.0621537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:02,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.43404 samples/s/p 6:11:17 } +2024-07-25 18:56:05,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1120/ 1625], loss: 1.177, per_step_time: 1474ms, lr: 2.0658461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:05,394 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.42566 samples/s/p 6:11:48 } +2024-07-25 18:56:08,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1122/ 1625], loss: 1.272, per_step_time: 1475ms, lr: 2.0695385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:08,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.42126 samples/s/p 6:12:03 } +2024-07-25 18:56:11,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1124/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.0732308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:11,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.43761 samples/s/p 6:10:53 } +2024-07-25 18:56:14,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1126/ 1625], loss: 1.313, per_step_time: 1471ms, lr: 2.0769228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:14,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.43636 samples/s/p 6:10:56 } +2024-07-25 18:56:17,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1128/ 1625], loss: 1.227, per_step_time: 1473ms, lr: 2.0806152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:17,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.42988 samples/s/p 6:11:19 } +2024-07-25 18:56:20,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1130/ 1625], loss: 1.084, per_step_time: 1470ms, lr: 2.0843076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:20,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43858 samples/s/p 6:10:41 } +2024-07-25 18:56:23,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1132/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 2.088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:23,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43649 samples/s/p 6:10:46 } +2024-07-25 18:56:26,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1134/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.0916923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:26,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43506 samples/s/p 6:10:49 } +2024-07-25 18:56:29,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1136/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 2.0953845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:29,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43241 samples/s/p 6:10:57 } +2024-07-25 18:56:31,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1138/ 1625], loss: 1.278, per_step_time: 1473ms, lr: 2.0990768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:31,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43077 samples/s/p 6:11:01 } +2024-07-25 18:56:34,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1140/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 2.1027692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:34,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43589 samples/s/p 6:10:37 } +2024-07-25 18:56:37,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1142/ 1625], loss: 1.185, per_step_time: 1474ms, lr: 2.1064616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:37,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.42733 samples/s/p 
6:11:09 } +2024-07-25 18:56:40,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1144/ 1625], loss: 1.341, per_step_time: 1473ms, lr: 2.1101538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:40,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.42825 samples/s/p 6:11:02 } +2024-07-25 18:56:43,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1146/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 2.113846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:43,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43420 samples/s/p 6:10:35 } +2024-07-25 18:56:46,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1148/ 1625], loss: 1.299, per_step_time: 1473ms, lr: 2.1175383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:46,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43050 samples/s/p 6:10:47 } +2024-07-25 18:56:49,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1150/ 1625], loss: 1.231, per_step_time: 1473ms, lr: 2.1212307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:49,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.42794 samples/s/p 6:10:55 } +2024-07-25 18:56:52,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1152/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.124923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:52,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43297 samples/s/p 6:10:31 } +2024-07-25 18:56:55,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1154/ 1625], loss: 0.892, per_step_time: 1471ms, lr: 2.1286154e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 18:56:55,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43817 samples/s/p 6:10:07 } +2024-07-25 18:56:58,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1156/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 2.1323076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:58,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43525 samples/s/p 6:10:16 } +2024-07-25 18:57:01,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1158/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:01,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43148 samples/s/p 6:10:28 } +2024-07-25 18:57:04,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1160/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 2.1396922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:04,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43388 samples/s/p 6:10:16 } +2024-07-25 18:57:07,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1162/ 1625], loss: 1.084, per_step_time: 1469ms, lr: 2.1433845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:07,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.44414 samples/s/p 6:09:31 } +2024-07-25 18:57:10,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1164/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 2.1470767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:10,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43705 samples/s/p 6:09:57 } +2024-07-25 18:57:13,287 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1166/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.150769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:13,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43267 samples/s/p 6:10:12 } +2024-07-25 18:57:16,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1168/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 2.1544614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:16,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43547 samples/s/p 6:09:57 } +2024-07-25 18:57:19,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1170/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.1581538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:19,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43603 samples/s/p 6:09:52 } +2024-07-25 18:57:22,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1172/ 1625], loss: 1.240, per_step_time: 1476ms, lr: 2.1618462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:22,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.41736 samples/s/p 6:11:06 } +2024-07-25 18:57:25,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1174/ 1625], loss: 1.450, per_step_time: 1470ms, lr: 2.1655384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:25,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43950 samples/s/p 6:09:32 } +2024-07-25 18:57:28,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1176/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 2.1692307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:28,052 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43144 samples/s/p 6:10:02 } +2024-07-25 18:57:31,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1178/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 2.1729229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:31,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43590 samples/s/p 6:09:41 } +2024-07-25 18:57:33,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1180/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 2.1766153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:33,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.43289 samples/s/p 6:09:50 } +2024-07-25 18:57:36,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1182/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.1803076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:36,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.43819 samples/s/p 6:09:26 } +2024-07-25 18:57:39,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1184/ 1625], loss: 1.212, per_step_time: 1473ms, lr: 2.1839998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:39,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.42939 samples/s/p 6:09:59 } +2024-07-25 18:57:42,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1186/ 1625], loss: 1.256, per_step_time: 1473ms, lr: 2.1876922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:42,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.43055 samples/s/p 6:09:51 } +2024-07-25 18:57:45,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1188/ 1625], loss: 1.028, per_step_time: 1475ms, lr: 2.1913846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:45,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.42267 samples/s/p 6:10:20 } +2024-07-25 18:57:48,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1190/ 1625], loss: 1.326, per_step_time: 1470ms, lr: 2.195077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:48,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.44107 samples/s/p 6:09:02 } +2024-07-25 18:57:51,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1192/ 1625], loss: 1.019, per_step_time: 1474ms, lr: 2.1987693e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:51,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.42576 samples/s/p 6:10:02 } +2024-07-25 18:57:54,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1194/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 2.2024613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:54,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.43394 samples/s/p 6:09:25 } +2024-07-25 18:57:57,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1196/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 2.2061537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:57,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43777 samples/s/p 6:09:07 } +2024-07-25 18:58:00,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1198/ 1625], loss: 0.908, per_step_time: 1471ms, lr: 2.209846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:00,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43784 
samples/s/p 6:09:04 } +2024-07-25 18:58:03,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1200/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 2.2135384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:03,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43619 samples/s/p 6:09:07 } +2024-07-25 18:58:06,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1202/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 2.2172308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:06,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43145 samples/s/p 6:09:24 } +2024-07-25 18:58:09,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1204/ 1625], loss: 0.968, per_step_time: 1473ms, lr: 2.220923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:09,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.42964 samples/s/p 6:09:28 } +2024-07-25 18:58:12,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1206/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 2.2246153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:12,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43567 samples/s/p 6:09:01 } +2024-07-25 18:58:15,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1208/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.2283077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:15,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43243 samples/s/p 6:09:11 } +2024-07-25 18:58:18,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1210/ 1625], loss: 1.284, per_step_time: 1471ms, lr: 2.2319999e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:58:18,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43531 samples/s/p 6:08:56 } +2024-07-25 18:58:21,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1212/ 1625], loss: 1.206, per_step_time: 1469ms, lr: 2.2356922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:21,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.44237 samples/s/p 6:08:25 } +2024-07-25 18:58:24,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1214/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 2.2393844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:24,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43322 samples/s/p 6:08:59 } +2024-07-25 18:58:27,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1216/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 2.2430768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:27,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43910 samples/s/p 6:08:32 } +2024-07-25 18:58:30,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1218/ 1625], loss: 1.323, per_step_time: 1472ms, lr: 2.2467691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:30,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43356 samples/s/p 6:08:52 } +2024-07-25 18:58:32,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1220/ 1625], loss: 1.208, per_step_time: 1470ms, lr: 2.2504615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:32,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43990 samples/s/p 6:08:23 } +2024-07-25 18:58:35,936 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1222/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 2.2541539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:35,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43377 samples/s/p 6:08:45 } +2024-07-25 18:58:38,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1224/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 2.257846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:38,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43033 samples/s/p 6:08:56 } +2024-07-25 18:58:41,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1226/ 1625], loss: 1.000, per_step_time: 1471ms, lr: 2.2615384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:41,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43623 samples/s/p 6:08:29 } +2024-07-25 18:58:44,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1228/ 1625], loss: 0.934, per_step_time: 1471ms, lr: 2.2652306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:44,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43640 samples/s/p 6:08:25 } +2024-07-25 18:58:47,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1230/ 1625], loss: 1.198, per_step_time: 1474ms, lr: 2.268923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:47,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.42584 samples/s/p 6:09:05 } +2024-07-25 18:58:50,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1232/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 2.2726152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:50,698 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43360 samples/s/p 6:08:31 } +2024-07-25 18:58:53,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1234/ 1625], loss: 1.409, per_step_time: 1471ms, lr: 2.2763075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:53,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43504 samples/s/p 6:08:22 } +2024-07-25 18:58:56,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1236/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.2799999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:56,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43808 samples/s/p 6:08:07 } +2024-07-25 18:58:59,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1238/ 1625], loss: 1.015, per_step_time: 1471ms, lr: 2.2836923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:59,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43598 samples/s/p 6:08:12 } +2024-07-25 18:59:02,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1240/ 1625], loss: 1.335, per_step_time: 1471ms, lr: 2.2873846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:02,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43822 samples/s/p 6:08:00 } +2024-07-25 18:59:05,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1242/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.2910768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:05,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43630 samples/s/p 6:08:05 } +2024-07-25 18:59:08,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1244/ 1625], loss: 1.240, per_step_time: 1470ms, lr: 2.294769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:08,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.44108 samples/s/p 6:07:43 } +2024-07-25 18:59:11,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1246/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.2984614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:11,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.42916 samples/s/p 6:08:28 } +2024-07-25 18:59:14,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1248/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 2.3021537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:14,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43402 samples/s/p 6:08:06 } +2024-07-25 18:59:17,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1250/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.3058461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:17,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43553 samples/s/p 6:07:56 } +2024-07-25 18:59:20,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1252/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.3095383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:20,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43290 samples/s/p 6:08:04 } +2024-07-25 18:59:23,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1254/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 2.3132307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:23,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43653 
samples/s/p 6:07:47 } +2024-07-25 18:59:26,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1256/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 2.316923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:26,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43198 samples/s/p 6:08:02 } +2024-07-25 18:59:29,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1258/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.3206154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:29,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43553 samples/s/p 6:07:45 } +2024-07-25 18:59:32,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1260/ 1625], loss: 1.298, per_step_time: 1474ms, lr: 2.3243078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:32,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.42557 samples/s/p 6:08:22 } +2024-07-25 18:59:34,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1262/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.3279998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:34,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43085 samples/s/p 6:07:58 } +2024-07-25 18:59:37,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1264/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.3316921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:37,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43623 samples/s/p 6:07:33 } +2024-07-25 18:59:40,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1266/ 1625], loss: 1.196, per_step_time: 1470ms, lr: 2.3353845e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:59:40,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43925 samples/s/p 6:07:18 } +2024-07-25 18:59:43,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1268/ 1625], loss: 1.083, per_step_time: 1470ms, lr: 2.3390769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:43,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.44124 samples/s/p 6:07:07 } +2024-07-25 18:59:46,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1270/ 1625], loss: 1.068, per_step_time: 1472ms, lr: 2.3427692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:46,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43391 samples/s/p 6:07:34 } +2024-07-25 18:59:49,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1272/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.3464614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:49,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43601 samples/s/p 6:07:22 } +2024-07-25 18:59:52,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1274/ 1625], loss: 1.147, per_step_time: 1473ms, lr: 2.3501538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:52,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43094 samples/s/p 6:07:40 } +2024-07-25 18:59:55,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1276/ 1625], loss: 1.259, per_step_time: 1475ms, lr: 2.3538461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:55,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.42240 samples/s/p 6:08:12 } +2024-07-25 18:59:58,576 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1278/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 2.3575383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:58,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.44106 samples/s/p 6:06:53 } +2024-07-25 19:00:01,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1280/ 1625], loss: 1.207, per_step_time: 1470ms, lr: 2.3612307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:01,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.44038 samples/s/p 6:06:53 } +2024-07-25 19:00:04,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1282/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 2.3649229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:04,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.43216 samples/s/p 6:07:23 } +2024-07-25 19:00:07,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1284/ 1625], loss: 0.973, per_step_time: 1470ms, lr: 2.3686152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:07,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.43865 samples/s/p 6:06:54 } +2024-07-25 19:00:10,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1286/ 1625], loss: 0.877, per_step_time: 1471ms, lr: 2.3723076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:10,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.43592 samples/s/p 6:07:02 } +2024-07-25 19:00:13,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1288/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 2.376e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:13,327 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.43573 samples/s/p 6:07:00 } +2024-07-25 19:00:16,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1290/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.3796923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:16,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.43134 samples/s/p 6:07:15 } +2024-07-25 19:00:19,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1292/ 1625], loss: 1.250, per_step_time: 1473ms, lr: 2.3833845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:19,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.43038 samples/s/p 6:07:16 } +2024-07-25 19:00:22,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1294/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 2.3870767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:22,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.43165 samples/s/p 6:07:07 } +2024-07-25 19:00:25,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1296/ 1625], loss: 1.267, per_step_time: 1470ms, lr: 2.390769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:25,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.43856 samples/s/p 6:06:37 } +2024-07-25 19:00:28,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1298/ 1625], loss: 1.293, per_step_time: 1471ms, lr: 2.3944614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:28,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.43708 samples/s/p 6:06:40 } +2024-07-25 19:00:31,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1300/ 1625], loss: 1.028, per_step_time: 1469ms, lr: 2.3981538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:31,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.44528 samples/s/p 6:06:03 } +2024-07-25 19:00:33,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1302/ 1625], loss: 1.347, per_step_time: 1472ms, lr: 2.401846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:33,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.43197 samples/s/p 6:06:54 } +2024-07-25 19:00:36,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1304/ 1625], loss: 1.201, per_step_time: 1474ms, lr: 2.4055384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:36,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.42451 samples/s/p 6:07:22 } +2024-07-25 19:00:39,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1306/ 1625], loss: 1.377, per_step_time: 1472ms, lr: 2.4092307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:39,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.43113 samples/s/p 6:06:52 } +2024-07-25 19:00:42,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1308/ 1625], loss: 0.997, per_step_time: 1471ms, lr: 2.4129231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:42,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.43708 samples/s/p 6:06:25 } +2024-07-25 19:00:45,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1310/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 2.4166153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:45,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.42929 
samples/s/p 6:06:53 } +2024-07-25 19:00:48,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1312/ 1625], loss: 1.032, per_step_time: 1470ms, lr: 2.4203075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:48,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.44181 samples/s/p 6:06:00 } +2024-07-25 19:00:51,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1314/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 2.4239998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:51,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.44201 samples/s/p 6:05:56 } +2024-07-25 19:00:54,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1316/ 1625], loss: 1.249, per_step_time: 1471ms, lr: 2.4276922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:54,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.43574 samples/s/p 6:06:18 } +2024-07-25 19:00:57,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1318/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 2.4313846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:57,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.43221 samples/s/p 6:06:30 } +2024-07-25 19:01:00,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1320/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 2.4350767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:00,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.43489 samples/s/p 6:06:16 } +2024-07-25 19:01:03,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1322/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 2.4387691e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 19:01:03,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.43411 samples/s/p 6:06:16 } +2024-07-25 19:01:06,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1324/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 2.4424615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:06,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.43180 samples/s/p 6:06:23 } +2024-07-25 19:01:09,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1326/ 1625], loss: 1.435, per_step_time: 1472ms, lr: 2.4461538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:09,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43230 samples/s/p 6:06:18 } +2024-07-25 19:01:12,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1328/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 2.449846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:12,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43521 samples/s/p 6:06:03 } +2024-07-25 19:01:15,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1330/ 1625], loss: 1.146, per_step_time: 1470ms, lr: 2.4535382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:15,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.44175 samples/s/p 6:05:34 } +2024-07-25 19:01:18,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1332/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.4572306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:18,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43766 samples/s/p 6:05:47 } +2024-07-25 19:01:21,204 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1334/ 1625], loss: 1.334, per_step_time: 1472ms, lr: 2.460923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:21,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43359 samples/s/p 6:06:01 } +2024-07-25 19:01:24,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1336/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.4646153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:24,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43672 samples/s/p 6:05:45 } +2024-07-25 19:01:27,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1338/ 1625], loss: 1.316, per_step_time: 1470ms, lr: 2.4683077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:27,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.44151 samples/s/p 6:05:23 } +2024-07-25 19:01:30,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1340/ 1625], loss: 1.336, per_step_time: 1472ms, lr: 2.4719999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:30,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43418 samples/s/p 6:05:49 } +2024-07-25 19:01:33,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1342/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 2.4756922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:33,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43517 samples/s/p 6:05:43 } +2024-07-25 19:01:35,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1344/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 2.4793844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:35,957 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43273 samples/s/p 6:05:49 } +2024-07-25 19:01:38,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1346/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.4830768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:38,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43508 samples/s/p 6:05:37 } +2024-07-25 19:01:41,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1348/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 2.4867692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:41,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43411 samples/s/p 6:05:38 } +2024-07-25 19:01:44,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1350/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 2.4904613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:44,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43536 samples/s/p 6:05:30 } +2024-07-25 19:01:47,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1352/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.4941537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:47,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43462 samples/s/p 6:05:30 } +2024-07-25 19:01:50,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1354/ 1625], loss: 1.318, per_step_time: 1471ms, lr: 2.497846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:50,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43746 samples/s/p 6:05:16 } +2024-07-25 19:01:53,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 1356/ 1625], loss: 1.040, per_step_time: 1471ms, lr: 2.5015384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:53,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43543 samples/s/p 6:05:21 } +2024-07-25 19:01:56,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1358/ 1625], loss: 1.326, per_step_time: 1472ms, lr: 2.5052308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:56,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43368 samples/s/p 6:05:25 } +2024-07-25 19:01:59,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1360/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 2.508923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:59,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43417 samples/s/p 6:05:20 } +2024-07-25 19:02:02,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1362/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.5126152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:02,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43467 samples/s/p 6:05:15 } +2024-07-25 19:02:05,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1364/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.5163075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:05,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43814 samples/s/p 6:04:58 } +2024-07-25 19:02:08,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1366/ 1625], loss: 1.220, per_step_time: 1474ms, lr: 2.5199999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:08,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 
5.42714 samples/s/p 6:05:40 } +2024-07-25 19:02:11,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1368/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.5236923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:11,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43447 samples/s/p 6:05:07 } +2024-07-25 19:02:14,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1370/ 1625], loss: 1.032, per_step_time: 1470ms, lr: 2.5273845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:14,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43866 samples/s/p 6:04:47 } +2024-07-25 19:02:17,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1372/ 1625], loss: 1.337, per_step_time: 1470ms, lr: 2.5310768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:17,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43865 samples/s/p 6:04:44 } +2024-07-25 19:02:20,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1374/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 2.5347692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:20,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.43319 samples/s/p 6:05:03 } +2024-07-25 19:02:23,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1376/ 1625], loss: 1.188, per_step_time: 1470ms, lr: 2.5384616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:23,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.43859 samples/s/p 6:04:39 } +2024-07-25 19:02:26,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1378/ 1625], loss: 1.107, per_step_time: 1473ms, lr: 2.5421536e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:26,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.42810 samples/s/p 6:05:18 } +2024-07-25 19:02:29,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1380/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.545846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:29,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.43527 samples/s/p 6:04:46 } +2024-07-25 19:02:32,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1382/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.5495383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:32,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.43423 samples/s/p 6:04:47 } +2024-07-25 19:02:34,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1384/ 1625], loss: 1.138, per_step_time: 1473ms, lr: 2.5532307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:34,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.42811 samples/s/p 6:05:09 } +2024-07-25 19:02:37,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1386/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 2.556923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:37,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.42934 samples/s/p 6:05:01 } +2024-07-25 19:02:40,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1388/ 1625], loss: 1.102, per_step_time: 1474ms, lr: 2.5606152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:40,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.42567 samples/s/p 6:05:13 } +2024-07-25 19:02:43,844 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1390/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 2.5643076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:43,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43740 samples/s/p 6:04:23 } +2024-07-25 19:02:46,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1392/ 1625], loss: 1.372, per_step_time: 1471ms, lr: 2.568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:46,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43528 samples/s/p 6:04:28 } +2024-07-25 19:02:49,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1394/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 2.5716923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:49,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43876 samples/s/p 6:04:12 } +2024-07-25 19:02:52,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1396/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 2.5753845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:52,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43830 samples/s/p 6:04:10 } +2024-07-25 19:02:55,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1398/ 1625], loss: 1.091, per_step_time: 1470ms, lr: 2.5790767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:55,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.44105 samples/s/p 6:03:56 } +2024-07-25 19:02:58,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1400/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.582769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:58,593 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43562 samples/s/p 6:04:15 } +2024-07-25 19:02:58,593 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-25 19:03:35,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1402/ 1625], loss: 1.293, per_step_time: 1475ms, lr: 2.5864614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:35,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.42265 samples/s/p 6:05:05 } +2024-07-25 19:03:38,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1404/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.5901538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:38,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43304 samples/s/p 6:04:20 } +2024-07-25 19:03:41,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1406/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 2.5938461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:41,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43579 samples/s/p 6:04:06 } +2024-07-25 19:03:44,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1408/ 1625], loss: 1.193, per_step_time: 1470ms, lr: 2.5975383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:44,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43882 samples/s/p 6:03:51 } +2024-07-25 19:03:47,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1410/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 2.6012307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:47,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43674 samples/s/p 6:03:56 
} +2024-07-25 19:03:50,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1412/ 1625], loss: 1.320, per_step_time: 1471ms, lr: 2.6049229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:50,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43603 samples/s/p 6:03:56 } +2024-07-25 19:03:53,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1414/ 1625], loss: 1.199, per_step_time: 1473ms, lr: 2.6086153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:53,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43005 samples/s/p 6:04:17 } +2024-07-25 19:03:56,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1416/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 2.6123076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:56,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43817 samples/s/p 6:03:42 } +2024-07-25 19:03:59,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1418/ 1625], loss: 1.287, per_step_time: 1473ms, lr: 2.6159998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:59,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43085 samples/s/p 6:04:08 } +2024-07-25 19:04:01,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1420/ 1625], loss: 1.193, per_step_time: 1473ms, lr: 2.6196922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:01,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.42911 samples/s/p 6:04:12 } +2024-07-25 19:04:04,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1422/ 1625], loss: 1.294, per_step_time: 1472ms, lr: 2.6233845e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:04:04,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.43437 samples/s/p 6:03:48 } +2024-07-25 19:04:07,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1424/ 1625], loss: 1.296, per_step_time: 1472ms, lr: 2.6270769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:07,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.43237 samples/s/p 6:03:53 } +2024-07-25 19:04:10,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1426/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 2.6307693e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:10,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.42939 samples/s/p 6:04:02 } +2024-07-25 19:04:13,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1428/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 2.6344613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:13,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.43877 samples/s/p 6:03:21 } +2024-07-25 19:04:16,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1430/ 1625], loss: 1.287, per_step_time: 1470ms, lr: 2.6381536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:16,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.44210 samples/s/p 6:03:05 } +2024-07-25 19:04:19,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1432/ 1625], loss: 1.201, per_step_time: 1470ms, lr: 2.641846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:19,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.44195 samples/s/p 6:03:03 } +2024-07-25 19:04:22,639 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 1/ 10], step:[ 1434/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.6455384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:22,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.43138 samples/s/p 6:03:42 } +2024-07-25 19:04:25,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1436/ 1625], loss: 1.027, per_step_time: 1470ms, lr: 2.6492307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:25,589 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.44072 samples/s/p 6:03:02 } +2024-07-25 19:04:28,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1438/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 2.652923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:28,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.44145 samples/s/p 6:02:56 } +2024-07-25 19:04:31,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1440/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 2.6566153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:31,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43443 samples/s/p 6:03:21 } +2024-07-25 19:04:34,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1442/ 1625], loss: 1.485, per_step_time: 1471ms, lr: 2.6603077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:34,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43672 samples/s/p 6:03:09 } +2024-07-25 19:04:37,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1444/ 1625], loss: 1.317, per_step_time: 1472ms, lr: 2.664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:37,390 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 8.9% |████ | 5.43270 samples/s/p 6:03:22 } +2024-07-25 19:04:40,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1446/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 2.6676922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:40,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43177 samples/s/p 6:03:23 } +2024-07-25 19:04:43,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1448/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.6713844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:43,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43360 samples/s/p 6:03:13 } +2024-07-25 19:04:46,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1450/ 1625], loss: 1.250, per_step_time: 1471ms, lr: 2.6750768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:46,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43805 samples/s/p 6:02:52 } +2024-07-25 19:04:49,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1452/ 1625], loss: 1.091, per_step_time: 1473ms, lr: 2.6787691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:49,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.42993 samples/s/p 6:03:22 } +2024-07-25 19:04:52,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1454/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 2.6824615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:52,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43370 samples/s/p 6:03:04 } +2024-07-25 19:04:55,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1456/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 
2.6861537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:55,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43251 samples/s/p 6:03:05 } +2024-07-25 19:04:58,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1458/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 2.689846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:58,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43071 samples/s/p 6:03:10 } +2024-07-25 19:05:01,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1460/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.6935384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:01,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43753 samples/s/p 6:02:39 } +2024-07-25 19:05:03,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1462/ 1625], loss: 1.251, per_step_time: 1470ms, lr: 2.6972306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:03,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.44126 samples/s/p 6:02:22 } +2024-07-25 19:05:06,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1464/ 1625], loss: 1.139, per_step_time: 1470ms, lr: 2.700923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:06,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.44149 samples/s/p 6:02:18 } +2024-07-25 19:05:09,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1466/ 1625], loss: 1.238, per_step_time: 1470ms, lr: 2.7046151e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:09,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43925 samples/s/p 6:02:24 } +2024-07-25 19:05:12,800 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1468/ 1625], loss: 1.059, per_step_time: 1472ms, lr: 2.7083075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:12,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43323 samples/s/p 6:02:45 } +2024-07-25 19:05:15,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1470/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 2.7119999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:15,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43578 samples/s/p 6:02:32 } +2024-07-25 19:05:18,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1472/ 1625], loss: 1.116, per_step_time: 1473ms, lr: 2.7156922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:18,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.42988 samples/s/p 6:02:52 } +2024-07-25 19:05:21,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1474/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 2.7193846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:21,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.43152 samples/s/p 6:02:43 } +2024-07-25 19:05:24,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1476/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 2.7230768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:24,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.43827 samples/s/p 6:02:13 } +2024-07-25 19:05:27,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1478/ 1625], loss: 1.244, per_step_time: 1474ms, lr: 2.7267692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:27,564 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.42543 samples/s/p 6:03:01 } +2024-07-25 19:05:30,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1480/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.7304613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:30,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.43508 samples/s/p 6:02:20 } +2024-07-25 19:05:33,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1482/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 2.7341537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:33,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.43420 samples/s/p 6:02:20 } +2024-07-25 19:05:36,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1484/ 1625], loss: 1.093, per_step_time: 1473ms, lr: 2.737846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:36,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.42920 samples/s/p 6:02:37 } +2024-07-25 19:05:39,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1486/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 2.7415383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:39,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.42897 samples/s/p 6:02:35 } +2024-07-25 19:05:42,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1488/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 2.7452306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:42,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43346 samples/s/p 6:02:14 } +2024-07-25 19:05:45,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 1490/ 1625], loss: 1.343, per_step_time: 1471ms, lr: 2.748923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:45,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43569 samples/s/p 6:02:03 } +2024-07-25 19:05:48,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1492/ 1625], loss: 1.239, per_step_time: 1472ms, lr: 2.7526154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:48,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43285 samples/s/p 6:02:11 } +2024-07-25 19:05:51,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1494/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.7563077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:51,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43435 samples/s/p 6:02:02 } +2024-07-25 19:05:54,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1496/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 2.7599997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:54,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43426 samples/s/p 6:01:59 } +2024-07-25 19:05:57,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1498/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.7636921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:57,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43266 samples/s/p 6:02:03 } +2024-07-25 19:06:00,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1500/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 2.7673845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:00,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 
5.43381 samples/s/p 6:01:55 } +2024-07-25 19:06:02,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1502/ 1625], loss: 1.313, per_step_time: 1472ms, lr: 2.7710768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:02,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43302 samples/s/p 6:01:56 } +2024-07-25 19:06:05,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1504/ 1625], loss: 1.168, per_step_time: 1474ms, lr: 2.7747692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:05,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.42624 samples/s/p 6:02:20 } +2024-07-25 19:06:08,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1506/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 2.7784614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:08,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43762 samples/s/p 6:01:31 } +2024-07-25 19:06:11,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1508/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 2.7821538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:11,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43422 samples/s/p 6:01:42 } +2024-07-25 19:06:14,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1510/ 1625], loss: 1.420, per_step_time: 1473ms, lr: 2.7858461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:14,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43075 samples/s/p 6:01:53 } +2024-07-25 19:06:17,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1512/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.7895383e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:17,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43396 samples/s/p 6:01:37 } +2024-07-25 19:06:20,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1514/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.7932307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:20,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43432 samples/s/p 6:01:33 } +2024-07-25 19:06:23,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1516/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 2.7969229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:23,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.42859 samples/s/p 6:01:53 } +2024-07-25 19:06:26,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1518/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.8006152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:26,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.44035 samples/s/p 6:01:03 } +2024-07-25 19:06:29,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1520/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.8043076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:29,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43408 samples/s/p 6:01:25 } +2024-07-25 19:06:32,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1522/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 2.808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:32,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43224 samples/s/p 6:01:29 } +2024-07-25 19:06:35,459 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1524/ 1625], loss: 1.341, per_step_time: 1472ms, lr: 2.8116921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:35,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43424 samples/s/p 6:01:18 } +2024-07-25 19:06:38,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1526/ 1625], loss: 1.165, per_step_time: 1474ms, lr: 2.8153845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:38,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.42712 samples/s/p 6:01:44 } +2024-07-25 19:06:41,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1528/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 2.8190769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:41,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43434 samples/s/p 6:01:12 } +2024-07-25 19:06:44,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1530/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 2.822769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:44,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43905 samples/s/p 6:00:50 } +2024-07-25 19:06:47,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1532/ 1625], loss: 1.023, per_step_time: 1473ms, lr: 2.8264614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:47,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43014 samples/s/p 6:01:23 } +2024-07-25 19:06:50,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1534/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.8301536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:50,220 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43652 samples/s/p 6:00:55 } +2024-07-25 19:06:53,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1536/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 2.833846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:53,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43983 samples/s/p 6:00:38 } +2024-07-25 19:06:56,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1538/ 1625], loss: 1.208, per_step_time: 1470ms, lr: 2.8375383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:56,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43848 samples/s/p 6:00:41 } +2024-07-25 19:06:59,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1540/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 2.8412307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:59,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43517 samples/s/p 6:00:51 } +2024-07-25 19:07:02,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1542/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.844923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:02,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43179 samples/s/p 6:01:02 } +2024-07-25 19:07:04,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1544/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.8486153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:04,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43235 samples/s/p 6:00:56 } +2024-07-25 19:07:07,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 1546/ 1625], loss: 0.967, per_step_time: 1475ms, lr: 2.8523074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:07,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.42331 samples/s/p 6:01:30 } +2024-07-25 19:07:10,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1548/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 2.8559998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:10,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43380 samples/s/p 6:00:45 } +2024-07-25 19:07:13,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1550/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 2.8596922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:13,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43077 samples/s/p 6:00:54 } +2024-07-25 19:07:16,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1552/ 1625], loss: 1.156, per_step_time: 1470ms, lr: 2.8633845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:16,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43848 samples/s/p 6:00:20 } +2024-07-25 19:07:19,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1554/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 2.8670767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:19,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43195 samples/s/p 6:00:43 } +2024-07-25 19:07:22,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1556/ 1625], loss: 1.209, per_step_time: 1473ms, lr: 2.8707691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:22,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 
5.42852 samples/s/p 6:00:54 } +2024-07-25 19:07:25,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1558/ 1625], loss: 1.307, per_step_time: 1472ms, lr: 2.8744615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:25,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43411 samples/s/p 6:00:29 } +2024-07-25 19:07:28,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1560/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.8781538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:28,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43649 samples/s/p 6:00:16 } +2024-07-25 19:07:31,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1562/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.8818462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:31,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43257 samples/s/p 6:00:29 } +2024-07-25 19:07:34,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1564/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 2.8855382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:34,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43590 samples/s/p 6:00:13 } +2024-07-25 19:07:37,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1566/ 1625], loss: 1.233, per_step_time: 1474ms, lr: 2.8892306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:37,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.42641 samples/s/p 6:00:48 } +2024-07-25 19:07:40,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1568/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 2.892923e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:40,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43175 samples/s/p 6:00:23 } +2024-07-25 19:07:43,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1570/ 1625], loss: 1.160, per_step_time: 1474ms, lr: 2.8966153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:43,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.42650 samples/s/p 6:00:41 } +2024-07-25 19:07:46,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1572/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 2.9003077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:46,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43133 samples/s/p 6:00:19 } +2024-07-25 19:07:49,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1574/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 2.9039998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:49,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43728 samples/s/p 5:59:53 } +2024-07-25 19:07:52,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1576/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.9076922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:52,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43322 samples/s/p 6:00:06 } +2024-07-25 19:07:55,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1578/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 2.9113846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:55,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43369 samples/s/p 6:00:01 } +2024-07-25 19:07:58,118 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1580/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 2.9150768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:58,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43960 samples/s/p 5:59:35 } +2024-07-25 19:08:01,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1582/ 1625], loss: 1.286, per_step_time: 1471ms, lr: 2.9187691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:01,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43735 samples/s/p 5:59:41 } +2024-07-25 19:08:04,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1584/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.9224613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:04,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43592 samples/s/p 5:59:43 } +2024-07-25 19:08:06,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1586/ 1625], loss: 1.325, per_step_time: 1471ms, lr: 2.9261537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:06,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43799 samples/s/p 5:59:32 } +2024-07-25 19:08:09,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1588/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 2.929846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:09,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43717 samples/s/p 5:59:32 } +2024-07-25 19:08:12,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1590/ 1625], loss: 1.431, per_step_time: 1471ms, lr: 2.9335384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:12,869 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43654 samples/s/p 5:59:32 } +2024-07-25 19:08:15,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1592/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 2.9372306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:15,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43280 samples/s/p 5:59:44 } +2024-07-25 19:08:18,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1594/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.940923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:18,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43515 samples/s/p 5:59:32 } +2024-07-25 19:08:21,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1596/ 1625], loss: 1.151, per_step_time: 1475ms, lr: 2.9446152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:21,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.42009 samples/s/p 6:00:29 } +2024-07-25 19:08:24,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1598/ 1625], loss: 1.191, per_step_time: 1469ms, lr: 2.9483075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:24,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.44283 samples/s/p 5:58:55 } +2024-07-25 19:08:27,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1600/ 1625], loss: 1.003, per_step_time: 1471ms, lr: 2.9519999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:27,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43762 samples/s/p 5:59:13 } +2024-07-25 19:08:30,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 1602/ 1625], loss: 1.086, per_step_time: 1473ms, lr: 2.955692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:30,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43058 samples/s/p 5:59:38 } +2024-07-25 19:08:33,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1604/ 1625], loss: 1.128, per_step_time: 1474ms, lr: 2.9593844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:33,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.42647 samples/s/p 5:59:51 } +2024-07-25 19:08:36,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1606/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 2.9630768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:36,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43524 samples/s/p 5:59:14 } +2024-07-25 19:08:39,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1608/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 2.9667692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:39,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43162 samples/s/p 5:59:25 } +2024-07-25 19:08:42,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1610/ 1625], loss: 1.243, per_step_time: 1474ms, lr: 2.9704615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:42,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.42415 samples/s/p 5:59:52 } +2024-07-25 19:08:45,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1612/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.9741537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:45,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 
5.43746 samples/s/p 5:58:56 } +2024-07-25 19:08:48,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1614/ 1625], loss: 1.043, per_step_time: 1472ms, lr: 2.9778459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:48,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43452 samples/s/p 5:59:05 } +2024-07-25 19:08:51,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1616/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 2.9815383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:51,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43113 samples/s/p 5:59:15 } +2024-07-25 19:08:54,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1618/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 2.9852306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:54,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.44123 samples/s/p 5:58:32 } +2024-07-25 19:08:57,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1620/ 1625], loss: 1.004, per_step_time: 1472ms, lr: 2.988923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:57,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.43194 samples/s/p 5:59:06 } +2024-07-25 19:09:00,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1622/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 2.9926152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:00,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.43690 samples/s/p 5:58:44 } +2024-07-25 19:09:03,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1624/ 1625], loss: 1.311, per_step_time: 1472ms, lr: 2.9963076e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:03,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.43405 samples/s/p 5:58:52 } +2024-07-25 19:09:06,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1/ 1625], loss: 1.243, per_step_time: 1478ms, lr: 3e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:06,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.41104 samples/s/p 6:00:20 } +2024-07-25 19:09:08,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 3/ 1625], loss: 1.219, per_step_time: 1470ms, lr: 2.9999997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:08,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.43966 samples/s/p 5:58:24 } +2024-07-25 19:09:11,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 5/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 2.9999994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:11,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.43443 samples/s/p 5:58:42 } +2024-07-25 19:09:14,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 7/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.9999987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:14,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.43297 samples/s/p 5:58:44 } +2024-07-25 19:09:17,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 9/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 2.999998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:17,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43529 samples/s/p 5:58:32 } +2024-07-25 19:09:20,777 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 11/ 1625], loss: 1.291, per_step_time: 1473ms, lr: 2.9999967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:20,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43074 samples/s/p 5:58:47 } +2024-07-25 19:09:23,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 13/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 2.9999952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:23,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43325 samples/s/p 5:58:34 } +2024-07-25 19:09:26,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 15/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.9999934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:26,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43531 samples/s/p 5:58:23 } +2024-07-25 19:09:29,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 17/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.9999912e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:29,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43472 samples/s/p 5:58:23 } +2024-07-25 19:09:32,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 19/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 2.999989e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:32,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43638 samples/s/p 5:58:13 } +2024-07-25 19:09:35,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 21/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 2.9999865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:35,537 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43454 samples/s/p 5:58:18 } +2024-07-25 19:09:38,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 23/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 2.9999837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:38,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43960 samples/s/p 5:57:55 } +2024-07-25 19:09:41,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 25/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.9999806e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:41,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43830 samples/s/p 5:57:57 } +2024-07-25 19:09:44,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 27/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.9999774e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:44,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43670 samples/s/p 5:58:00 } +2024-07-25 19:09:47,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 29/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 2.9999737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:47,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43766 samples/s/p 5:57:53 } +2024-07-25 19:09:50,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 31/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 2.99997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:50,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43760 samples/s/p 5:57:51 } +2024-07-25 19:09:53,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], 
step:[ 33/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.9999657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:53,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43487 samples/s/p 5:57:59 } +2024-07-25 19:09:56,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 35/ 1625], loss: 1.368, per_step_time: 1471ms, lr: 2.9999612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:56,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43845 samples/s/p 5:57:41 } +2024-07-25 19:09:59,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 37/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.9999566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:59,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43812 samples/s/p 5:57:40 } +2024-07-25 19:10:02,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 39/ 1625], loss: 1.130, per_step_time: 1470ms, lr: 2.9999517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:02,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.44184 samples/s/p 5:57:22 } +2024-07-25 19:10:05,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 41/ 1625], loss: 1.074, per_step_time: 1470ms, lr: 2.9999464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:05,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.43921 samples/s/p 5:57:30 } +2024-07-25 19:10:07,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 43/ 1625], loss: 1.150, per_step_time: 1472ms, lr: 2.9999408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:07,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 
5.43124 samples/s/p 5:57:58 } +2024-07-25 19:10:10,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 45/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 2.9999354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:10,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.44004 samples/s/p 5:57:21 } +2024-07-25 19:10:13,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 47/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.999929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:13,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.43516 samples/s/p 5:57:37 } +2024-07-25 19:10:16,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 49/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.9999228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:16,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.43614 samples/s/p 5:57:30 } +2024-07-25 19:10:19,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 51/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.9999163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:19,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.43642 samples/s/p 5:57:26 } +2024-07-25 19:10:22,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 53/ 1625], loss: 1.074, per_step_time: 1474ms, lr: 2.9999095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:22,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.42395 samples/s/p 5:58:12 } +2024-07-25 19:10:25,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 55/ 1625], loss: 1.008, per_step_time: 1469ms, lr: 2.9999024e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 19:10:25,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.44285 samples/s/p 5:56:55 } +2024-07-25 19:10:28,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 57/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 2.999895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:28,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43129 samples/s/p 5:57:37 } +2024-07-25 19:10:31,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 59/ 1625], loss: 1.166, per_step_time: 1470ms, lr: 2.9998875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:31,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43999 samples/s/p 5:57:00 } +2024-07-25 19:10:34,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 61/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 2.9998797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:34,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.42957 samples/s/p 5:57:38 } +2024-07-25 19:10:37,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 63/ 1625], loss: 1.290, per_step_time: 1472ms, lr: 2.9998713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:37,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43269 samples/s/p 5:57:23 } +2024-07-25 19:10:40,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 65/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 2.999863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:40,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.42817 samples/s/p 5:57:38 } +2024-07-25 19:10:43,404 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 67/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 2.9998542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:43,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43217 samples/s/p 5:57:19 } +2024-07-25 19:10:46,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 69/ 1625], loss: 1.280, per_step_time: 1473ms, lr: 2.9998453e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:46,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.42884 samples/s/p 5:57:29 } +2024-07-25 19:10:49,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 71/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.999836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:49,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43754 samples/s/p 5:56:52 } +2024-07-25 19:10:52,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 73/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.9998266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:52,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43533 samples/s/p 5:56:58 } +2024-07-25 19:10:55,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 75/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.9998168e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:55,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43838 samples/s/p 5:56:43 } +2024-07-25 19:10:58,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 77/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.9998067e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:58,159 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43593 samples/s/p 5:56:50 } +2024-07-25 19:11:01,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 79/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 2.9997964e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:01,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43684 samples/s/p 5:56:43 } +2024-07-25 19:11:04,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 81/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.9997858e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:04,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43411 samples/s/p 5:56:51 } +2024-07-25 19:11:07,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 83/ 1625], loss: 1.178, per_step_time: 1474ms, lr: 2.999775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:07,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.42673 samples/s/p 5:57:17 } +2024-07-25 19:11:09,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 85/ 1625], loss: 1.437, per_step_time: 1471ms, lr: 2.9997638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:09,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43782 samples/s/p 5:56:30 } +2024-07-25 19:11:12,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 87/ 1625], loss: 1.165, per_step_time: 1474ms, lr: 2.9997524e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:12,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.42701 samples/s/p 5:57:10 } +2024-07-25 19:11:15,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], 
step:[ 89/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.9997409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:15,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43726 samples/s/p 5:56:27 } +2024-07-25 19:11:18,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 91/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 2.9997289e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:18,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43447 samples/s/p 5:56:35 } +2024-07-25 19:11:21,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 93/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.9997167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:21,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43179 samples/s/p 5:56:42 } +2024-07-25 19:11:24,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 95/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 2.9997043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:24,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43352 samples/s/p 5:56:33 } +2024-07-25 19:11:27,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 97/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 2.9996916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:27,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43339 samples/s/p 5:56:30 } +2024-07-25 19:11:30,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 99/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.9996787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:30,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 
5.43222 samples/s/p 5:56:32 } +2024-07-25 19:11:33,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 101/ 1625], loss: 1.156, per_step_time: 1469ms, lr: 2.9996652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:33,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.44348 samples/s/p 5:55:45 } +2024-07-25 19:11:36,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 103/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 2.9996518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:36,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43172 samples/s/p 5:56:28 } +2024-07-25 19:11:39,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 105/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 2.9996381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:39,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43846 samples/s/p 5:55:58 } +2024-07-25 19:11:42,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 107/ 1625], loss: 1.100, per_step_time: 1474ms, lr: 2.9996241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:42,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.42394 samples/s/p 5:56:53 } +2024-07-25 19:11:45,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 109/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 2.9996096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:45,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43644 samples/s/p 5:56:01 } +2024-07-25 19:11:48,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 111/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 2.999595e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:48,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43666 samples/s/p 5:55:57 } +2024-07-25 19:11:51,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 113/ 1625], loss: 1.277, per_step_time: 1473ms, lr: 2.9995803e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:51,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43055 samples/s/p 5:56:18 } +2024-07-25 19:11:54,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 115/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 2.9995652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:54,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43663 samples/s/p 5:55:51 } +2024-07-25 19:11:57,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 117/ 1625], loss: 1.277, per_step_time: 1472ms, lr: 2.9995497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:57,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43350 samples/s/p 5:56:00 } +2024-07-25 19:12:00,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 119/ 1625], loss: 1.249, per_step_time: 1473ms, lr: 2.9995343e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:00,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43052 samples/s/p 5:56:09 } +2024-07-25 19:12:03,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 121/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 2.9995184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:03,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.42989 samples/s/p 5:56:09 } +2024-07-25 19:12:06,054 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 123/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 2.999502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:06,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43146 samples/s/p 5:55:59 } +2024-07-25 19:12:09,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 125/ 1625], loss: 0.999, per_step_time: 1470ms, lr: 2.9994857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:09,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.44070 samples/s/p 5:55:20 } +2024-07-25 19:12:11,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 127/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 2.9994688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:11,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43406 samples/s/p 5:55:43 } +2024-07-25 19:12:14,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 129/ 1625], loss: 1.293, per_step_time: 1473ms, lr: 2.999452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:14,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.42980 samples/s/p 5:55:57 } +2024-07-25 19:12:17,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 131/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.9994346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:17,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43832 samples/s/p 5:55:21 } +2024-07-25 19:12:20,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 133/ 1625], loss: 1.331, per_step_time: 1470ms, lr: 2.9994171e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:12:20,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43975 samples/s/p 5:55:12 } +2024-07-25 19:12:23,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 135/ 1625], loss: 1.199, per_step_time: 1473ms, lr: 2.9993993e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:23,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.42755 samples/s/p 5:55:57 } +2024-07-25 19:12:26,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 137/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 2.9993813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:26,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43340 samples/s/p 5:55:31 } +2024-07-25 19:12:29,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 139/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 2.9993627e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:29,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43296 samples/s/p 5:55:30 } +2024-07-25 19:12:32,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 141/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 2.9993444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:32,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43450 samples/s/p 5:55:21 } +2024-07-25 19:12:35,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 143/ 1625], loss: 1.100, per_step_time: 1473ms, lr: 2.9993254e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:35,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.42901 samples/s/p 5:55:40 } +2024-07-25 19:12:38,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 2/ 10], step:[ 145/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 2.9993065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:38,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43256 samples/s/p 5:55:23 } +2024-07-25 19:12:41,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 147/ 1625], loss: 1.284, per_step_time: 1469ms, lr: 2.9992867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:41,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.44333 samples/s/p 5:54:38 } +2024-07-25 19:12:44,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 149/ 1625], loss: 1.372, per_step_time: 1473ms, lr: 2.9992674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:44,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.42874 samples/s/p 5:55:32 } +2024-07-25 19:12:47,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 151/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 2.9992474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:47,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43629 samples/s/p 5:54:59 } +2024-07-25 19:12:50,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 153/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 2.9992269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:50,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43217 samples/s/p 5:55:13 } +2024-07-25 19:12:53,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 155/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 2.9992065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:53,281 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 11.0% |█████ | 5.43391 samples/s/p 5:55:03 } +2024-07-25 19:12:56,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 157/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 2.9991857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:56,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43184 samples/s/p 5:55:08 } +2024-07-25 19:12:59,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 159/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 2.9991646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:59,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43458 samples/s/p 5:54:54 } +2024-07-25 19:13:02,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 161/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.9991435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:02,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43586 samples/s/p 5:54:46 } +2024-07-25 19:13:05,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 163/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 2.9991223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:05,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43403 samples/s/p 5:54:51 } +2024-07-25 19:13:08,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 165/ 1625], loss: 1.290, per_step_time: 1472ms, lr: 2.9991003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:08,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43129 samples/s/p 5:54:58 } +2024-07-25 19:13:10,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 167/ 1625], loss: 1.218, per_step_time: 
1472ms, lr: 2.999078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:10,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43186 samples/s/p 5:54:53 } +2024-07-25 19:13:13,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 169/ 1625], loss: 1.446, per_step_time: 1470ms, lr: 2.9990559e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:13,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43870 samples/s/p 5:54:23 } +2024-07-25 19:13:16,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 171/ 1625], loss: 1.354, per_step_time: 1472ms, lr: 2.9990333e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:16,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.43252 samples/s/p 5:54:45 } +2024-07-25 19:13:19,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 173/ 1625], loss: 1.360, per_step_time: 1473ms, lr: 2.9990104e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:19,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.43022 samples/s/p 5:54:51 } +2024-07-25 19:13:22,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 175/ 1625], loss: 1.309, per_step_time: 1471ms, lr: 2.9989871e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:22,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.43527 samples/s/p 5:54:28 } +2024-07-25 19:13:25,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 177/ 1625], loss: 0.964, per_step_time: 1473ms, lr: 2.9989636e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:25,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.42839 samples/s/p 5:54:52 } +2024-07-25 
19:13:28,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 179/ 1625], loss: 1.317, per_step_time: 1473ms, lr: 2.99894e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:28,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.42821 samples/s/p 5:54:50 } +2024-07-25 19:13:31,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 181/ 1625], loss: 1.043, per_step_time: 1470ms, lr: 2.9989162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:31,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.43856 samples/s/p 5:54:06 } +2024-07-25 19:13:34,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 183/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 2.998892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:34,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.44067 samples/s/p 5:53:55 } +2024-07-25 19:13:37,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 185/ 1625], loss: 1.213, per_step_time: 1473ms, lr: 2.9988674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:37,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.43052 samples/s/p 5:54:32 } +2024-07-25 19:13:40,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 187/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.9988425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:40,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43599 samples/s/p 5:54:08 } +2024-07-25 19:13:43,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 189/ 1625], loss: 1.393, per_step_time: 1472ms, lr: 2.9988176e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:13:43,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43152 samples/s/p 5:54:22 } +2024-07-25 19:13:46,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 191/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.9987923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:46,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43130 samples/s/p 5:54:20 } +2024-07-25 19:13:49,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 193/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 2.9987668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:49,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43418 samples/s/p 5:54:06 } +2024-07-25 19:13:52,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 195/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.9987412e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:52,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43373 samples/s/p 5:54:05 } +2024-07-25 19:13:55,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 197/ 1625], loss: 1.166, per_step_time: 1469ms, lr: 2.998715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:55,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.44249 samples/s/p 5:53:27 } +2024-07-25 19:13:58,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 199/ 1625], loss: 1.143, per_step_time: 1473ms, lr: 2.9986886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:58,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43030 samples/s/p 5:54:12 } +2024-07-25 19:14:01,170 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 201/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 2.9986619e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:01,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43673 samples/s/p 5:53:44 } +2024-07-25 19:14:04,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 203/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.9986351e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:04,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43332 samples/s/p 5:53:54 } +2024-07-25 19:14:07,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 205/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 2.9986079e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:07,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43750 samples/s/p 5:53:35 } +2024-07-25 19:14:10,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 207/ 1625], loss: 1.261, per_step_time: 1473ms, lr: 2.9985804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:10,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.42743 samples/s/p 5:54:12 } +2024-07-25 19:14:12,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 209/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.9985527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:12,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43206 samples/s/p 5:53:50 } +2024-07-25 19:14:15,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 211/ 1625], loss: 1.136, per_step_time: 1474ms, lr: 2.9985247e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:14:15,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.42706 samples/s/p 5:54:07 } +2024-07-25 19:14:18,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 213/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 2.9984965e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:18,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43676 samples/s/p 5:53:26 } +2024-07-25 19:14:21,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 215/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 2.9984682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:21,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43459 samples/s/p 5:53:32 } +2024-07-25 19:14:24,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 217/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 2.9984394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:24,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43745 samples/s/p 5:53:18 } +2024-07-25 19:14:27,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 219/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.9984103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:27,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43133 samples/s/p 5:53:39 } +2024-07-25 19:14:30,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 221/ 1625], loss: 1.368, per_step_time: 1471ms, lr: 2.998381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:30,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43725 samples/s/p 5:53:13 } +2024-07-25 19:14:33,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 2/ 10], step:[ 223/ 1625], loss: 1.312, per_step_time: 1471ms, lr: 2.9983512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:33,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43517 samples/s/p 5:53:18 } +2024-07-25 19:14:36,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 225/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 2.9983215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:36,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43473 samples/s/p 5:53:16 } +2024-07-25 19:14:39,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 227/ 1625], loss: 1.310, per_step_time: 1472ms, lr: 2.9982915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:39,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43304 samples/s/p 5:53:20 } +2024-07-25 19:14:42,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 229/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 2.9982612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:42,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43852 samples/s/p 5:52:56 } +2024-07-25 19:14:45,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 231/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 2.9982306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:45,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.42937 samples/s/p 5:53:29 } +2024-07-25 19:14:48,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 233/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 2.9981999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:48,401 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 11.4% |█████ | 5.43368 samples/s/p 5:53:09 } +2024-07-25 19:14:51,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 235/ 1625], loss: 1.063, per_step_time: 1473ms, lr: 2.9981686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:51,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.42862 samples/s/p 5:53:26 } +2024-07-25 19:14:54,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 237/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 2.998137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:54,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.43598 samples/s/p 5:52:54 } +2024-07-25 19:14:57,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 239/ 1625], loss: 1.256, per_step_time: 1470ms, lr: 2.9981054e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:57,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.44079 samples/s/p 5:52:32 } +2024-07-25 19:15:00,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 241/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 2.9980733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:00,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.43787 samples/s/p 5:52:41 } +2024-07-25 19:15:03,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 243/ 1625], loss: 1.040, per_step_time: 1473ms, lr: 2.9980412e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:03,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.42757 samples/s/p 5:53:18 } +2024-07-25 19:15:06,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 245/ 1625], loss: 1.279, per_step_time: 1474ms, 
lr: 2.9980087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:06,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.42718 samples/s/p 5:53:17 } +2024-07-25 19:15:09,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 247/ 1625], loss: 1.204, per_step_time: 1474ms, lr: 2.997976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:09,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.42704 samples/s/p 5:53:14 } +2024-07-25 19:15:12,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 249/ 1625], loss: 1.375, per_step_time: 1471ms, lr: 2.9979428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:12,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.43482 samples/s/p 5:52:41 } +2024-07-25 19:15:14,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 251/ 1625], loss: 1.068, per_step_time: 1472ms, lr: 2.9979094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:14,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.43426 samples/s/p 5:52:40 } +2024-07-25 19:15:17,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 253/ 1625], loss: 1.250, per_step_time: 1470ms, lr: 2.9978759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:17,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43997 samples/s/p 5:52:15 } +2024-07-25 19:15:20,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 255/ 1625], loss: 1.137, per_step_time: 1469ms, lr: 2.997842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:20,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.44232 samples/s/p 5:52:03 } +2024-07-25 
19:15:23,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 257/ 1625], loss: 1.338, per_step_time: 1472ms, lr: 2.9978082e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:23,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43441 samples/s/p 5:52:31 } +2024-07-25 19:15:26,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 259/ 1625], loss: 0.979, per_step_time: 1471ms, lr: 2.9977735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:26,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43807 samples/s/p 5:52:13 } +2024-07-25 19:15:29,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 261/ 1625], loss: 1.060, per_step_time: 1470ms, lr: 2.997739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:29,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43951 samples/s/p 5:52:05 } +2024-07-25 19:15:32,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 263/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 2.997704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:32,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43973 samples/s/p 5:52:01 } +2024-07-25 19:15:35,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 265/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.9976689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:35,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43635 samples/s/p 5:52:11 } +2024-07-25 19:15:38,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 267/ 1625], loss: 1.371, per_step_time: 1471ms, lr: 2.9976336e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:15:38,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43681 samples/s/p 5:52:07 } +2024-07-25 19:15:41,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 269/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 2.9975978e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:41,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43269 samples/s/p 5:52:20 } +2024-07-25 19:15:44,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 271/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 2.9975616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:44,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43879 samples/s/p 5:51:53 } +2024-07-25 19:15:47,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 273/ 1625], loss: 1.109, per_step_time: 1471ms, lr: 2.9975256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:47,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43656 samples/s/p 5:51:59 } +2024-07-25 19:15:50,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 275/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 2.997489e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:50,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43441 samples/s/p 5:52:04 } +2024-07-25 19:15:53,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 277/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 2.997452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:53,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43325 samples/s/p 5:52:06 } +2024-07-25 19:15:56,273 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 279/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 2.9974155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:56,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43303 samples/s/p 5:52:04 } +2024-07-25 19:15:59,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 281/ 1625], loss: 1.244, per_step_time: 1470ms, lr: 2.9973779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:59,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43882 samples/s/p 5:51:38 } +2024-07-25 19:16:02,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 283/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 2.9973404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:02,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43507 samples/s/p 5:51:50 } +2024-07-25 19:16:05,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 285/ 1625], loss: 1.124, per_step_time: 1470ms, lr: 2.9973024e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:05,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.44026 samples/s/p 5:51:27 } +2024-07-25 19:16:08,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 287/ 1625], loss: 1.245, per_step_time: 1471ms, lr: 2.9972643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:08,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43508 samples/s/p 5:51:44 } +2024-07-25 19:16:11,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 289/ 1625], loss: 1.221, per_step_time: 1473ms, lr: 2.997226e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:16:11,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.42919 samples/s/p 5:52:04 } +2024-07-25 19:16:13,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 291/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.9971872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:13,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43117 samples/s/p 5:51:53 } +2024-07-25 19:16:16,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 293/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.9971485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:16,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43425 samples/s/p 5:51:38 } +2024-07-25 19:16:19,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 295/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 2.9971094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:19,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43185 samples/s/p 5:51:45 } +2024-07-25 19:16:22,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 297/ 1625], loss: 0.980, per_step_time: 1471ms, lr: 2.9970697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:22,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43840 samples/s/p 5:51:16 } +2024-07-25 19:16:25,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 299/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 2.9970299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:25,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43852 samples/s/p 5:51:13 } +2024-07-25 19:16:28,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 2/ 10], step:[ 301/ 1625], loss: 1.029, per_step_time: 1473ms, lr: 2.9969902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:28,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.42991 samples/s/p 5:51:43 } +2024-07-25 19:16:31,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 303/ 1625], loss: 1.262, per_step_time: 1474ms, lr: 2.99695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:31,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.42711 samples/s/p 5:51:51 } +2024-07-25 19:16:34,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 305/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.9969093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:34,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.43507 samples/s/p 5:51:17 } +2024-07-25 19:16:37,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 307/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 2.9968685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:37,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.44154 samples/s/p 5:50:49 } +2024-07-25 19:16:40,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 309/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 2.9968276e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:40,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.43336 samples/s/p 5:51:18 } +2024-07-25 19:16:43,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 311/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 2.9967863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:43,492 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 11.9% |█████ | 5.43908 samples/s/p 5:50:53 } +2024-07-25 19:16:46,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 313/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 2.9967445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:46,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.43116 samples/s/p 5:51:21 } +2024-07-25 19:16:49,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 315/ 1625], loss: 1.219, per_step_time: 1469ms, lr: 2.9967028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:49,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.44337 samples/s/p 5:50:31 } +2024-07-25 19:16:52,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 317/ 1625], loss: 1.065, per_step_time: 1473ms, lr: 2.9966604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:52,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.42914 samples/s/p 5:51:23 } +2024-07-25 19:16:55,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 319/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 2.9966182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:55,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.43604 samples/s/p 5:50:53 } +2024-07-25 19:16:58,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 321/ 1625], loss: 1.310, per_step_time: 1472ms, lr: 2.9965757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:58,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.43330 samples/s/p 5:51:01 } +2024-07-25 19:17:01,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 323/ 1625], loss: 1.159, per_step_time: 
1473ms, lr: 2.9965326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:01,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.43021 samples/s/p 5:51:10 } +2024-07-25 19:17:04,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 325/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 2.9964896e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:04,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.44063 samples/s/p 5:50:26 } +2024-07-25 19:17:07,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 327/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.996446e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:07,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.42802 samples/s/p 5:51:12 } +2024-07-25 19:17:10,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 329/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.9964021e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:10,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.43783 samples/s/p 5:50:31 } +2024-07-25 19:17:13,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 331/ 1625], loss: 0.962, per_step_time: 1472ms, lr: 2.9963583e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:13,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.43415 samples/s/p 5:50:43 } +2024-07-25 19:17:15,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 333/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 2.996314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:15,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.43362 samples/s/p 5:50:42 } 
+2024-07-25 19:17:18,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 335/ 1625], loss: 1.274, per_step_time: 1471ms, lr: 2.9962694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:18,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43518 samples/s/p 5:50:33 } +2024-07-25 19:17:21,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 337/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 2.9962248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:21,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43080 samples/s/p 5:50:47 } +2024-07-25 19:17:24,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 339/ 1625], loss: 1.010, per_step_time: 1470ms, lr: 2.9961797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:24,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.44108 samples/s/p 5:50:04 } +2024-07-25 19:17:27,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 341/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 2.9961344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:27,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.44004 samples/s/p 5:50:05 } +2024-07-25 19:17:30,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 343/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.9960887e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:30,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43369 samples/s/p 5:50:27 } +2024-07-25 19:17:33,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 345/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 2.9960429e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:17:33,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43731 samples/s/p 5:50:10 } +2024-07-25 19:17:36,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 347/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.9959969e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:36,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43297 samples/s/p 5:50:24 } +2024-07-25 19:17:39,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 349/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 2.9959503e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:39,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43425 samples/s/p 5:50:16 } +2024-07-25 19:17:42,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 351/ 1625], loss: 1.294, per_step_time: 1470ms, lr: 2.9959036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:42,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43930 samples/s/p 5:49:53 } +2024-07-25 19:17:45,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 353/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.995857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:45,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43302 samples/s/p 5:50:15 } +2024-07-25 19:17:48,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 355/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 2.9958097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:48,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43572 samples/s/p 5:50:01 } +2024-07-25 19:17:51,363 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 357/ 1625], loss: 1.099, per_step_time: 1470ms, lr: 2.9957622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:51,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.44059 samples/s/p 5:49:40 } +2024-07-25 19:17:54,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 359/ 1625], loss: 1.313, per_step_time: 1472ms, lr: 2.9957146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:54,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43143 samples/s/p 5:50:12 } +2024-07-25 19:17:57,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 361/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.9956665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:57,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43758 samples/s/p 5:49:45 } +2024-07-25 19:18:00,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 363/ 1625], loss: 1.339, per_step_time: 1471ms, lr: 2.9956182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:00,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43535 samples/s/p 5:49:51 } +2024-07-25 19:18:03,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 365/ 1625], loss: 1.378, per_step_time: 1472ms, lr: 2.9955698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:03,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43185 samples/s/p 5:50:02 } +2024-07-25 19:18:06,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 367/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.995521e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:18:06,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43725 samples/s/p 5:49:38 } +2024-07-25 19:18:09,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 369/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.995472e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:09,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43338 samples/s/p 5:49:50 } +2024-07-25 19:18:12,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 371/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 2.9954224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:12,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43372 samples/s/p 5:49:45 } +2024-07-25 19:18:14,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 373/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 2.9953728e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:14,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43252 samples/s/p 5:49:47 } +2024-07-25 19:18:17,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 375/ 1625], loss: 1.020, per_step_time: 1472ms, lr: 2.995323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:17,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43152 samples/s/p 5:49:48 } +2024-07-25 19:18:20,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 377/ 1625], loss: 1.340, per_step_time: 1472ms, lr: 2.9952727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:20,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43272 samples/s/p 5:49:41 } +2024-07-25 19:18:23,833 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 379/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 2.9952223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:23,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43240 samples/s/p 5:49:39 } +2024-07-25 19:18:26,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 381/ 1625], loss: 1.076, per_step_time: 1469ms, lr: 2.9951718e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:26,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.44370 samples/s/p 5:48:52 } +2024-07-25 19:18:29,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 383/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 2.995121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:29,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.43734 samples/s/p 5:49:14 } +2024-07-25 19:18:32,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 385/ 1625], loss: 1.209, per_step_time: 1473ms, lr: 2.9950697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:32,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.42922 samples/s/p 5:49:42 } +2024-07-25 19:18:35,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 387/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 2.9950183e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:35,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.43884 samples/s/p 5:49:02 } +2024-07-25 19:18:38,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 389/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 2.9949666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:38,586 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.43194 samples/s/p 5:49:26 } +2024-07-25 19:18:41,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 391/ 1625], loss: 0.983, per_step_time: 1472ms, lr: 2.9949146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:41,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.43249 samples/s/p 5:49:21 } +2024-07-25 19:18:44,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 393/ 1625], loss: 1.274, per_step_time: 1473ms, lr: 2.9948624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:44,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.42842 samples/s/p 5:49:34 } +2024-07-25 19:18:47,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 395/ 1625], loss: 1.141, per_step_time: 1469ms, lr: 2.9948098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:47,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.44231 samples/s/p 5:48:37 } +2024-07-25 19:18:50,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 397/ 1625], loss: 1.052, per_step_time: 1473ms, lr: 2.9947569e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:50,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.42904 samples/s/p 5:49:25 } +2024-07-25 19:18:53,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 399/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.9947041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:53,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43653 samples/s/p 5:48:53 } +2024-07-25 19:18:56,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 2/ 10], step:[ 401/ 1625], loss: 1.027, per_step_time: 1471ms, lr: 2.9946505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:56,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43597 samples/s/p 5:48:53 } +2024-07-25 19:18:59,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 403/ 1625], loss: 1.221, per_step_time: 1470ms, lr: 2.994597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:59,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.44102 samples/s/p 5:48:30 } +2024-07-25 19:19:02,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 405/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.994543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:02,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.42932 samples/s/p 5:49:12 } +2024-07-25 19:19:05,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 407/ 1625], loss: 1.243, per_step_time: 1470ms, lr: 2.994489e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:05,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43939 samples/s/p 5:48:31 } +2024-07-25 19:19:08,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 409/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 2.9944347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:08,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43353 samples/s/p 5:48:50 } +2024-07-25 19:19:11,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 411/ 1625], loss: 1.018, per_step_time: 1470ms, lr: 2.9943802e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:11,048 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 12.5% |██████ | 5.44022 samples/s/p 5:48:22 } +2024-07-25 19:19:14,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 413/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 2.9943252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:14,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43317 samples/s/p 5:48:46 } +2024-07-25 19:19:16,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 415/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 2.9942697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:16,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.43746 samples/s/p 5:48:26 } +2024-07-25 19:19:19,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 417/ 1625], loss: 0.937, per_step_time: 1471ms, lr: 2.994214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:19,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.43623 samples/s/p 5:48:28 } +2024-07-25 19:19:22,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 419/ 1625], loss: 1.222, per_step_time: 1474ms, lr: 2.9941586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:22,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.42688 samples/s/p 5:49:01 } +2024-07-25 19:19:25,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 421/ 1625], loss: 1.013, per_step_time: 1470ms, lr: 2.9941026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:25,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.44009 samples/s/p 5:48:07 } +2024-07-25 19:19:28,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 423/ 1625], loss: 1.266, per_step_time: 
1469ms, lr: 2.9940466e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:28,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.44458 samples/s/p 5:47:47 } +2024-07-25 19:19:31,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 425/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.9939898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:31,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.43663 samples/s/p 5:48:15 } +2024-07-25 19:19:34,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 427/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 2.9939329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:34,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.42963 samples/s/p 5:48:39 } +2024-07-25 19:19:37,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 429/ 1625], loss: 1.238, per_step_time: 1473ms, lr: 2.9938761e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:37,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.42953 samples/s/p 5:48:36 } +2024-07-25 19:19:40,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 431/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 2.9938186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:40,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43468 samples/s/p 5:48:13 } +2024-07-25 19:19:43,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 433/ 1625], loss: 1.165, per_step_time: 1470ms, lr: 2.9937613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:43,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.44048 samples/s/p 5:47:48 } 
+2024-07-25 19:19:46,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 435/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 2.9937031e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:46,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43362 samples/s/p 5:48:12 } +2024-07-25 19:19:49,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 437/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.9936451e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:49,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43602 samples/s/p 5:47:59 } +2024-07-25 19:19:52,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 439/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 2.9935867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:52,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43583 samples/s/p 5:47:57 } +2024-07-25 19:19:55,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 441/ 1625], loss: 1.141, per_step_time: 1470ms, lr: 2.993528e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:55,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.44213 samples/s/p 5:47:30 } +2024-07-25 19:19:58,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 443/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.9934692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:58,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43523 samples/s/p 5:47:54 } +2024-07-25 19:20:01,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 445/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 2.9934099e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:20:01,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43398 samples/s/p 5:47:56 } +2024-07-25 19:20:04,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 447/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 2.9933506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:04,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43247 samples/s/p 5:47:58 } +2024-07-25 19:20:07,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 449/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 2.9932908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:07,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43307 samples/s/p 5:47:53 } +2024-07-25 19:20:10,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 451/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 2.9932306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:10,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43373 samples/s/p 5:47:48 } +2024-07-25 19:20:13,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 453/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.9931705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:13,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43139 samples/s/p 5:47:54 } +2024-07-25 19:20:15,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 455/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.99311e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:15,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43186 samples/s/p 5:47:49 } +2024-07-25 19:20:18,924 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 457/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 2.9930492e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:18,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43642 samples/s/p 5:47:29 } +2024-07-25 19:20:21,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 459/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 2.992988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:21,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43180 samples/s/p 5:47:43 } +2024-07-25 19:20:24,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 461/ 1625], loss: 1.073, per_step_time: 1474ms, lr: 2.9929268e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:24,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.42547 samples/s/p 5:48:05 } +2024-07-25 19:20:27,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 463/ 1625], loss: 1.391, per_step_time: 1470ms, lr: 2.9928653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:27,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.44078 samples/s/p 5:47:03 } +2024-07-25 19:20:30,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 465/ 1625], loss: 1.084, per_step_time: 1473ms, lr: 2.9928033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:30,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.42946 samples/s/p 5:47:43 } +2024-07-25 19:20:33,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 467/ 1625], loss: 1.345, per_step_time: 1472ms, lr: 2.9927412e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:20:33,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43312 samples/s/p 5:47:26 } +2024-07-25 19:20:36,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 469/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.9926789e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:36,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43553 samples/s/p 5:47:14 } +2024-07-25 19:20:39,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 471/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 2.9926163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:39,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43537 samples/s/p 5:47:12 } +2024-07-25 19:20:42,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 473/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 2.9925533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:42,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43784 samples/s/p 5:47:00 } +2024-07-25 19:20:45,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 475/ 1625], loss: 1.206, per_step_time: 1469ms, lr: 2.99249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:45,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.44537 samples/s/p 5:46:28 } +2024-07-25 19:20:48,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 477/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.9924267e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:48,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43767 samples/s/p 5:46:54 } +2024-07-25 19:20:51,383 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 479/ 1625], loss: 1.109, per_step_time: 1471ms, lr: 2.9923629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:51,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43615 samples/s/p 5:46:57 } +2024-07-25 19:20:54,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 481/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 2.9922989e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:54,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43316 samples/s/p 5:47:06 } +2024-07-25 19:20:57,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 483/ 1625], loss: 1.255, per_step_time: 1472ms, lr: 2.9922347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:57,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43266 samples/s/p 5:47:05 } +2024-07-25 19:21:00,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 485/ 1625], loss: 1.120, per_step_time: 1470ms, lr: 2.9921703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:00,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43968 samples/s/p 5:46:35 } +2024-07-25 19:21:03,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 487/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 2.9921053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:03,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43266 samples/s/p 5:46:59 } +2024-07-25 19:21:06,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 489/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 2.9920404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:06,141 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43153 samples/s/p 5:47:00 } +2024-07-25 19:21:09,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 491/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 2.991975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:09,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43545 samples/s/p 5:46:42 } +2024-07-25 19:21:12,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 493/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 2.9919096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:12,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.44174 samples/s/p 5:46:15 } +2024-07-25 19:21:14,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 495/ 1625], loss: 1.365, per_step_time: 1473ms, lr: 2.9918436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:14,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43061 samples/s/p 5:46:55 } +2024-07-25 19:21:17,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 497/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 2.9917775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:17,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43864 samples/s/p 5:46:21 } +2024-07-25 19:21:20,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 499/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 2.9917113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:20,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43665 samples/s/p 5:46:26 } +2024-07-25 19:21:23,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
2/ 10], step:[ 501/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 2.9916446e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:23,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43642 samples/s/p 5:46:24 } +2024-07-25 19:21:26,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 503/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 2.9915775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:26,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43528 samples/s/p 5:46:25 } +2024-07-25 19:21:29,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 505/ 1625], loss: 1.269, per_step_time: 1471ms, lr: 2.9915103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:29,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43613 samples/s/p 5:46:19 } +2024-07-25 19:21:32,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 507/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 2.991443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:32,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.42938 samples/s/p 5:46:42 } +2024-07-25 19:21:35,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 509/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.9913752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:35,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43764 samples/s/p 5:46:07 } +2024-07-25 19:21:38,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 511/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.9913072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:38,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
13.1% |██████ | 5.43715 samples/s/p 5:46:06 } +2024-07-25 19:21:41,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 513/ 1625], loss: 1.351, per_step_time: 1472ms, lr: 2.991239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:41,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43446 samples/s/p 5:46:14 } +2024-07-25 19:21:44,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 515/ 1625], loss: 1.298, per_step_time: 1471ms, lr: 2.9911704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:44,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43787 samples/s/p 5:45:58 } +2024-07-25 19:21:47,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 517/ 1625], loss: 1.050, per_step_time: 1473ms, lr: 2.9911018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:47,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43002 samples/s/p 5:46:25 } +2024-07-25 19:21:50,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 519/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.9910327e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:50,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43591 samples/s/p 5:45:59 } +2024-07-25 19:21:53,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 521/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 2.9909634e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:53,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43268 samples/s/p 5:46:09 } +2024-07-25 19:21:56,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 523/ 1625], loss: 1.229, per_step_time: 1472ms, 
lr: 2.9908939e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:56,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43288 samples/s/p 5:46:05 } +2024-07-25 19:21:59,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 525/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.9908242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:59,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43615 samples/s/p 5:45:49 } +2024-07-25 19:22:02,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 527/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 2.9907538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:02,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.44123 samples/s/p 5:45:27 } +2024-07-25 19:22:05,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 529/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 2.9906834e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:05,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43155 samples/s/p 5:46:01 } +2024-07-25 19:22:08,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 531/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.9906128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:08,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43500 samples/s/p 5:45:45 } +2024-07-25 19:22:11,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 533/ 1625], loss: 1.311, per_step_time: 1473ms, lr: 2.990542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:11,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.42897 samples/s/p 5:46:05 } +2024-07-25 
19:22:14,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 535/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 2.9904708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:14,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43283 samples/s/p 5:45:47 } +2024-07-25 19:22:16,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 537/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 2.9903993e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:16,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43598 samples/s/p 5:45:32 } +2024-07-25 19:22:19,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 539/ 1625], loss: 1.224, per_step_time: 1471ms, lr: 2.9903278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:19,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43516 samples/s/p 5:45:33 } +2024-07-25 19:22:22,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 541/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 2.9902556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:22,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43493 samples/s/p 5:45:31 } +2024-07-25 19:22:25,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 543/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 2.9901834e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:25,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43568 samples/s/p 5:45:25 } +2024-07-25 19:22:28,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 545/ 1625], loss: 1.101, per_step_time: 1470ms, lr: 2.990111e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:22:28,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.44117 samples/s/p 5:45:01 } +2024-07-25 19:22:31,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 547/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 2.990038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:31,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43274 samples/s/p 5:45:30 } +2024-07-25 19:22:34,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 549/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 2.9899651e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:34,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43462 samples/s/p 5:45:20 } +2024-07-25 19:22:37,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 551/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 2.9898918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:37,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43266 samples/s/p 5:45:25 } +2024-07-25 19:22:40,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 553/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 2.9898185e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:40,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43844 samples/s/p 5:45:00 } +2024-07-25 19:22:43,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 555/ 1625], loss: 1.062, per_step_time: 1470ms, lr: 2.9897445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:43,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.44090 samples/s/p 5:44:47 } +2024-07-25 19:22:46,478 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 557/ 1625], loss: 1.245, per_step_time: 1473ms, lr: 2.9896704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:46,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43034 samples/s/p 5:45:25 } +2024-07-25 19:22:49,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 559/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 2.9895962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:49,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.42884 samples/s/p 5:45:27 } +2024-07-25 19:22:52,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 561/ 1625], loss: 1.331, per_step_time: 1471ms, lr: 2.9895215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:52,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43636 samples/s/p 5:44:56 } +2024-07-25 19:22:55,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 563/ 1625], loss: 1.104, per_step_time: 1470ms, lr: 2.9894465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:55,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.44117 samples/s/p 5:44:34 } +2024-07-25 19:22:58,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 565/ 1625], loss: 1.060, per_step_time: 1473ms, lr: 2.9893716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:58,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43077 samples/s/p 5:45:11 } +2024-07-25 19:23:01,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 567/ 1625], loss: 1.273, per_step_time: 1471ms, lr: 2.9892959e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:23:01,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43645 samples/s/p 5:44:47 } +2024-07-25 19:23:04,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 569/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 2.9892202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:04,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43570 samples/s/p 5:44:46 } +2024-07-25 19:23:07,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 571/ 1625], loss: 0.978, per_step_time: 1471ms, lr: 2.9891444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:07,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43566 samples/s/p 5:44:44 } +2024-07-25 19:23:10,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 573/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.9890682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:10,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43836 samples/s/p 5:44:30 } +2024-07-25 19:23:13,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 575/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 2.9889916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:13,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43441 samples/s/p 5:44:43 } +2024-07-25 19:23:15,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 577/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 2.9889148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:15,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43168 samples/s/p 5:44:50 } +2024-07-25 19:23:18,938 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 579/ 1625], loss: 0.990, per_step_time: 1471ms, lr: 2.9888379e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:18,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43836 samples/s/p 5:44:22 } +2024-07-25 19:23:21,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 581/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 2.9887606e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:21,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43610 samples/s/p 5:44:27 } +2024-07-25 19:23:24,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 583/ 1625], loss: 1.335, per_step_time: 1471ms, lr: 2.988683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:24,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43487 samples/s/p 5:44:29 } +2024-07-25 19:23:27,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 585/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 2.9886052e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:27,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43648 samples/s/p 5:44:20 } +2024-07-25 19:23:30,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 587/ 1625], loss: 1.113, per_step_time: 1473ms, lr: 2.9885274e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:30,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43078 samples/s/p 5:44:39 } +2024-07-25 19:23:33,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 589/ 1625], loss: 1.420, per_step_time: 1472ms, lr: 2.9884488e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:33,697 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43317 samples/s/p 5:44:27 } +2024-07-25 19:23:36,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 591/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 2.9883704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:36,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43364 samples/s/p 5:44:22 } +2024-07-25 19:23:39,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 593/ 1625], loss: 1.284, per_step_time: 1473ms, lr: 2.988291e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:39,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.42767 samples/s/p 5:44:42 } +2024-07-25 19:23:42,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 595/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 2.988212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:42,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43759 samples/s/p 5:44:01 } +2024-07-25 19:23:45,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 597/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 2.9881328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:45,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43230 samples/s/p 5:44:18 } +2024-07-25 19:23:48,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 599/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 2.9880532e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:48,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43974 samples/s/p 5:43:47 } +2024-07-25 19:23:51,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
2/ 10], step:[ 601/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 2.9879731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:51,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43548 samples/s/p 5:44:00 } +2024-07-25 19:23:54,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 603/ 1625], loss: 1.055, per_step_time: 1471ms, lr: 2.9878931e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:54,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43577 samples/s/p 5:43:56 } +2024-07-25 19:23:57,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 605/ 1625], loss: 1.333, per_step_time: 1472ms, lr: 2.9878125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:57,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43353 samples/s/p 5:44:02 } +2024-07-25 19:24:00,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 607/ 1625], loss: 1.182, per_step_time: 1473ms, lr: 2.9877318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:00,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43062 samples/s/p 5:44:10 } +2024-07-25 19:24:03,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 609/ 1625], loss: 1.312, per_step_time: 1472ms, lr: 2.987651e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:03,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43224 samples/s/p 5:44:01 } +2024-07-25 19:24:06,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 611/ 1625], loss: 1.324, per_step_time: 1473ms, lr: 2.9875695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:06,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
13.8% |██████ | 5.43093 samples/s/p 5:44:03 } +2024-07-25 19:24:09,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 613/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 2.9874882e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:09,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43602 samples/s/p 5:43:40 } +2024-07-25 19:24:12,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 615/ 1625], loss: 1.271, per_step_time: 1473ms, lr: 2.9874062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:12,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.42745 samples/s/p 5:44:10 } +2024-07-25 19:24:15,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 617/ 1625], loss: 1.331, per_step_time: 1471ms, lr: 2.9873243e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:15,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43535 samples/s/p 5:43:37 } +2024-07-25 19:24:17,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 619/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 2.9872419e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:17,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43618 samples/s/p 5:43:31 } +2024-07-25 19:24:20,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 621/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 2.9871593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:20,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43841 samples/s/p 5:43:20 } +2024-07-25 19:24:23,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 623/ 1625], loss: 1.162, per_step_time: 1472ms, 
lr: 2.9870764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:23,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43370 samples/s/p 5:43:35 } +2024-07-25 19:24:26,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 625/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 2.9869934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:26,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43278 samples/s/p 5:43:35 } +2024-07-25 19:24:29,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 627/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.9869097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:29,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43391 samples/s/p 5:43:28 } +2024-07-25 19:24:32,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 629/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.986826e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:32,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43436 samples/s/p 5:43:23 } +2024-07-25 19:24:35,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 631/ 1625], loss: 1.349, per_step_time: 1473ms, lr: 2.9867424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:35,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43079 samples/s/p 5:43:34 } +2024-07-25 19:24:38,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 633/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.986658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:38,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43561 samples/s/p 5:43:13 } +2024-07-25 
19:24:41,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 635/ 1625], loss: 1.105, per_step_time: 1470ms, lr: 2.9865738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:41,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43915 samples/s/p 5:42:56 } +2024-07-25 19:24:44,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 637/ 1625], loss: 1.286, per_step_time: 1471ms, lr: 2.986489e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:44,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43702 samples/s/p 5:43:01 } +2024-07-25 19:24:47,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 639/ 1625], loss: 1.244, per_step_time: 1470ms, lr: 2.9864039e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:47,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.44095 samples/s/p 5:42:44 } +2024-07-25 19:24:50,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 641/ 1625], loss: 1.287, per_step_time: 1474ms, lr: 2.9863188e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:50,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.42416 samples/s/p 5:43:44 } +2024-07-25 19:24:53,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 643/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.9862333e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:53,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.43259 samples/s/p 5:43:09 } +2024-07-25 19:24:56,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 645/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.9861474e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:24:56,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.43576 samples/s/p 5:42:54 } +2024-07-25 19:24:59,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 647/ 1625], loss: 1.180, per_step_time: 1470ms, lr: 2.9860614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:59,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.44184 samples/s/p 5:42:28 } +2024-07-25 19:25:02,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 649/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 2.9859752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:02,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.43552 samples/s/p 5:42:49 } +2024-07-25 19:25:05,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 651/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.9858886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:05,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.43539 samples/s/p 5:42:47 } +2024-07-25 19:25:08,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 653/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 2.9858018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:08,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.43394 samples/s/p 5:42:49 } +2024-07-25 19:25:11,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 655/ 1625], loss: 1.277, per_step_time: 1471ms, lr: 2.9857147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:11,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.43787 samples/s/p 5:42:32 } +2024-07-25 19:25:14,051 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 657/ 1625], loss: 1.191, per_step_time: 1476ms, lr: 2.9856272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:14,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.41968 samples/s/p 5:43:38 } +2024-07-25 19:25:17,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 659/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.9855397e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:17,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43604 samples/s/p 5:42:33 } +2024-07-25 19:25:19,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 661/ 1625], loss: 1.058, per_step_time: 1471ms, lr: 2.9854516e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:19,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43487 samples/s/p 5:42:34 } +2024-07-25 19:25:22,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 663/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 2.9853638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:22,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.42860 samples/s/p 5:42:55 } +2024-07-25 19:25:25,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 665/ 1625], loss: 1.203, per_step_time: 1473ms, lr: 2.9852752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:25,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43033 samples/s/p 5:42:45 } +2024-07-25 19:25:28,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 667/ 1625], loss: 1.036, per_step_time: 1471ms, lr: 2.9851866e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:25:28,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43650 samples/s/p 5:42:19 } +2024-07-25 19:25:31,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 669/ 1625], loss: 1.163, per_step_time: 1473ms, lr: 2.9850975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:31,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43089 samples/s/p 5:42:37 } +2024-07-25 19:25:34,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 671/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 2.9850084e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:34,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43894 samples/s/p 5:42:04 } +2024-07-25 19:25:37,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 673/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.984919e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:37,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43339 samples/s/p 5:42:22 } +2024-07-25 19:25:40,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 675/ 1625], loss: 1.031, per_step_time: 1472ms, lr: 2.9848292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:40,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43477 samples/s/p 5:42:14 } +2024-07-25 19:25:43,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 677/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 2.984739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:43,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43232 samples/s/p 5:42:20 } +2024-07-25 19:25:46,522 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 679/ 1625], loss: 1.279, per_step_time: 1471ms, lr: 2.9846487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:46,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43497 samples/s/p 5:42:07 } +2024-07-25 19:25:49,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 681/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 2.9845582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:49,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.42892 samples/s/p 5:42:27 } +2024-07-25 19:25:52,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 683/ 1625], loss: 1.056, per_step_time: 1472ms, lr: 2.9844676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:52,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43128 samples/s/p 5:42:15 } +2024-07-25 19:25:55,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 685/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 2.9843766e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:55,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43808 samples/s/p 5:41:47 } +2024-07-25 19:25:58,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 687/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 2.9842851e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:58,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43801 samples/s/p 5:41:44 } +2024-07-25 19:26:01,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 689/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 2.9841935e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:26:01,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43209 samples/s/p 5:42:03 } +2024-07-25 19:26:04,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 691/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 2.9841016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:04,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43093 samples/s/p 5:42:05 } +2024-07-25 19:26:07,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 693/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 2.9840096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:07,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43466 samples/s/p 5:41:48 } +2024-07-25 19:26:10,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 695/ 1625], loss: 1.242, per_step_time: 1473ms, lr: 2.9839173e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:10,140 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.42825 samples/s/p 5:42:09 } +2024-07-25 19:26:13,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 697/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 2.9838244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:13,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43282 samples/s/p 5:41:49 } +2024-07-25 19:26:16,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 699/ 1625], loss: 1.255, per_step_time: 1473ms, lr: 2.9837316e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:16,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.42896 samples/s/p 5:42:01 } +2024-07-25 19:26:18,995 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 701/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 2.9836385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:18,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43737 samples/s/p 5:41:26 } +2024-07-25 19:26:21,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 703/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 2.9835448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:21,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.44084 samples/s/p 5:41:10 } +2024-07-25 19:26:24,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 705/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 2.9834513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:24,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43545 samples/s/p 5:41:27 } +2024-07-25 19:26:27,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 707/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 2.9833573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:27,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43315 samples/s/p 5:41:33 } +2024-07-25 19:26:30,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 709/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 2.9832629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:30,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43008 samples/s/p 5:41:42 } +2024-07-25 19:26:33,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 711/ 1625], loss: 1.205, per_step_time: 1473ms, lr: 2.9831685e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:26:33,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43102 samples/s/p 5:41:35 } +2024-07-25 19:26:36,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 713/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.9830737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:36,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43310 samples/s/p 5:41:24 } +2024-07-25 19:26:39,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 715/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 2.9829787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:39,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43668 samples/s/p 5:41:08 } +2024-07-25 19:26:42,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 717/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 2.9828832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:42,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43444 samples/s/p 5:41:13 } +2024-07-25 19:26:45,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 719/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 2.982788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:45,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43348 samples/s/p 5:41:14 } +2024-07-25 19:26:48,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 721/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.982692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:48,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43326 samples/s/p 5:41:12 } +2024-07-25 19:26:51,464 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 723/ 1625], loss: 1.023, per_step_time: 1472ms, lr: 2.982596e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:51,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43236 samples/s/p 5:41:12 } +2024-07-25 19:26:54,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 725/ 1625], loss: 1.047, per_step_time: 1473ms, lr: 2.9824996e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:54,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43057 samples/s/p 5:41:16 } +2024-07-25 19:26:57,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 727/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 2.9824028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:57,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43215 samples/s/p 5:41:07 } +2024-07-25 19:27:00,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 729/ 1625], loss: 1.359, per_step_time: 1474ms, lr: 2.9823059e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:00,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.42662 samples/s/p 5:41:25 } +2024-07-25 19:27:03,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 731/ 1625], loss: 1.351, per_step_time: 1471ms, lr: 2.9822088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:03,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43560 samples/s/p 5:40:48 } +2024-07-25 19:27:06,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 733/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.9821114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:27:06,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43297 samples/s/p 5:40:55 } +2024-07-25 19:27:09,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 735/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 2.9820138e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:09,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43821 samples/s/p 5:40:33 } +2024-07-25 19:27:12,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 737/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 2.9819159e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:12,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43406 samples/s/p 5:40:45 } +2024-07-25 19:27:15,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 739/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 2.9818177e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:15,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43003 samples/s/p 5:40:58 } +2024-07-25 19:27:18,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 741/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.9817189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:18,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.43113 samples/s/p 5:40:51 } +2024-07-25 19:27:20,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 743/ 1625], loss: 1.389, per_step_time: 1472ms, lr: 2.9816205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:20,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.43377 samples/s/p 5:40:38 } +2024-07-25 19:27:23,936 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 745/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 2.9815214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:23,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.44100 samples/s/p 5:40:08 } +2024-07-25 19:27:26,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 747/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 2.9814222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:26,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.43522 samples/s/p 5:40:26 } +2024-07-25 19:27:29,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 749/ 1625], loss: 1.235, per_step_time: 1474ms, lr: 2.9813224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:29,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.42693 samples/s/p 5:40:55 } +2024-07-25 19:27:32,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 751/ 1625], loss: 1.108, per_step_time: 1474ms, lr: 2.9812229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:32,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.42573 samples/s/p 5:40:56 } +2024-07-25 19:27:35,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 753/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.9811226e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:35,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.43138 samples/s/p 5:40:32 } +2024-07-25 19:27:38,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 755/ 1625], loss: 1.218, per_step_time: 1481ms, lr: 2.9810224e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:27:38,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.39828 samples/s/p 5:42:34 } +2024-07-25 19:27:41,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 757/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 2.9809218e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:41,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43103 samples/s/p 5:40:27 } +2024-07-25 19:27:44,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 759/ 1625], loss: 1.345, per_step_time: 1473ms, lr: 2.9808209e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:44,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43015 samples/s/p 5:40:28 } +2024-07-25 19:27:47,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 761/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 2.98072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:47,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43176 samples/s/p 5:40:19 } +2024-07-25 19:27:50,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 763/ 1625], loss: 1.238, per_step_time: 1473ms, lr: 2.9806186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:50,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43036 samples/s/p 5:40:21 } +2024-07-25 19:27:53,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 765/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 2.9805167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:53,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43484 samples/s/p 5:40:01 } +2024-07-25 19:27:56,439 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 767/ 1625], loss: 1.042, per_step_time: 1472ms, lr: 2.9804149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:56,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43394 samples/s/p 5:40:02 } +2024-07-25 19:27:59,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 769/ 1625], loss: 1.125, per_step_time: 1473ms, lr: 2.9803128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:59,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.42794 samples/s/p 5:40:21 } +2024-07-25 19:28:02,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 771/ 1625], loss: 1.234, per_step_time: 1473ms, lr: 2.9802102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:02,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43028 samples/s/p 5:40:10 } +2024-07-25 19:28:05,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 773/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 2.9801076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:05,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.43450 samples/s/p 5:39:51 } +2024-07-25 19:28:08,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 775/ 1625], loss: 1.220, per_step_time: 1469ms, lr: 2.9800045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:08,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.44313 samples/s/p 5:39:15 } +2024-07-25 19:28:11,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 777/ 1625], loss: 1.292, per_step_time: 1474ms, lr: 2.9799015e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:28:11,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.42640 samples/s/p 5:40:15 } +2024-07-25 19:28:14,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 779/ 1625], loss: 1.054, per_step_time: 1470ms, lr: 2.9797979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:14,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.44021 samples/s/p 5:39:20 } +2024-07-25 19:28:17,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 781/ 1625], loss: 1.144, per_step_time: 1472ms, lr: 2.9796942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:17,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.43391 samples/s/p 5:39:41 } +2024-07-25 19:28:20,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 783/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 2.9795901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:20,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.43029 samples/s/p 5:39:52 } +2024-07-25 19:28:23,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 785/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.9794859e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:23,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.43430 samples/s/p 5:39:34 } +2024-07-25 19:28:25,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 787/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.9793813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:25,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.43078 samples/s/p 5:39:44 } +2024-07-25 19:28:28,910 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 789/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 2.9792765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:28,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43679 samples/s/p 5:39:19 } +2024-07-25 19:28:31,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 791/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 2.9791714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:31,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43300 samples/s/p 5:39:30 } +2024-07-25 19:28:34,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 793/ 1625], loss: 0.885, per_step_time: 1470ms, lr: 2.979066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:34,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.44180 samples/s/p 5:38:54 } +2024-07-25 19:28:37,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 795/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 2.9789604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:37,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43682 samples/s/p 5:39:10 } +2024-07-25 19:28:40,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 797/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 2.9788547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:40,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43471 samples/s/p 5:39:15 } +2024-07-25 19:28:43,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 799/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 2.9787485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:28:43,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43638 samples/s/p 5:39:05 } +2024-07-25 19:28:46,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 801/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 2.978642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:46,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43354 samples/s/p 5:39:13 } +2024-07-25 19:28:49,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 803/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 2.9785355e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:49,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43870 samples/s/p 5:38:51 } +2024-07-25 19:28:52,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 805/ 1625], loss: 1.279, per_step_time: 1471ms, lr: 2.9784285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:52,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43786 samples/s/p 5:38:51 } +2024-07-25 19:28:55,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 807/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 2.9783214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:55,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43835 samples/s/p 5:38:46 } +2024-07-25 19:28:58,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 809/ 1625], loss: 1.312, per_step_time: 1472ms, lr: 2.9782139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:58,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43264 samples/s/p 5:39:05 } +2024-07-25 19:29:01,364 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 811/ 1625], loss: 1.009, per_step_time: 1471ms, lr: 2.9781062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:01,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43807 samples/s/p 5:38:41 } +2024-07-25 19:29:04,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 813/ 1625], loss: 1.174, per_step_time: 1473ms, lr: 2.9779982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:04,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.42932 samples/s/p 5:39:11 } +2024-07-25 19:29:07,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 815/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 2.97789e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:07,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43427 samples/s/p 5:38:50 } +2024-07-25 19:29:10,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 817/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 2.9777813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:10,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43140 samples/s/p 5:38:58 } +2024-07-25 19:29:13,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 819/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 2.9776727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:13,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43471 samples/s/p 5:38:42 } +2024-07-25 19:29:16,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 821/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 2.9775636e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:29:16,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43437 samples/s/p 5:38:41 } +2024-07-25 19:29:19,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 823/ 1625], loss: 1.268, per_step_time: 1470ms, lr: 2.9774543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:19,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43905 samples/s/p 5:38:20 } +2024-07-25 19:29:22,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 825/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 2.9773448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:22,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.44087 samples/s/p 5:38:10 } +2024-07-25 19:29:24,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 827/ 1625], loss: 1.146, per_step_time: 1477ms, lr: 2.977235e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:24,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.41494 samples/s/p 5:39:45 } +2024-07-25 19:29:27,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 829/ 1625], loss: 1.279, per_step_time: 1470ms, lr: 2.9771249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:27,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43941 samples/s/p 5:38:10 } +2024-07-25 19:29:30,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 831/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 2.9770146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:30,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43542 samples/s/p 5:38:22 } +2024-07-25 19:29:33,836 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 833/ 1625], loss: 1.014, per_step_time: 1472ms, lr: 2.9769039e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:33,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43253 samples/s/p 5:38:30 } +2024-07-25 19:29:36,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 835/ 1625], loss: 1.198, per_step_time: 1470ms, lr: 2.9767929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:36,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43882 samples/s/p 5:38:03 } +2024-07-25 19:29:39,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 837/ 1625], loss: 1.070, per_step_time: 1473ms, lr: 2.976682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:39,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.42869 samples/s/p 5:38:38 } +2024-07-25 19:29:42,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 839/ 1625], loss: 1.367, per_step_time: 1471ms, lr: 2.9765704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:42,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43629 samples/s/p 5:38:07 } +2024-07-25 19:29:45,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 841/ 1625], loss: 0.965, per_step_time: 1472ms, lr: 2.9764587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:45,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43215 samples/s/p 5:38:19 } +2024-07-25 19:29:48,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 843/ 1625], loss: 1.341, per_step_time: 1470ms, lr: 2.976347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:29:48,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.44036 samples/s/p 5:37:46 } +2024-07-25 19:29:51,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 845/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 2.9762348e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:51,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.42985 samples/s/p 5:38:22 } +2024-07-25 19:29:54,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 847/ 1625], loss: 1.444, per_step_time: 1471ms, lr: 2.9761222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:54,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43674 samples/s/p 5:37:53 } +2024-07-25 19:29:57,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 849/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 2.9760096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:57,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43267 samples/s/p 5:38:06 } +2024-07-25 19:30:00,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 851/ 1625], loss: 1.169, per_step_time: 1472ms, lr: 2.9758965e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:00,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43222 samples/s/p 5:38:04 } +2024-07-25 19:30:03,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 853/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 2.9757832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:03,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.42987 samples/s/p 5:38:10 } +2024-07-25 19:30:06,303 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 855/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 2.9756698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:06,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43626 samples/s/p 5:37:43 } +2024-07-25 19:30:09,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 857/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.975556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:09,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43400 samples/s/p 5:37:49 } +2024-07-25 19:30:12,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 859/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.975442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:12,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43794 samples/s/p 5:37:31 } +2024-07-25 19:30:15,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 861/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 2.9753279e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:15,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43384 samples/s/p 5:37:44 } +2024-07-25 19:30:18,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 863/ 1625], loss: 1.096, per_step_time: 1473ms, lr: 2.9752133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:18,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.42931 samples/s/p 5:37:58 } +2024-07-25 19:30:21,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 865/ 1625], loss: 1.202, per_step_time: 1474ms, lr: 2.9750983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:30:21,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.42549 samples/s/p 5:38:09 } +2024-07-25 19:30:24,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 867/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 2.9749832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:24,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43773 samples/s/p 5:37:20 } +2024-07-25 19:30:26,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 869/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 2.9748679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:26,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43526 samples/s/p 5:37:27 } +2024-07-25 19:30:29,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 871/ 1625], loss: 1.134, per_step_time: 1469ms, lr: 2.9747522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:29,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.44235 samples/s/p 5:36:57 } +2024-07-25 19:30:32,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 873/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 2.9746365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:32,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43657 samples/s/p 5:37:16 } +2024-07-25 19:30:35,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 875/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 2.9745202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:35,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43773 samples/s/p 5:37:09 } +2024-07-25 19:30:38,766 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 877/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 2.9744038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:38,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43518 samples/s/p 5:37:15 } +2024-07-25 19:30:41,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 879/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.9742872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:41,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43394 samples/s/p 5:37:17 } +2024-07-25 19:30:44,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 881/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 2.9741705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:44,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43732 samples/s/p 5:37:01 } +2024-07-25 19:30:47,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 883/ 1625], loss: 1.387, per_step_time: 1471ms, lr: 2.9740533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:47,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43596 samples/s/p 5:37:03 } +2024-07-25 19:30:50,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 885/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 2.9739356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:50,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.44174 samples/s/p 5:36:39 } +2024-07-25 19:30:53,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 887/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.9738178e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:30:53,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.43468 samples/s/p 5:37:02 } +2024-07-25 19:30:56,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 889/ 1625], loss: 1.034, per_step_time: 1470ms, lr: 2.9736999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:56,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.44028 samples/s/p 5:36:38 } +2024-07-25 19:30:59,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 891/ 1625], loss: 1.335, per_step_time: 1473ms, lr: 2.9735816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:59,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.42990 samples/s/p 5:37:14 } +2024-07-25 19:31:02,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 893/ 1625], loss: 1.258, per_step_time: 1474ms, lr: 2.973463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:02,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.42660 samples/s/p 5:37:23 } +2024-07-25 19:31:05,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 895/ 1625], loss: 1.282, per_step_time: 1470ms, lr: 2.9733445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:05,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.43894 samples/s/p 5:36:35 } +2024-07-25 19:31:08,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 897/ 1625], loss: 1.307, per_step_time: 1470ms, lr: 2.9732257e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:08,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.44070 samples/s/p 5:36:25 } +2024-07-25 19:31:11,225 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 899/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 2.973106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:11,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.43182 samples/s/p 5:36:55 } +2024-07-25 19:31:14,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 901/ 1625], loss: 1.169, per_step_time: 1473ms, lr: 2.9729865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:14,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.42928 samples/s/p 5:37:02 } +2024-07-25 19:31:17,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 903/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 2.9728668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:17,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43561 samples/s/p 5:36:35 } +2024-07-25 19:31:20,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 905/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 2.9727466e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:20,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43556 samples/s/p 5:36:32 } +2024-07-25 19:31:23,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 907/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.9726263e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:23,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43688 samples/s/p 5:36:25 } +2024-07-25 19:31:25,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 909/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.9725057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:31:25,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43184 samples/s/p 5:36:40 } +2024-07-25 19:31:28,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 911/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 2.972385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:28,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.44126 samples/s/p 5:36:02 } +2024-07-25 19:31:31,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 913/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.9722638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:31,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43559 samples/s/p 5:36:21 } +2024-07-25 19:31:34,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 915/ 1625], loss: 1.150, per_step_time: 1473ms, lr: 2.9721425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:34,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.42985 samples/s/p 5:36:39 } +2024-07-25 19:31:37,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 917/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 2.9720208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:37,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43771 samples/s/p 5:36:07 } +2024-07-25 19:31:40,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 919/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 2.9718987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:40,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.44132 samples/s/p 5:35:50 } +2024-07-25 19:31:43,683 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 921/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 2.9717767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:43,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43604 samples/s/p 5:36:07 } +2024-07-25 19:31:46,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 923/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 2.9716544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:46,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43488 samples/s/p 5:36:08 } +2024-07-25 19:31:49,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 925/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 2.9715315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:49,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43218 samples/s/p 5:36:16 } +2024-07-25 19:31:52,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 927/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.9714083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:52,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43491 samples/s/p 5:36:02 } +2024-07-25 19:31:55,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 929/ 1625], loss: 1.329, per_step_time: 1472ms, lr: 2.9712852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:55,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43413 samples/s/p 5:36:02 } +2024-07-25 19:31:58,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 931/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 2.9711617e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:31:58,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43492 samples/s/p 5:35:57 } +2024-07-25 19:32:01,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 933/ 1625], loss: 1.436, per_step_time: 1474ms, lr: 2.971038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:01,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.42706 samples/s/p 5:36:23 } +2024-07-25 19:32:04,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 935/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 2.9709141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:04,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43079 samples/s/p 5:36:06 } +2024-07-25 19:32:07,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 937/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 2.9707897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:07,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43681 samples/s/p 5:35:41 } +2024-07-25 19:32:10,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 939/ 1625], loss: 1.044, per_step_time: 1481ms, lr: 2.9706653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:10,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.39954 samples/s/p 5:37:57 } +2024-07-25 19:32:13,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 941/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.9705405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:13,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43844 samples/s/p 5:35:29 } +2024-07-25 19:32:16,171 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 943/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 2.9704153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:16,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43309 samples/s/p 5:35:46 } +2024-07-25 19:32:19,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 945/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.9702898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:19,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43536 samples/s/p 5:35:34 } +2024-07-25 19:32:22,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 947/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 2.9701643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:22,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43866 samples/s/p 5:35:19 } +2024-07-25 19:32:25,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 949/ 1625], loss: 0.999, per_step_time: 1472ms, lr: 2.9700386e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:25,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43420 samples/s/p 5:35:33 } +2024-07-25 19:32:27,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 951/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.9699124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:27,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43449 samples/s/p 5:35:29 } +2024-07-25 19:32:30,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 953/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 2.9697861e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:32:30,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43362 samples/s/p 5:35:29 } +2024-07-25 19:32:33,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 955/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 2.9696595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:33,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43032 samples/s/p 5:35:38 } +2024-07-25 19:32:36,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 957/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 2.9695326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:36,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.42932 samples/s/p 5:35:39 } +2024-07-25 19:32:39,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 959/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 2.9694054e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:39,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43278 samples/s/p 5:35:23 } +2024-07-25 19:32:42,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 961/ 1625], loss: 1.044, per_step_time: 1473ms, lr: 2.969278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:42,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43094 samples/s/p 5:35:27 } +2024-07-25 19:32:45,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 963/ 1625], loss: 1.204, per_step_time: 1473ms, lr: 2.9691504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:45,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43040 samples/s/p 5:35:26 } +2024-07-25 19:32:48,669 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 965/ 1625], loss: 1.397, per_step_time: 1483ms, lr: 2.9690224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:48,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.39164 samples/s/p 5:37:48 } +2024-07-25 19:32:51,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 967/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.9688941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:51,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.43547 samples/s/p 5:35:02 } +2024-07-25 19:32:54,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 969/ 1625], loss: 0.999, per_step_time: 1471ms, lr: 2.9687657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:54,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.43516 samples/s/p 5:35:00 } +2024-07-25 19:32:57,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 971/ 1625], loss: 1.005, per_step_time: 1472ms, lr: 2.9686367e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:57,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.43340 samples/s/p 5:35:03 } +2024-07-25 19:33:00,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 973/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.9685078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:00,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.43344 samples/s/p 5:35:00 } +2024-07-25 19:33:03,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 975/ 1625], loss: 1.261, per_step_time: 1470ms, lr: 2.9683788e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:33:03,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.43858 samples/s/p 5:34:38 } +2024-07-25 19:33:06,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 977/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 2.9682491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:06,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.42799 samples/s/p 5:35:15 } +2024-07-25 19:33:09,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 979/ 1625], loss: 1.144, per_step_time: 1470ms, lr: 2.9681194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:09,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.43890 samples/s/p 5:34:31 } +2024-07-25 19:33:12,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 981/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 2.9679892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:12,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.43748 samples/s/p 5:34:34 } +2024-07-25 19:33:15,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 983/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.967859e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:15,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.43210 samples/s/p 5:34:50 } +2024-07-25 19:33:18,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 985/ 1625], loss: 0.980, per_step_time: 1472ms, lr: 2.9677285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:18,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43322 samples/s/p 5:34:43 } +2024-07-25 19:33:21,134 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 987/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 2.9675975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:21,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43356 samples/s/p 5:34:39 } +2024-07-25 19:33:24,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 989/ 1625], loss: 1.337, per_step_time: 1472ms, lr: 2.9674666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:24,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43206 samples/s/p 5:34:42 } +2024-07-25 19:33:27,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 991/ 1625], loss: 1.347, per_step_time: 1471ms, lr: 2.967335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:27,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43810 samples/s/p 5:34:17 } +2024-07-25 19:33:29,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 993/ 1625], loss: 1.390, per_step_time: 1472ms, lr: 2.9672035e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:29,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43435 samples/s/p 5:34:27 } +2024-07-25 19:33:32,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 995/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 2.9670717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:32,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43905 samples/s/p 5:34:07 } +2024-07-25 19:33:35,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 997/ 1625], loss: 1.206, per_step_time: 1472ms, lr: 2.9669396e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:33:35,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43301 samples/s/p 5:34:26 } +2024-07-25 19:33:38,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 999/ 1625], loss: 1.359, per_step_time: 1471ms, lr: 2.9668072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:38,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43722 samples/s/p 5:34:08 } +2024-07-25 19:33:41,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1001/ 1625], loss: 0.931, per_step_time: 1471ms, lr: 2.9666744e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:41,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43668 samples/s/p 5:34:07 } +2024-07-25 19:33:44,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1003/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.9665418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:44,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43594 samples/s/p 5:34:07 } +2024-07-25 19:33:47,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1005/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 2.9664083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:47,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.42864 samples/s/p 5:34:31 } +2024-07-25 19:33:50,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1007/ 1625], loss: 1.099, per_step_time: 1469ms, lr: 2.966275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:50,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.44335 samples/s/p 5:33:34 } +2024-07-25 19:33:53,591 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1009/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.9661414e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:53,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43727 samples/s/p 5:33:53 } +2024-07-25 19:33:56,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1011/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.9660072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:56,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43601 samples/s/p 5:33:55 } +2024-07-25 19:33:59,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1013/ 1625], loss: 1.163, per_step_time: 1473ms, lr: 2.9658731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:59,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.42911 samples/s/p 5:34:17 } +2024-07-25 19:34:02,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1015/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 2.9657387e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:02,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43410 samples/s/p 5:33:56 } +2024-07-25 19:34:05,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1017/ 1625], loss: 1.266, per_step_time: 1474ms, lr: 2.9656037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:05,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.42582 samples/s/p 5:34:24 } +2024-07-25 19:34:08,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1019/ 1625], loss: 1.044, per_step_time: 1470ms, lr: 2.9654688e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:34:08,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.44189 samples/s/p 5:33:21 } +2024-07-25 19:34:11,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1021/ 1625], loss: 1.207, per_step_time: 1473ms, lr: 2.9653334e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:11,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43041 samples/s/p 5:34:01 } +2024-07-25 19:34:14,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1023/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 2.9651981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:14,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43176 samples/s/p 5:33:53 } +2024-07-25 19:34:17,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1025/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.965062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:17,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43384 samples/s/p 5:33:42 } +2024-07-25 19:34:20,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1027/ 1625], loss: 1.127, per_step_time: 1473ms, lr: 2.964926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:20,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43084 samples/s/p 5:33:50 } +2024-07-25 19:34:23,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1029/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 2.9647897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:23,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43451 samples/s/p 5:33:34 } +2024-07-25 19:34:26,066 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1031/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.9646533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:26,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43143 samples/s/p 5:33:42 } +2024-07-25 19:34:29,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1033/ 1625], loss: 1.294, per_step_time: 1472ms, lr: 2.9645162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:29,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43224 samples/s/p 5:33:36 } +2024-07-25 19:34:31,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1035/ 1625], loss: 1.417, per_step_time: 1473ms, lr: 2.9643794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:31,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43037 samples/s/p 5:33:40 } +2024-07-25 19:34:34,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1037/ 1625], loss: 1.258, per_step_time: 1471ms, lr: 2.964242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:34,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43659 samples/s/p 5:33:14 } +2024-07-25 19:34:37,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1039/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 2.9641044e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:37,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43261 samples/s/p 5:33:26 } +2024-07-25 19:34:40,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1041/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.9639665e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:34:40,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43303 samples/s/p 5:33:22 } +2024-07-25 19:34:43,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1043/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 2.9638284e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:43,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43582 samples/s/p 5:33:08 } +2024-07-25 19:34:46,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1045/ 1625], loss: 1.303, per_step_time: 1473ms, lr: 2.96369e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:46,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.42948 samples/s/p 5:33:29 } +2024-07-25 19:34:49,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1047/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.9635514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:49,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43512 samples/s/p 5:33:05 } +2024-07-25 19:34:52,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1049/ 1625], loss: 0.921, per_step_time: 1471ms, lr: 2.9634124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:52,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43832 samples/s/p 5:32:50 } +2024-07-25 19:34:55,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1051/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 2.963273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:55,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43442 samples/s/p 5:33:02 } +2024-07-25 19:34:58,534 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1053/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 2.9631337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:58,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43713 samples/s/p 5:32:49 } +2024-07-25 19:35:01,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1055/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 2.962994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:01,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.44142 samples/s/p 5:32:30 } +2024-07-25 19:35:04,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1057/ 1625], loss: 1.247, per_step_time: 1470ms, lr: 2.962854e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:04,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.44025 samples/s/p 5:32:32 } +2024-07-25 19:35:07,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1059/ 1625], loss: 1.292, per_step_time: 1471ms, lr: 2.9627137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:07,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43522 samples/s/p 5:32:47 } +2024-07-25 19:35:10,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1061/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 2.9625733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:10,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43312 samples/s/p 5:32:52 } +2024-07-25 19:35:13,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1063/ 1625], loss: 1.144, per_step_time: 1470ms, lr: 2.9624325e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:35:13,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43983 samples/s/p 5:32:24 } +2024-07-25 19:35:16,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1065/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 2.9622914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:16,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43221 samples/s/p 5:32:49 } +2024-07-25 19:35:19,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1067/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 2.9621502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:19,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43487 samples/s/p 5:32:37 } +2024-07-25 19:35:22,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1069/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.9620089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:22,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43337 samples/s/p 5:32:39 } +2024-07-25 19:35:25,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1071/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.961867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:25,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43589 samples/s/p 5:32:27 } +2024-07-25 19:35:28,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1073/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.961725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:28,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43575 samples/s/p 5:32:25 } +2024-07-25 19:35:30,992 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1075/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.9615825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:30,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43266 samples/s/p 5:32:33 } +2024-07-25 19:35:33,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1077/ 1625], loss: 1.142, per_step_time: 1469ms, lr: 2.9614399e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:33,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.44391 samples/s/p 5:31:49 } +2024-07-25 19:35:36,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1079/ 1625], loss: 1.244, per_step_time: 1475ms, lr: 2.961297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:36,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.42036 samples/s/p 5:33:12 } +2024-07-25 19:35:39,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1081/ 1625], loss: 1.100, per_step_time: 1473ms, lr: 2.9611541e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:39,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43016 samples/s/p 5:32:33 } +2024-07-25 19:35:42,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1083/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.9610108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:42,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43654 samples/s/p 5:32:07 } +2024-07-25 19:35:45,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1085/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 2.960867e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:35:45,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43353 samples/s/p 5:32:15 } +2024-07-25 19:35:48,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1087/ 1625], loss: 1.018, per_step_time: 1471ms, lr: 2.9607232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:48,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43762 samples/s/p 5:31:57 } +2024-07-25 19:35:51,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1089/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 2.960579e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:51,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43818 samples/s/p 5:31:52 } +2024-07-25 19:35:54,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1091/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 2.9604347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:54,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43459 samples/s/p 5:32:02 } +2024-07-25 19:35:57,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1093/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 2.96029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:57,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.42906 samples/s/p 5:32:20 } +2024-07-25 19:36:00,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1095/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 2.9601451e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:00,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43261 samples/s/p 5:32:04 } +2024-07-25 19:36:03,462 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1097/ 1625], loss: 1.317, per_step_time: 1472ms, lr: 2.96e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:03,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43401 samples/s/p 5:31:56 } +2024-07-25 19:36:06,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1099/ 1625], loss: 1.249, per_step_time: 1474ms, lr: 2.9598543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:06,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.42634 samples/s/p 5:32:21 } +2024-07-25 19:36:09,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1101/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 2.9597088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:09,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43966 samples/s/p 5:31:29 } +2024-07-25 19:36:12,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1103/ 1625], loss: 1.110, per_step_time: 1473ms, lr: 2.9595627e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:12,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.42773 samples/s/p 5:32:10 } +2024-07-25 19:36:15,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1105/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 2.9594165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:15,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43511 samples/s/p 5:31:40 } +2024-07-25 19:36:18,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1107/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.9592702e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:36:18,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43156 samples/s/p 5:31:50 } +2024-07-25 19:36:21,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1109/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 2.9591232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:21,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.42920 samples/s/p 5:31:56 } +2024-07-25 19:36:24,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1111/ 1625], loss: 1.093, per_step_time: 1472ms, lr: 2.9589763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:24,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43115 samples/s/p 5:31:45 } +2024-07-25 19:36:27,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1113/ 1625], loss: 1.123, per_step_time: 1473ms, lr: 2.958829e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:27,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.42967 samples/s/p 5:31:48 } +2024-07-25 19:36:30,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1115/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 2.9586816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:30,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43903 samples/s/p 5:31:11 } +2024-07-25 19:36:32,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1117/ 1625], loss: 1.110, per_step_time: 1473ms, lr: 2.9585337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:32,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43104 samples/s/p 5:31:37 } +2024-07-25 19:36:35,940 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1119/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.9583858e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:35,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43543 samples/s/p 5:31:18 } +2024-07-25 19:36:38,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1121/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.9582376e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:38,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43390 samples/s/p 5:31:21 } +2024-07-25 19:36:41,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1123/ 1625], loss: 1.430, per_step_time: 1471ms, lr: 2.9580888e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:41,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43644 samples/s/p 5:31:08 } +2024-07-25 19:36:44,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1125/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 2.95794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:44,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43517 samples/s/p 5:31:10 } +2024-07-25 19:36:47,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1127/ 1625], loss: 1.177, per_step_time: 1469ms, lr: 2.9577908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:47,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.44557 samples/s/p 5:30:29 } +2024-07-25 19:36:50,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1129/ 1625], loss: 1.096, per_step_time: 1473ms, lr: 2.9576418e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:36:50,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.42946 samples/s/p 5:31:25 } +2024-07-25 19:36:53,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1131/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.9574921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:53,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43720 samples/s/p 5:30:54 } +2024-07-25 19:36:56,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1133/ 1625], loss: 1.323, per_step_time: 1473ms, lr: 2.957342e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:56,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43059 samples/s/p 5:31:15 } +2024-07-25 19:36:59,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1135/ 1625], loss: 1.307, per_step_time: 1471ms, lr: 2.957192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:59,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43688 samples/s/p 5:30:49 } +2024-07-25 19:37:02,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1137/ 1625], loss: 1.078, per_step_time: 1470ms, lr: 2.9570418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:02,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.44005 samples/s/p 5:30:35 } +2024-07-25 19:37:05,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1139/ 1625], loss: 1.414, per_step_time: 1472ms, lr: 2.9568911e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:05,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43447 samples/s/p 5:30:52 } +2024-07-25 19:37:08,397 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1141/ 1625], loss: 1.430, per_step_time: 1471ms, lr: 2.9567402e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:08,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43490 samples/s/p 5:30:48 } +2024-07-25 19:37:11,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1143/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 2.9565892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:11,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43517 samples/s/p 5:30:44 } +2024-07-25 19:37:14,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1145/ 1625], loss: 1.254, per_step_time: 1470ms, lr: 2.9564375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:14,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.44048 samples/s/p 5:30:21 } +2024-07-25 19:37:17,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1147/ 1625], loss: 1.299, per_step_time: 1471ms, lr: 2.956286e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:17,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43588 samples/s/p 5:30:35 } +2024-07-25 19:37:20,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1149/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 2.9561339e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:20,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.42883 samples/s/p 5:30:58 } +2024-07-25 19:37:23,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1151/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 2.9559818e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:37:23,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43447 samples/s/p 5:30:34 } +2024-07-25 19:37:26,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1153/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 2.9558292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:26,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.42985 samples/s/p 5:30:48 } +2024-07-25 19:37:29,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1155/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 2.9556764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:29,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43546 samples/s/p 5:30:25 } +2024-07-25 19:37:32,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1157/ 1625], loss: 1.392, per_step_time: 1473ms, lr: 2.9555236e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:32,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43022 samples/s/p 5:30:41 } +2024-07-25 19:37:34,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1159/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 2.9553703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:34,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43670 samples/s/p 5:30:14 } +2024-07-25 19:37:37,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1161/ 1625], loss: 1.114, per_step_time: 1473ms, lr: 2.955217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:37,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.42903 samples/s/p 5:30:40 } +2024-07-25 19:37:40,862 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1163/ 1625], loss: 1.184, per_step_time: 1469ms, lr: 2.9550632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:40,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.44321 samples/s/p 5:29:45 } +2024-07-25 19:37:43,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1165/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 2.954909e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:43,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.42953 samples/s/p 5:30:32 } +2024-07-25 19:37:46,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1167/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 2.954755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:46,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43496 samples/s/p 5:30:09 } +2024-07-25 19:37:49,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1169/ 1625], loss: 1.284, per_step_time: 1471ms, lr: 2.9546003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:49,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43575 samples/s/p 5:30:03 } +2024-07-25 19:37:52,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1171/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 2.9544455e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:52,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43470 samples/s/p 5:30:04 } +2024-07-25 19:37:55,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1173/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 2.9542905e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:37:55,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43289 samples/s/p 5:30:08 } +2024-07-25 19:37:58,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1175/ 1625], loss: 1.109, per_step_time: 1471ms, lr: 2.954135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:58,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43484 samples/s/p 5:29:58 } +2024-07-25 19:37:58,574 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-25 19:38:34,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1177/ 1625], loss: 1.273, per_step_time: 1575ms, lr: 2.9539795e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:34,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.07887 samples/s/p 5:53:02 } +2024-07-25 19:38:37,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1179/ 1625], loss: 1.146, per_step_time: 1477ms, lr: 2.9538238e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:37,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.41502 samples/s/p 5:31:04 } +2024-07-25 19:38:40,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1181/ 1625], loss: 1.283, per_step_time: 1472ms, lr: 2.9536677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:40,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43115 samples/s/p 5:30:02 } +2024-07-25 19:38:43,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1183/ 1625], loss: 1.303, per_step_time: 1474ms, lr: 2.9535113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:43,064 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.42482 samples/s/p 5:30:22 } +2024-07-25 19:38:46,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1185/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 2.9533547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:46,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43267 samples/s/p 5:29:51 } +2024-07-25 19:38:48,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1187/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 2.9531979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:48,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43334 samples/s/p 5:29:45 } +2024-07-25 19:38:51,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1189/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.9530409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:51,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43792 samples/s/p 5:29:26 } +2024-07-25 19:38:54,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1191/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 2.9528832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:54,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43729 samples/s/p 5:29:25 } +2024-07-25 19:38:57,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1193/ 1625], loss: 1.278, per_step_time: 1474ms, lr: 2.9527255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:57,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.42714 samples/s/p 5:29:59 } +2024-07-25 19:39:00,776 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 2/ 10], step:[ 1195/ 1625], loss: 1.164, per_step_time: 1472ms, lr: 2.952568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:00,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.43263 samples/s/p 5:29:36 } +2024-07-25 19:39:03,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1197/ 1625], loss: 1.303, per_step_time: 1472ms, lr: 2.9524095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:03,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.43150 samples/s/p 5:29:37 } +2024-07-25 19:39:06,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1199/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 2.9522513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:06,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.43244 samples/s/p 5:29:31 } +2024-07-25 19:39:09,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1201/ 1625], loss: 1.146, per_step_time: 1475ms, lr: 2.9520925e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:09,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.42316 samples/s/p 5:30:02 } +2024-07-25 19:39:12,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1203/ 1625], loss: 1.131, per_step_time: 1469ms, lr: 2.9519335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:12,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.44224 samples/s/p 5:28:50 } +2024-07-25 19:39:15,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1205/ 1625], loss: 1.057, per_step_time: 1473ms, lr: 2.9517743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:15,542 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.42901 samples/s/p 5:29:35 } +2024-07-25 19:39:18,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1207/ 1625], loss: 1.056, per_step_time: 1474ms, lr: 2.951615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:18,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.42665 samples/s/p 5:29:40 } +2024-07-25 19:39:21,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1209/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 2.9514551e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:21,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.43086 samples/s/p 5:29:22 } +2024-07-25 19:39:24,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1211/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.9512954e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:24,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43787 samples/s/p 5:28:54 } +2024-07-25 19:39:27,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1213/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 2.951135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:27,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43503 samples/s/p 5:29:01 } +2024-07-25 19:39:30,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1215/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 2.9509745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:30,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43679 samples/s/p 5:28:52 } +2024-07-25 19:39:33,254 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 1217/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 2.9508139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:33,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43810 samples/s/p 5:28:44 } +2024-07-25 19:39:36,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1219/ 1625], loss: 1.112, per_step_time: 1474ms, lr: 2.950653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:36,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.42644 samples/s/p 5:29:23 } +2024-07-25 19:39:39,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1221/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 2.9504916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:39,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.42829 samples/s/p 5:29:14 } +2024-07-25 19:39:42,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1223/ 1625], loss: 1.106, per_step_time: 1473ms, lr: 2.95033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:42,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43098 samples/s/p 5:29:01 } +2024-07-25 19:39:45,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1225/ 1625], loss: 1.107, per_step_time: 1473ms, lr: 2.9501683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:45,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.42847 samples/s/p 5:29:07 } +2024-07-25 19:39:48,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1227/ 1625], loss: 1.176, per_step_time: 1475ms, lr: 2.9500063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:48,033 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.42119 samples/s/p 5:29:31 } +2024-07-25 19:39:50,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1229/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.9498437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:50,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.43175 samples/s/p 5:28:49 } +2024-07-25 19:39:53,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1231/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.9496812e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:53,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.43272 samples/s/p 5:28:43 } +2024-07-25 19:39:56,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1233/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.9495186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:56,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.43383 samples/s/p 5:28:36 } +2024-07-25 19:39:59,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1235/ 1625], loss: 1.037, per_step_time: 1473ms, lr: 2.9493556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:59,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.42794 samples/s/p 5:28:54 } +2024-07-25 19:40:02,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1237/ 1625], loss: 1.073, per_step_time: 1474ms, lr: 2.9491921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:02,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.42664 samples/s/p 5:28:56 } +2024-07-25 19:40:05,784 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 2/ 10], step:[ 1239/ 1625], loss: 1.031, per_step_time: 1487ms, lr: 2.9490286e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:05,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.37867 samples/s/p 5:31:49 } +2024-07-25 19:40:08,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1241/ 1625], loss: 1.136, per_step_time: 1474ms, lr: 2.9488647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:08,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.42688 samples/s/p 5:28:49 } +2024-07-25 19:40:11,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1243/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 2.9487004e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:11,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.43726 samples/s/p 5:28:09 } +2024-07-25 19:40:14,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1245/ 1625], loss: 1.206, per_step_time: 1474ms, lr: 2.9485363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:14,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42539 samples/s/p 5:28:49 } +2024-07-25 19:40:17,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1247/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 2.9483715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:17,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42853 samples/s/p 5:28:35 } +2024-07-25 19:40:20,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1249/ 1625], loss: 1.202, per_step_time: 1474ms, lr: 2.9482066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:20,559 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42473 samples/s/p 5:28:45 } +2024-07-25 19:40:23,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1251/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 2.9480416e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:23,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.43448 samples/s/p 5:28:07 } +2024-07-25 19:40:26,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1253/ 1625], loss: 1.152, per_step_time: 1474ms, lr: 2.9478762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:26,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42630 samples/s/p 5:28:34 } +2024-07-25 19:40:29,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1255/ 1625], loss: 1.260, per_step_time: 1474ms, lr: 2.9477103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:29,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42564 samples/s/p 5:28:33 } +2024-07-25 19:40:32,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1257/ 1625], loss: 1.254, per_step_time: 1473ms, lr: 2.9475446e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:32,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42800 samples/s/p 5:28:22 } +2024-07-25 19:40:35,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1259/ 1625], loss: 1.303, per_step_time: 1472ms, lr: 2.9473786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:35,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.43337 samples/s/p 5:27:59 } +2024-07-25 19:40:38,283 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 2/ 10], step:[ 1261/ 1625], loss: 1.050, per_step_time: 1473ms, lr: 2.947212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:38,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43039 samples/s/p 5:28:07 } +2024-07-25 19:40:41,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1263/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 2.9470451e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:41,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43728 samples/s/p 5:27:39 } +2024-07-25 19:40:44,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1265/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 2.9468785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:44,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43762 samples/s/p 5:27:35 } +2024-07-25 19:40:47,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1267/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.9467114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:47,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43342 samples/s/p 5:27:47 } +2024-07-25 19:40:50,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1269/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.9465436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:50,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43131 samples/s/p 5:27:52 } +2024-07-25 19:40:53,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1271/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.9463761e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:53,041 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43204 samples/s/p 5:27:47 } +2024-07-25 19:40:55,991 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1273/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.9462082e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:55,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43743 samples/s/p 5:27:24 } +2024-07-25 19:40:58,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1275/ 1625], loss: 1.209, per_step_time: 1475ms, lr: 2.94604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:58,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.42361 samples/s/p 5:28:11 } +2024-07-25 19:41:01,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1277/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 2.9458712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:01,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43991 samples/s/p 5:27:09 } +2024-07-25 19:41:04,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1279/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.9457025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:04,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43177 samples/s/p 5:27:36 } +2024-07-25 19:41:07,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1281/ 1625], loss: 1.315, per_step_time: 1474ms, lr: 2.9455336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:07,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.42587 samples/s/p 5:27:54 } +2024-07-25 19:41:10,760 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 1283/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 2.9453642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:10,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43181 samples/s/p 5:27:30 } +2024-07-25 19:41:13,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1285/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 2.9451949e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:13,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.44110 samples/s/p 5:26:53 } +2024-07-25 19:41:16,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1287/ 1625], loss: 1.305, per_step_time: 1470ms, lr: 2.945025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:16,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43989 samples/s/p 5:26:55 } +2024-07-25 19:41:19,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1289/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 2.944855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:19,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43081 samples/s/p 5:27:24 } +2024-07-25 19:41:22,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1291/ 1625], loss: 1.329, per_step_time: 1469ms, lr: 2.9446848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:22,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.44324 samples/s/p 5:26:37 } +2024-07-25 19:41:25,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1293/ 1625], loss: 1.257, per_step_time: 1473ms, lr: 2.9445142e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:25,512 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.43091 samples/s/p 5:27:18 } +2024-07-25 19:41:28,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1295/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 2.9443434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:28,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.43470 samples/s/p 5:27:02 } +2024-07-25 19:41:31,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1297/ 1625], loss: 1.246, per_step_time: 1473ms, lr: 2.9441722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:31,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.43008 samples/s/p 5:27:15 } +2024-07-25 19:41:34,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1299/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 2.9440009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:34,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.43419 samples/s/p 5:26:58 } +2024-07-25 19:41:37,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1301/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 2.9438293e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:37,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.43764 samples/s/p 5:26:42 } +2024-07-25 19:41:40,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1303/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.9436576e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:40,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.42818 samples/s/p 5:27:13 } +2024-07-25 19:41:43,223 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1305/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.9434856e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:43,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.43754 samples/s/p 5:26:37 } +2024-07-25 19:41:46,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1307/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 2.943313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:46,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.43668 samples/s/p 5:26:37 } +2024-07-25 19:41:49,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1309/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 2.9431405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:49,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.44089 samples/s/p 5:26:19 } +2024-07-25 19:41:52,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1311/ 1625], loss: 1.217, per_step_time: 1469ms, lr: 2.9429677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:52,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.44430 samples/s/p 5:26:03 } +2024-07-25 19:41:55,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1313/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 2.9427943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:55,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43328 samples/s/p 5:26:40 } +2024-07-25 19:41:57,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1315/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.9426212e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:41:57,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43617 samples/s/p 5:26:27 } +2024-07-25 19:42:00,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1317/ 1625], loss: 1.212, per_step_time: 1473ms, lr: 2.9424475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:00,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.42960 samples/s/p 5:26:48 } +2024-07-25 19:42:03,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1319/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 2.9422736e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:03,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43889 samples/s/p 5:26:11 } +2024-07-25 19:42:06,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1321/ 1625], loss: 1.306, per_step_time: 1472ms, lr: 2.9420993e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:06,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43247 samples/s/p 5:26:31 } +2024-07-25 19:42:09,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1323/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 2.941925e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:09,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43045 samples/s/p 5:26:36 } +2024-07-25 19:42:12,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1325/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.9417504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:12,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43463 samples/s/p 5:26:18 } +2024-07-25 19:42:15,682 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1327/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 2.9415754e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:15,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43346 samples/s/p 5:26:19 } +2024-07-25 19:42:18,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1329/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 2.9414003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:18,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43648 samples/s/p 5:26:05 } +2024-07-25 19:42:21,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1331/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 2.941225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:21,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43715 samples/s/p 5:26:00 } +2024-07-25 19:42:24,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1333/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.941049e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:24,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43150 samples/s/p 5:26:17 } +2024-07-25 19:42:27,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1335/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.9408731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:27,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43219 samples/s/p 5:26:12 } +2024-07-25 19:42:30,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1337/ 1625], loss: 1.186, per_step_time: 1480ms, lr: 2.940697e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:42:30,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.40270 samples/s/p 5:27:56 } +2024-07-25 19:42:33,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1339/ 1625], loss: 1.294, per_step_time: 1472ms, lr: 2.9405206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:33,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43353 samples/s/p 5:26:01 } +2024-07-25 19:42:36,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1341/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 2.9403436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:36,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.43567 samples/s/p 5:25:50 } +2024-07-25 19:42:39,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1343/ 1625], loss: 1.110, per_step_time: 1474ms, lr: 2.9401668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:39,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.42620 samples/s/p 5:26:22 } +2024-07-25 19:42:42,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1345/ 1625], loss: 1.262, per_step_time: 1472ms, lr: 2.9399896e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:42,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.43169 samples/s/p 5:25:59 } +2024-07-25 19:42:45,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1347/ 1625], loss: 1.154, per_step_time: 1477ms, lr: 2.939812e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:45,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.41518 samples/s/p 5:26:55 } +2024-07-25 19:42:48,182 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1349/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 2.9396344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:48,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.43288 samples/s/p 5:25:49 } +2024-07-25 19:42:51,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1351/ 1625], loss: 1.387, per_step_time: 1474ms, lr: 2.9394563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:51,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.42625 samples/s/p 5:26:10 } +2024-07-25 19:42:54,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1353/ 1625], loss: 1.204, per_step_time: 1474ms, lr: 2.939278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:54,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.42657 samples/s/p 5:26:05 } +2024-07-25 19:42:57,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1355/ 1625], loss: 1.093, per_step_time: 1472ms, lr: 2.9390996e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:57,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.43157 samples/s/p 5:25:44 } +2024-07-25 19:42:59,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1357/ 1625], loss: 1.159, per_step_time: 1469ms, lr: 2.9389208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:59,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.44222 samples/s/p 5:25:03 } +2024-07-25 19:43:02,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1359/ 1625], loss: 1.142, per_step_time: 1473ms, lr: 2.9387418e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:43:02,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.42913 samples/s/p 5:25:47 } +2024-07-25 19:43:05,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1361/ 1625], loss: 1.349, per_step_time: 1472ms, lr: 2.9385625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:05,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43263 samples/s/p 5:25:32 } +2024-07-25 19:43:08,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1363/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.938383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:08,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43539 samples/s/p 5:25:19 } +2024-07-25 19:43:11,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1365/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 2.938203e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:11,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43617 samples/s/p 5:25:13 } +2024-07-25 19:43:14,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1367/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 2.9380231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:14,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43203 samples/s/p 5:25:25 } +2024-07-25 19:43:17,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1369/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 2.9378429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:17,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43358 samples/s/p 5:25:17 } +2024-07-25 19:43:20,663 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1371/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.9376622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:20,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43216 samples/s/p 5:25:19 } +2024-07-25 19:43:23,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1373/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 2.9374814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:23,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43296 samples/s/p 5:25:13 } +2024-07-25 19:43:26,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1375/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 2.9373005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:26,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43564 samples/s/p 5:25:00 } +2024-07-25 19:43:29,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1377/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.937119e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:29,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43229 samples/s/p 5:25:10 } +2024-07-25 19:43:32,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1379/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 2.9369374e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:32,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43346 samples/s/p 5:25:02 } +2024-07-25 19:43:35,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1381/ 1625], loss: 1.282, per_step_time: 1474ms, lr: 2.9367557e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:43:35,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.42615 samples/s/p 5:25:26 } +2024-07-25 19:43:38,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1383/ 1625], loss: 1.317, per_step_time: 1473ms, lr: 2.9365734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:38,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43078 samples/s/p 5:25:06 } +2024-07-25 19:43:41,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1385/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 2.9363911e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:41,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43682 samples/s/p 5:24:41 } +2024-07-25 19:43:44,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1387/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.9362083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:44,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43239 samples/s/p 5:24:54 } +2024-07-25 19:43:47,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1389/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 2.9360255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:47,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43473 samples/s/p 5:24:43 } +2024-07-25 19:43:50,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1391/ 1625], loss: 1.398, per_step_time: 1472ms, lr: 2.9358425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:50,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.43129 samples/s/p 5:24:52 } +2024-07-25 19:43:53,150 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1393/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 2.9356592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:53,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.43719 samples/s/p 5:24:28 } +2024-07-25 19:43:56,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1395/ 1625], loss: 1.090, per_step_time: 1473ms, lr: 2.9354755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:56,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.43068 samples/s/p 5:24:49 } +2024-07-25 19:43:59,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1397/ 1625], loss: 1.022, per_step_time: 1473ms, lr: 2.9352916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:59,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.43105 samples/s/p 5:24:44 } +2024-07-25 19:44:02,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1399/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 2.9351077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:02,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.43134 samples/s/p 5:24:41 } +2024-07-25 19:44:04,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1401/ 1625], loss: 1.078, per_step_time: 1476ms, lr: 2.934923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:04,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.42000 samples/s/p 5:25:18 } +2024-07-25 19:44:07,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1403/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.9347384e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:44:07,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.43670 samples/s/p 5:24:15 } +2024-07-25 19:44:10,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1405/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 2.9345534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:10,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.42955 samples/s/p 5:24:38 } +2024-07-25 19:44:13,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1407/ 1625], loss: 1.194, per_step_time: 1474ms, lr: 2.9343682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:13,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.42712 samples/s/p 5:24:44 } +2024-07-25 19:44:16,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1409/ 1625], loss: 1.185, per_step_time: 1469ms, lr: 2.9341829e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:16,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.44420 samples/s/p 5:23:40 } +2024-07-25 19:44:19,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1411/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.9339972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:19,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.43306 samples/s/p 5:24:17 } +2024-07-25 19:44:22,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1413/ 1625], loss: 1.118, per_step_time: 1474ms, lr: 2.9338113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:22,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.42414 samples/s/p 5:24:46 } +2024-07-25 19:44:25,642 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1415/ 1625], loss: 1.077, per_step_time: 1474ms, lr: 2.9336252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:25,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.42620 samples/s/p 5:24:35 } +2024-07-25 19:44:28,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1417/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 2.9334386e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:28,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.43320 samples/s/p 5:24:07 } +2024-07-25 19:44:31,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1419/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.933252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:31,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.43017 samples/s/p 5:24:15 } +2024-07-25 19:44:34,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1421/ 1625], loss: 1.141, per_step_time: 1474ms, lr: 2.9330648e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:34,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.42656 samples/s/p 5:24:25 } +2024-07-25 19:44:37,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1423/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.9328778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:37,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43372 samples/s/p 5:23:57 } +2024-07-25 19:44:40,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1425/ 1625], loss: 1.198, per_step_time: 1473ms, lr: 2.9326904e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:44:40,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43098 samples/s/p 5:24:04 } +2024-07-25 19:44:43,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1427/ 1625], loss: 0.987, per_step_time: 1471ms, lr: 2.9325025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:43,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43587 samples/s/p 5:23:43 } +2024-07-25 19:44:46,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1429/ 1625], loss: 1.048, per_step_time: 1474ms, lr: 2.9323146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:46,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.42435 samples/s/p 5:24:21 } +2024-07-25 19:44:49,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1431/ 1625], loss: 1.013, per_step_time: 1471ms, lr: 2.9321263e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:49,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43746 samples/s/p 5:23:32 } +2024-07-25 19:44:52,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1433/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 2.9319379e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:52,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43607 samples/s/p 5:23:34 } +2024-07-25 19:44:55,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1435/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.931749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:55,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43776 samples/s/p 5:23:25 } +2024-07-25 19:44:58,118 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1437/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 2.9315599e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:58,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43582 samples/s/p 5:23:29 } +2024-07-25 19:45:01,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1439/ 1625], loss: 1.252, per_step_time: 1470ms, lr: 2.931371e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:01,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43907 samples/s/p 5:23:14 } +2024-07-25 19:45:04,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1441/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 2.9311814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:04,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.42996 samples/s/p 5:23:44 } +2024-07-25 19:45:06,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1443/ 1625], loss: 1.247, per_step_time: 1475ms, lr: 2.9309916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:06,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.42033 samples/s/p 5:24:15 } +2024-07-25 19:45:09,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1445/ 1625], loss: 1.239, per_step_time: 1472ms, lr: 2.9308016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:09,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43357 samples/s/p 5:23:25 } +2024-07-25 19:45:12,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1447/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 2.9306113e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:45:12,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43509 samples/s/p 5:23:16 } +2024-07-25 19:45:15,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1449/ 1625], loss: 1.284, per_step_time: 1471ms, lr: 2.9304209e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:15,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43525 samples/s/p 5:23:13 } +2024-07-25 19:45:18,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1451/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.93023e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:18,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43741 samples/s/p 5:23:02 } +2024-07-25 19:45:21,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1453/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 2.930039e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:21,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43078 samples/s/p 5:23:23 } +2024-07-25 19:45:24,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1455/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.9298477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:24,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.43499 samples/s/p 5:23:05 } +2024-07-25 19:45:27,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1457/ 1625], loss: 1.217, per_step_time: 1475ms, lr: 2.9296561e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:27,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.42352 samples/s/p 5:23:43 } +2024-07-25 19:45:30,595 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1459/ 1625], loss: 1.265, per_step_time: 1470ms, lr: 2.9294642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:30,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.43968 samples/s/p 5:22:42 } +2024-07-25 19:45:33,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1461/ 1625], loss: 1.182, per_step_time: 1473ms, lr: 2.9292723e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:33,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.42792 samples/s/p 5:23:21 } +2024-07-25 19:45:36,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1463/ 1625], loss: 1.388, per_step_time: 1475ms, lr: 2.9290799e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:36,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.42292 samples/s/p 5:23:36 } +2024-07-25 19:45:39,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1465/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 2.9288873e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:39,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.42967 samples/s/p 5:23:09 } +2024-07-25 19:45:42,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1467/ 1625], loss: 1.293, per_step_time: 1471ms, lr: 2.9286944e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:42,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.43775 samples/s/p 5:22:38 } +2024-07-25 19:45:45,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1469/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.9285015e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:45:45,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.43348 samples/s/p 5:22:50 } +2024-07-25 19:45:48,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1471/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 2.9283083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:48,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43486 samples/s/p 5:22:42 } +2024-07-25 19:45:51,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1473/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 2.9281146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:51,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43906 samples/s/p 5:22:24 } +2024-07-25 19:45:54,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1475/ 1625], loss: 1.410, per_step_time: 1472ms, lr: 2.9279207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:54,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43380 samples/s/p 5:22:40 } +2024-07-25 19:45:57,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1477/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 2.9277267e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:57,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43241 samples/s/p 5:22:42 } +2024-07-25 19:46:00,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1479/ 1625], loss: 1.365, per_step_time: 1473ms, lr: 2.9275321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:00,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43022 samples/s/p 5:22:47 } +2024-07-25 19:46:03,075 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1481/ 1625], loss: 1.300, per_step_time: 1472ms, lr: 2.9273377e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:03,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43359 samples/s/p 5:22:32 } +2024-07-25 19:46:06,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1483/ 1625], loss: 1.081, per_step_time: 1470ms, lr: 2.9271429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:06,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.44002 samples/s/p 5:22:06 } +2024-07-25 19:46:08,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1485/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.9269479e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:08,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43211 samples/s/p 5:22:31 } +2024-07-25 19:46:11,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1487/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 2.9267525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:11,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43804 samples/s/p 5:22:07 } +2024-07-25 19:46:14,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1489/ 1625], loss: 1.286, per_step_time: 1473ms, lr: 2.9265568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:14,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.42831 samples/s/p 5:22:39 } +2024-07-25 19:46:17,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1491/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 2.9263609e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:46:17,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43422 samples/s/p 5:22:15 } +2024-07-25 19:46:20,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1493/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 2.926165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:20,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43328 samples/s/p 5:22:15 } +2024-07-25 19:46:23,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1495/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 2.9259685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:23,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.42793 samples/s/p 5:22:31 } +2024-07-25 19:46:26,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1497/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.9257719e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:26,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.42952 samples/s/p 5:22:23 } +2024-07-25 19:46:29,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1499/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 2.9255749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:29,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43395 samples/s/p 5:22:04 } +2024-07-25 19:46:32,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1501/ 1625], loss: 1.293, per_step_time: 1472ms, lr: 2.9253777e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:32,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43170 samples/s/p 5:22:09 } +2024-07-25 19:46:35,548 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1503/ 1625], loss: 1.238, per_step_time: 1470ms, lr: 2.9251803e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:35,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.44027 samples/s/p 5:21:36 } +2024-07-25 19:46:38,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1505/ 1625], loss: 1.197, per_step_time: 1475ms, lr: 2.9249826e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:38,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.42367 samples/s/p 5:22:32 } +2024-07-25 19:46:41,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1507/ 1625], loss: 0.925, per_step_time: 1474ms, lr: 2.9247849e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:41,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.42631 samples/s/p 5:22:19 } +2024-07-25 19:46:44,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1509/ 1625], loss: 1.270, per_step_time: 1470ms, lr: 2.9245868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:44,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.43859 samples/s/p 5:21:33 } +2024-07-25 19:46:47,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1511/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 2.9243884e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:47,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.42940 samples/s/p 5:22:02 } +2024-07-25 19:46:50,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1513/ 1625], loss: 1.069, per_step_time: 1473ms, lr: 2.9241895e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:46:50,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.42848 samples/s/p 5:22:03 } +2024-07-25 19:46:53,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1515/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 2.9239907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:53,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.43274 samples/s/p 5:21:45 } +2024-07-25 19:46:56,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1517/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 2.9237914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:56,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.43652 samples/s/p 5:21:28 } +2024-07-25 19:46:59,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1519/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 2.923592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:59,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.43230 samples/s/p 5:21:40 } +2024-07-25 19:47:02,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1521/ 1625], loss: 1.269, per_step_time: 1471ms, lr: 2.9233923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:02,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43531 samples/s/p 5:21:27 } +2024-07-25 19:47:05,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1523/ 1625], loss: 1.392, per_step_time: 1471ms, lr: 2.9231926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:05,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43626 samples/s/p 5:21:20 } +2024-07-25 19:47:08,027 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1525/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.9229921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:08,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43445 samples/s/p 5:21:24 } +2024-07-25 19:47:10,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1527/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.9227918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:10,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43757 samples/s/p 5:21:10 } +2024-07-25 19:47:13,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1529/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 2.922591e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:13,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43578 samples/s/p 5:21:13 } +2024-07-25 19:47:16,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1531/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 2.92239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:16,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43718 samples/s/p 5:21:05 } +2024-07-25 19:47:19,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1533/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 2.922189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:19,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43086 samples/s/p 5:21:25 } +2024-07-25 19:47:22,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1535/ 1625], loss: 1.117, per_step_time: 1473ms, lr: 2.9219877e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:47:22,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.42870 samples/s/p 5:21:30 } +2024-07-25 19:47:25,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1537/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 2.9217857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:25,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.43060 samples/s/p 5:21:20 } +2024-07-25 19:47:28,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1539/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 2.9215838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:28,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.43614 samples/s/p 5:20:57 } +2024-07-25 19:47:31,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1541/ 1625], loss: 1.073, per_step_time: 1473ms, lr: 2.9213817e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:31,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.42987 samples/s/p 5:21:17 } +2024-07-25 19:47:34,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1543/ 1625], loss: 1.185, per_step_time: 1473ms, lr: 2.9211793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:34,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.42986 samples/s/p 5:21:14 } +2024-07-25 19:47:37,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1545/ 1625], loss: 1.310, per_step_time: 1471ms, lr: 2.9209765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:37,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.43676 samples/s/p 5:20:46 } +2024-07-25 19:47:40,505 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1547/ 1625], loss: 1.248, per_step_time: 1474ms, lr: 2.9207737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:40,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.42686 samples/s/p 5:21:18 } +2024-07-25 19:47:43,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1549/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 2.9205703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:43,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.43324 samples/s/p 5:20:53 } +2024-07-25 19:47:46,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1551/ 1625], loss: 1.156, per_step_time: 1474ms, lr: 2.9203668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:46,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.42665 samples/s/p 5:21:13 } +2024-07-25 19:47:49,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1553/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 2.920163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:49,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.42902 samples/s/p 5:21:02 } +2024-07-25 19:47:52,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1555/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 2.9199591e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:52,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43181 samples/s/p 5:20:49 } +2024-07-25 19:47:55,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1557/ 1625], loss: 1.030, per_step_time: 1473ms, lr: 2.9197548e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:47:55,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43089 samples/s/p 5:20:49 } +2024-07-25 19:47:58,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1559/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 2.9195504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:58,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43226 samples/s/p 5:20:42 } +2024-07-25 19:48:01,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1561/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 2.9193456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:01,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43394 samples/s/p 5:20:33 } +2024-07-25 19:48:04,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1563/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 2.9191406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:04,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43959 samples/s/p 5:20:10 } +2024-07-25 19:48:07,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1565/ 1625], loss: 1.333, per_step_time: 1486ms, lr: 2.9189354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:07,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.38235 samples/s/p 5:23:31 } +2024-07-25 19:48:10,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1567/ 1625], loss: 1.139, per_step_time: 1470ms, lr: 2.9187298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:10,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.44035 samples/s/p 5:20:01 } +2024-07-25 19:48:13,005 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1569/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 2.9185241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:13,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43998 samples/s/p 5:20:00 } +2024-07-25 19:48:15,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1571/ 1625], loss: 1.175, per_step_time: 1473ms, lr: 2.9183184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:15,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.42955 samples/s/p 5:20:34 } +2024-07-25 19:48:18,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1573/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 2.918112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:18,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43978 samples/s/p 5:19:54 } +2024-07-25 19:48:21,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1575/ 1625], loss: 1.258, per_step_time: 1471ms, lr: 2.9179055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:21,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43484 samples/s/p 5:20:09 } +2024-07-25 19:48:24,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1577/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.9176985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:24,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43152 samples/s/p 5:20:18 } +2024-07-25 19:48:27,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1579/ 1625], loss: 1.100, per_step_time: 1478ms, lr: 2.9174918e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:48:27,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.41081 samples/s/p 5:21:28 } +2024-07-25 19:48:30,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1581/ 1625], loss: 1.237, per_step_time: 1474ms, lr: 2.9172843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:30,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.42441 samples/s/p 5:20:37 } +2024-07-25 19:48:33,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1583/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 2.917077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:33,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43369 samples/s/p 5:20:01 } +2024-07-25 19:48:36,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1585/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 2.9168692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:36,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.42855 samples/s/p 5:20:16 } +2024-07-25 19:48:39,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1587/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 2.9166611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:39,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43948 samples/s/p 5:19:35 } +2024-07-25 19:48:42,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1589/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 2.916453e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:42,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43212 samples/s/p 5:19:58 } +2024-07-25 19:48:45,492 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1591/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 2.9162444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:45,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43574 samples/s/p 5:19:42 } +2024-07-25 19:48:48,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1593/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 2.9160356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:48,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43335 samples/s/p 5:19:48 } +2024-07-25 19:48:51,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1595/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 2.9158266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:51,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.44124 samples/s/p 5:19:17 } +2024-07-25 19:48:54,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1597/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 2.915617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:54,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43362 samples/s/p 5:19:41 } +2024-07-25 19:48:57,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1599/ 1625], loss: 1.062, per_step_time: 1470ms, lr: 2.9154075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:57,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43997 samples/s/p 5:19:15 } +2024-07-25 19:49:00,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1601/ 1625], loss: 1.158, per_step_time: 1474ms, lr: 2.9151977e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:49:00,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.42462 samples/s/p 5:20:07 } +2024-07-25 19:49:03,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1603/ 1625], loss: 1.130, per_step_time: 1473ms, lr: 2.9149878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:03,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43096 samples/s/p 5:19:41 } +2024-07-25 19:49:06,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1605/ 1625], loss: 1.285, per_step_time: 1472ms, lr: 2.9147775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:06,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43347 samples/s/p 5:19:30 } +2024-07-25 19:49:09,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1607/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.9145669e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:09,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43291 samples/s/p 5:19:29 } +2024-07-25 19:49:12,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1609/ 1625], loss: 1.233, per_step_time: 1474ms, lr: 2.914356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:12,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.42624 samples/s/p 5:19:49 } +2024-07-25 19:49:15,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1611/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.914145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:15,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43468 samples/s/p 5:19:16 } +2024-07-25 19:49:17,971 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1613/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 2.9139337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:17,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43242 samples/s/p 5:19:21 } +2024-07-25 19:49:20,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1615/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 2.9137222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:20,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43693 samples/s/p 5:19:03 } +2024-07-25 19:49:23,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1617/ 1625], loss: 1.109, per_step_time: 1470ms, lr: 2.9135103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:23,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.44204 samples/s/p 5:18:42 } +2024-07-25 19:49:26,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1619/ 1625], loss: 1.271, per_step_time: 1473ms, lr: 2.9132983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:26,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.42869 samples/s/p 5:19:26 } +2024-07-25 19:49:29,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1621/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 2.913086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:29,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.43926 samples/s/p 5:18:46 } +2024-07-25 19:49:32,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1623/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 2.9128734e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:49:32,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.43485 samples/s/p 5:18:58 } +2024-07-25 19:49:35,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1625/ 1625], loss: 1.216, per_step_time: 1474ms, lr: 2.9126608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:35,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.42632 samples/s/p 5:19:25 } +2024-07-25 19:49:38,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 2/ 1625], loss: 1.136, per_step_time: 1475ms, lr: 2.9124476e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:38,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.42180 samples/s/p 5:19:38 } +2024-07-25 19:49:41,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 4/ 1625], loss: 1.202, per_step_time: 1472ms, lr: 2.9122342e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:41,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.43115 samples/s/p 5:19:02 } +2024-07-25 19:49:44,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 6/ 1625], loss: 1.088, per_step_time: 1473ms, lr: 2.9120209e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:44,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.42967 samples/s/p 5:19:05 } +2024-07-25 19:49:47,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 8/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 2.911807e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:47,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.43186 samples/s/p 5:18:54 } +2024-07-25 19:49:50,451 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 10/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 2.911593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:50,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43074 samples/s/p 5:18:55 } +2024-07-25 19:49:53,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 12/ 1625], loss: 1.249, per_step_time: 1471ms, lr: 2.9113786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:53,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43556 samples/s/p 5:18:35 } +2024-07-25 19:49:56,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 14/ 1625], loss: 1.333, per_step_time: 1470ms, lr: 2.911164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:56,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43866 samples/s/p 5:18:21 } +2024-07-25 19:49:59,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 16/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 2.9109493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:59,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.42912 samples/s/p 5:18:52 } +2024-07-25 19:50:02,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 18/ 1625], loss: 1.293, per_step_time: 1470ms, lr: 2.9107341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:02,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.44025 samples/s/p 5:18:10 } +2024-07-25 19:50:05,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 20/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 2.910519e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:50:05,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43348 samples/s/p 5:18:31 } +2024-07-25 19:50:08,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 22/ 1625], loss: 1.121, per_step_time: 1474ms, lr: 2.9103032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:08,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.42738 samples/s/p 5:18:49 } +2024-07-25 19:50:11,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 24/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 2.9100875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:11,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43611 samples/s/p 5:18:16 } +2024-07-25 19:50:14,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 26/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 2.9098714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:14,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43360 samples/s/p 5:18:21 } +2024-07-25 19:50:17,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 28/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.9096549e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:17,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43823 samples/s/p 5:18:02 } +2024-07-25 19:50:19,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 30/ 1625], loss: 1.035, per_step_time: 1472ms, lr: 2.9094384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:19,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43264 samples/s/p 5:18:19 } +2024-07-25 19:50:22,925 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 32/ 1625], loss: 1.245, per_step_time: 1474ms, lr: 2.9092214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:22,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.42443 samples/s/p 5:18:45 } +2024-07-25 19:50:25,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 34/ 1625], loss: 1.247, per_step_time: 1474ms, lr: 2.9090043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:25,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.42533 samples/s/p 5:18:39 } +2024-07-25 19:50:28,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 36/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 2.9087872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:28,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43981 samples/s/p 5:17:45 } +2024-07-25 19:50:31,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 38/ 1625], loss: 1.103, per_step_time: 1471ms, lr: 2.9085697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:31,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43527 samples/s/p 5:17:58 } +2024-07-25 19:50:34,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 40/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.9083518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:34,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43219 samples/s/p 5:18:06 } +2024-07-25 19:50:37,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 42/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 2.9081337e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:50:37,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43413 samples/s/p 5:17:56 } +2024-07-25 19:50:40,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 44/ 1625], loss: 1.047, per_step_time: 1472ms, lr: 2.9079154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:40,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43271 samples/s/p 5:17:58 } +2024-07-25 19:50:43,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 46/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 2.9076968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:43,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.44065 samples/s/p 5:17:27 } +2024-07-25 19:50:46,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 48/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.9074781e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:46,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43118 samples/s/p 5:17:57 } +2024-07-25 19:50:49,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 50/ 1625], loss: 1.345, per_step_time: 1469ms, lr: 2.907259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:49,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.44226 samples/s/p 5:17:16 } +2024-07-25 19:50:52,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 52/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 2.9070396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:52,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43022 samples/s/p 5:17:55 } +2024-07-25 19:50:55,388 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 54/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 2.9068198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:55,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43672 samples/s/p 5:17:29 } +2024-07-25 19:50:58,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 56/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 2.9066001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:58,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43131 samples/s/p 5:17:45 } +2024-07-25 19:51:01,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 58/ 1625], loss: 1.227, per_step_time: 1474ms, lr: 2.9063798e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:01,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.42534 samples/s/p 5:18:03 } +2024-07-25 19:51:04,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 60/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 2.9061597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:04,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43466 samples/s/p 5:17:28 } +2024-07-25 19:51:07,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 62/ 1625], loss: 1.303, per_step_time: 1474ms, lr: 2.9059389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:07,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.42709 samples/s/p 5:17:51 } +2024-07-25 19:51:10,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 64/ 1625], loss: 1.251, per_step_time: 1473ms, lr: 2.9057182e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:51:10,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43107 samples/s/p 5:17:34 } +2024-07-25 19:51:13,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 66/ 1625], loss: 1.296, per_step_time: 1472ms, lr: 2.905497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:13,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43128 samples/s/p 5:17:31 } +2024-07-25 19:51:16,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 68/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.9052757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:16,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43189 samples/s/p 5:17:26 } +2024-07-25 19:51:19,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 70/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.9050541e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:19,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43525 samples/s/p 5:17:11 } +2024-07-25 19:51:21,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 72/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 2.9048324e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:21,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43307 samples/s/p 5:17:16 } +2024-07-25 19:51:24,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 74/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 2.9046103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:24,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43207 samples/s/p 5:17:16 } +2024-07-25 19:51:27,875 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 76/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.9043878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:27,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43154 samples/s/p 5:17:15 } +2024-07-25 19:51:30,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 78/ 1625], loss: 1.312, per_step_time: 1471ms, lr: 2.9041654e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:30,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43732 samples/s/p 5:16:52 } +2024-07-25 19:51:33,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 80/ 1625], loss: 1.181, per_step_time: 1473ms, lr: 2.9039425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:33,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.42988 samples/s/p 5:17:15 } +2024-07-25 19:51:36,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 82/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 2.9037194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:36,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43255 samples/s/p 5:17:03 } +2024-07-25 19:51:39,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 84/ 1625], loss: 1.167, per_step_time: 1474ms, lr: 2.903496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:39,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.42589 samples/s/p 5:17:23 } +2024-07-25 19:51:42,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 86/ 1625], loss: 1.120, per_step_time: 1475ms, lr: 2.9032724e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:51:42,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.42297 samples/s/p 5:17:30 } +2024-07-25 19:51:45,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 88/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 2.9030487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:45,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43636 samples/s/p 5:16:40 } +2024-07-25 19:51:48,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 90/ 1625], loss: 1.249, per_step_time: 1471ms, lr: 2.9028244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:48,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43480 samples/s/p 5:16:43 } +2024-07-25 19:51:51,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 92/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 2.9026001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:51,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43630 samples/s/p 5:16:35 } +2024-07-25 19:51:54,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 94/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 2.9023757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:54,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43516 samples/s/p 5:16:36 } +2024-07-25 19:51:57,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 96/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 2.9021508e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:57,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43543 samples/s/p 5:16:32 } +2024-07-25 19:52:00,352 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 98/ 1625], loss: 1.090, per_step_time: 1470ms, lr: 2.9019258e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:00,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43872 samples/s/p 5:16:17 } +2024-07-25 19:52:03,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 100/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 2.9017005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:03,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.42900 samples/s/p 5:16:49 } +2024-07-25 19:52:06,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 102/ 1625], loss: 1.056, per_step_time: 1471ms, lr: 2.9014749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:06,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43769 samples/s/p 5:16:15 } +2024-07-25 19:52:09,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 104/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 2.9012492e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:09,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43358 samples/s/p 5:16:27 } +2024-07-25 19:52:12,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 106/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 2.901023e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:12,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.43713 samples/s/p 5:16:11 } +2024-07-25 19:52:15,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 108/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.9007966e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:52:15,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.43529 samples/s/p 5:16:15 } +2024-07-25 19:52:18,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 110/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 2.90057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:18,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.43648 samples/s/p 5:16:08 } +2024-07-25 19:52:21,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 112/ 1625], loss: 1.142, per_step_time: 1473ms, lr: 2.900343e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:21,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.42773 samples/s/p 5:16:35 } +2024-07-25 19:52:23,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 114/ 1625], loss: 1.314, per_step_time: 1472ms, lr: 2.900116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:23,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.43174 samples/s/p 5:16:18 } +2024-07-25 19:52:26,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 116/ 1625], loss: 1.367, per_step_time: 1470ms, lr: 2.8998888e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:26,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.44132 samples/s/p 5:15:42 } +2024-07-25 19:52:29,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 118/ 1625], loss: 1.239, per_step_time: 1472ms, lr: 2.899661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:29,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.43290 samples/s/p 5:16:08 } +2024-07-25 19:52:32,824 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 120/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 2.8994333e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:32,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.42820 samples/s/p 5:16:22 } +2024-07-25 19:52:35,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 122/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 2.8992054e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:35,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43215 samples/s/p 5:16:05 } +2024-07-25 19:52:38,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 124/ 1625], loss: 1.321, per_step_time: 1470ms, lr: 2.898977e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:38,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43904 samples/s/p 5:15:38 } +2024-07-25 19:52:41,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 126/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.8987482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:41,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43293 samples/s/p 5:15:56 } +2024-07-25 19:52:44,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 128/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 2.8985194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:44,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43338 samples/s/p 5:15:52 } +2024-07-25 19:52:47,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 130/ 1625], loss: 1.372, per_step_time: 1473ms, lr: 2.8982906e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:52:47,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43049 samples/s/p 5:15:59 } +2024-07-25 19:52:50,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 132/ 1625], loss: 1.306, per_step_time: 1474ms, lr: 2.8980612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:50,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.42491 samples/s/p 5:16:16 } +2024-07-25 19:52:53,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 134/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.8978317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:53,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43117 samples/s/p 5:15:51 } +2024-07-25 19:52:56,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 136/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 2.8976017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:56,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43017 samples/s/p 5:15:51 } +2024-07-25 19:52:59,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 138/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 2.8973716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:59,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43954 samples/s/p 5:15:16 } +2024-07-25 19:53:02,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 140/ 1625], loss: 1.080, per_step_time: 1473ms, lr: 2.8971413e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:02,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43062 samples/s/p 5:15:44 } +2024-07-25 19:53:05,305 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 142/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 2.8969109e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:05,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43250 samples/s/p 5:15:34 } +2024-07-25 19:53:08,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 144/ 1625], loss: 1.292, per_step_time: 1473ms, lr: 2.89668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:08,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43034 samples/s/p 5:15:39 } +2024-07-25 19:53:11,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 146/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.8964489e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:11,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43635 samples/s/p 5:15:15 } +2024-07-25 19:53:14,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 148/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 2.8962177e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:14,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43389 samples/s/p 5:15:21 } +2024-07-25 19:53:17,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 150/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.8959861e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:17,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43167 samples/s/p 5:15:26 } +2024-07-25 19:53:20,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 152/ 1625], loss: 1.345, per_step_time: 1473ms, lr: 2.895754e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:53:20,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43050 samples/s/p 5:15:27 } +2024-07-25 19:53:23,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 154/ 1625], loss: 1.245, per_step_time: 1475ms, lr: 2.895522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:23,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.42265 samples/s/p 5:15:51 } +2024-07-25 19:53:25,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 156/ 1625], loss: 1.165, per_step_time: 1470ms, lr: 2.8952898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:25,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.44041 samples/s/p 5:14:46 } +2024-07-25 19:53:28,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 158/ 1625], loss: 1.305, per_step_time: 1473ms, lr: 2.8950573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:28,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.42898 samples/s/p 5:15:23 } +2024-07-25 19:53:31,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 160/ 1625], loss: 1.073, per_step_time: 1473ms, lr: 2.8948245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:31,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.42812 samples/s/p 5:15:23 } +2024-07-25 19:53:34,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 162/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 2.8945915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:34,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43708 samples/s/p 5:14:49 } +2024-07-25 19:53:37,786 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 164/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 2.8943581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:37,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43201 samples/s/p 5:15:04 } +2024-07-25 19:53:40,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 166/ 1625], loss: 1.217, per_step_time: 1470ms, lr: 2.8941244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:40,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43858 samples/s/p 5:14:38 } +2024-07-25 19:53:43,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 168/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 2.8938906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:43,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43582 samples/s/p 5:14:45 } +2024-07-25 19:53:46,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 170/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 2.8936567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:46,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43207 samples/s/p 5:14:55 } +2024-07-25 19:53:49,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 172/ 1625], loss: 1.230, per_step_time: 1475ms, lr: 2.8934224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:49,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.42328 samples/s/p 5:15:22 } +2024-07-25 19:53:52,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 174/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 2.893188e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:53:52,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43600 samples/s/p 5:14:35 } +2024-07-25 19:53:55,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 176/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.8929531e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:55,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43433 samples/s/p 5:14:38 } +2024-07-25 19:53:58,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 178/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 2.8927181e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:58,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43477 samples/s/p 5:14:34 } +2024-07-25 19:54:01,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 180/ 1625], loss: 1.014, per_step_time: 1473ms, lr: 2.892483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:01,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.42911 samples/s/p 5:14:50 } +2024-07-25 19:54:04,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 182/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.8922472e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:04,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43031 samples/s/p 5:14:43 } +2024-07-25 19:54:07,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 184/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.8920114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:07,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43242 samples/s/p 5:14:33 } +2024-07-25 19:54:10,265 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 186/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 2.8917755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:10,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43408 samples/s/p 5:14:24 } +2024-07-25 19:54:13,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 188/ 1625], loss: 0.979, per_step_time: 1470ms, lr: 2.8915392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:13,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43974 samples/s/p 5:14:02 } +2024-07-25 19:54:16,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 190/ 1625], loss: 1.189, per_step_time: 1469ms, lr: 2.8913028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:16,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.44246 samples/s/p 5:13:49 } +2024-07-25 19:54:19,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 192/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 2.891066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:19,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43119 samples/s/p 5:14:25 } +2024-07-25 19:54:22,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 194/ 1625], loss: 1.196, per_step_time: 1470ms, lr: 2.890829e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:22,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43871 samples/s/p 5:13:56 } +2024-07-25 19:54:25,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 196/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 2.8905917e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:54:25,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43939 samples/s/p 5:13:51 } +2024-07-25 19:54:27,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 198/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 2.8903542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:27,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43813 samples/s/p 5:13:52 } +2024-07-25 19:54:30,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 200/ 1625], loss: 0.977, per_step_time: 1472ms, lr: 2.8901162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:30,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43448 samples/s/p 5:14:02 } +2024-07-25 19:54:33,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 202/ 1625], loss: 0.911, per_step_time: 1472ms, lr: 2.8898783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:33,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43271 samples/s/p 5:14:05 } +2024-07-25 19:54:36,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 204/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.8896402e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.43197 samples/s/p 5:14:05 } +2024-07-25 19:54:39,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 206/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 2.8894017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:39,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.42912 samples/s/p 5:14:12 } +2024-07-25 19:54:42,723 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 208/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 2.8891629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:42,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.43801 samples/s/p 5:13:38 } +2024-07-25 19:54:45,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 210/ 1625], loss: 1.123, per_step_time: 1474ms, lr: 2.8889239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:45,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.42730 samples/s/p 5:14:12 } +2024-07-25 19:54:48,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 212/ 1625], loss: 1.042, per_step_time: 1471ms, lr: 2.8886847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:48,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.43571 samples/s/p 5:13:40 } +2024-07-25 19:54:51,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 214/ 1625], loss: 1.218, per_step_time: 1474ms, lr: 2.8884451e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:51,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.42596 samples/s/p 5:14:11 } +2024-07-25 19:54:54,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 216/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 2.8882056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:54,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.43627 samples/s/p 5:13:32 } +2024-07-25 19:54:57,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 218/ 1625], loss: 1.330, per_step_time: 1472ms, lr: 2.8879656e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:54:57,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.43389 samples/s/p 5:13:38 } +2024-07-25 19:55:00,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 220/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.8877253e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:00,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.43656 samples/s/p 5:13:26 } +2024-07-25 19:55:03,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 222/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.8874847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:03,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.43355 samples/s/p 5:13:33 } +2024-07-25 19:55:06,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 224/ 1625], loss: 1.312, per_step_time: 1474ms, lr: 2.8872442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:06,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.42667 samples/s/p 5:13:54 } +2024-07-25 19:55:09,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 226/ 1625], loss: 1.336, per_step_time: 1474ms, lr: 2.8870032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:09,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.42557 samples/s/p 5:13:55 } +2024-07-25 19:55:12,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 228/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 2.8867618e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:12,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.43463 samples/s/p 5:13:20 } +2024-07-25 19:55:15,206 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 230/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.8865205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:15,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.43405 samples/s/p 5:13:19 } +2024-07-25 19:55:18,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 232/ 1625], loss: 1.200, per_step_time: 1473ms, lr: 2.8862785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:18,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.42834 samples/s/p 5:13:36 } +2024-07-25 19:55:21,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 234/ 1625], loss: 1.167, per_step_time: 1474ms, lr: 2.8860366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:21,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.42734 samples/s/p 5:13:37 } +2024-07-25 19:55:24,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 236/ 1625], loss: 1.114, per_step_time: 1474ms, lr: 2.8857945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:24,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.42382 samples/s/p 5:13:46 } +2024-07-25 19:55:27,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 238/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.8855518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:27,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43285 samples/s/p 5:13:12 } +2024-07-25 19:55:29,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 240/ 1625], loss: 1.296, per_step_time: 1472ms, lr: 2.8853092e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:55:29,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43214 samples/s/p 5:13:11 } +2024-07-25 19:55:32,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 242/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 2.8850664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:32,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43661 samples/s/p 5:12:53 } +2024-07-25 19:55:35,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 244/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 2.8848232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:35,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43542 samples/s/p 5:12:54 } +2024-07-25 19:55:38,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 246/ 1625], loss: 0.916, per_step_time: 1470ms, lr: 2.8845798e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:38,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.44022 samples/s/p 5:12:35 } +2024-07-25 19:55:41,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 248/ 1625], loss: 1.535, per_step_time: 1470ms, lr: 2.884336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:41,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.44005 samples/s/p 5:12:32 } +2024-07-25 19:55:44,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 250/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 2.884092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:44,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43421 samples/s/p 5:12:49 } +2024-07-25 19:55:47,680 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 252/ 1625], loss: 1.169, per_step_time: 1472ms, lr: 2.883848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:47,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43367 samples/s/p 5:12:48 } +2024-07-25 19:55:50,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 254/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 2.8836035e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:50,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43781 samples/s/p 5:12:31 } +2024-07-25 19:55:53,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 256/ 1625], loss: 1.141, per_step_time: 1470ms, lr: 2.8833589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:53,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43855 samples/s/p 5:12:26 } +2024-07-25 19:55:56,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 258/ 1625], loss: 1.371, per_step_time: 1472ms, lr: 2.883114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:56,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43333 samples/s/p 5:12:41 } +2024-07-25 19:55:59,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 260/ 1625], loss: 1.411, per_step_time: 1473ms, lr: 2.8828688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:59,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.42812 samples/s/p 5:12:56 } +2024-07-25 19:56:02,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 262/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 2.8826234e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:56:02,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43196 samples/s/p 5:12:40 } +2024-07-25 19:56:05,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 264/ 1625], loss: 1.197, per_step_time: 1474ms, lr: 2.8823779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:05,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.42604 samples/s/p 5:12:57 } +2024-07-25 19:56:08,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 266/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 2.8821318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:08,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43184 samples/s/p 5:12:34 } +2024-07-25 19:56:11,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 268/ 1625], loss: 1.161, per_step_time: 1470ms, lr: 2.8818857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:11,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43891 samples/s/p 5:12:07 } +2024-07-25 19:56:14,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 270/ 1625], loss: 1.131, per_step_time: 1470ms, lr: 2.8816394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:14,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43949 samples/s/p 5:12:02 } +2024-07-25 19:56:17,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 272/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 2.8813927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:17,200 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43452 samples/s/p 5:12:16 } +2024-07-25 19:56:20,151 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 274/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 2.8811459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:20,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43530 samples/s/p 5:12:10 } +2024-07-25 19:56:23,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 276/ 1625], loss: 1.230, per_step_time: 1474ms, lr: 2.8808987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:23,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.42625 samples/s/p 5:12:39 } +2024-07-25 19:56:26,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 278/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 2.8806513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:26,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.42816 samples/s/p 5:12:29 } +2024-07-25 19:56:29,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 280/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 2.8804037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:29,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43587 samples/s/p 5:12:00 } +2024-07-25 19:56:31,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 282/ 1625], loss: 1.205, per_step_time: 1473ms, lr: 2.8801558e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:31,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.42866 samples/s/p 5:12:22 } +2024-07-25 19:56:34,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 284/ 1625], loss: 1.280, per_step_time: 1471ms, lr: 2.8799077e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:56:34,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43758 samples/s/p 5:11:48 } +2024-07-25 19:56:37,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 286/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 2.8796594e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:37,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43724 samples/s/p 5:11:46 } +2024-07-25 19:56:40,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 288/ 1625], loss: 1.191, per_step_time: 1470ms, lr: 2.8794107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:40,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43974 samples/s/p 5:11:35 } +2024-07-25 19:56:43,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 290/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 2.879162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:43,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43552 samples/s/p 5:11:46 } +2024-07-25 19:56:46,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 292/ 1625], loss: 0.990, per_step_time: 1471ms, lr: 2.8789127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:46,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43540 samples/s/p 5:11:44 } +2024-07-25 19:56:49,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 294/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 2.8786633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:49,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43578 samples/s/p 5:11:39 } +2024-07-25 19:56:52,619 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 296/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.8784138e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:52,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43511 samples/s/p 5:11:39 } +2024-07-25 19:56:55,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 298/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 2.8781642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:55,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43318 samples/s/p 5:11:42 } +2024-07-25 19:56:58,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 300/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 2.8779139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:58,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43802 samples/s/p 5:11:23 } +2024-07-25 19:57:01,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 302/ 1625], loss: 1.402, per_step_time: 1470ms, lr: 2.8776638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:01,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.43997 samples/s/p 5:11:13 } +2024-07-25 19:57:04,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 304/ 1625], loss: 1.081, per_step_time: 1473ms, lr: 2.8774133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:04,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.42742 samples/s/p 5:11:53 } +2024-07-25 19:57:07,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 306/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 2.8771623e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:57:07,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.43241 samples/s/p 5:11:33 } +2024-07-25 19:57:10,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 308/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.8769113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:10,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.43781 samples/s/p 5:11:12 } +2024-07-25 19:57:13,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 310/ 1625], loss: 1.234, per_step_time: 1473ms, lr: 2.87666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:13,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.42778 samples/s/p 5:11:43 } +2024-07-25 19:57:16,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 312/ 1625], loss: 1.311, per_step_time: 1473ms, lr: 2.8764085e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:16,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.43049 samples/s/p 5:11:31 } +2024-07-25 19:57:19,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 314/ 1625], loss: 1.183, per_step_time: 1474ms, lr: 2.8761566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:19,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.42620 samples/s/p 5:11:43 } +2024-07-25 19:57:22,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 316/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.8759046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:22,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.43439 samples/s/p 5:11:12 } +2024-07-25 19:57:25,096 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 318/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 2.8756524e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:25,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.43339 samples/s/p 5:11:12 } +2024-07-25 19:57:28,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 320/ 1625], loss: 1.310, per_step_time: 1471ms, lr: 2.8753999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:28,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.43611 samples/s/p 5:11:00 } +2024-07-25 19:57:30,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 322/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 2.875147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:30,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.43300 samples/s/p 5:11:08 } +2024-07-25 19:57:33,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 324/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.8748942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:33,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.42772 samples/s/p 5:11:23 } +2024-07-25 19:57:36,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 326/ 1625], loss: 1.234, per_step_time: 1470ms, lr: 2.8746406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:36,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.43968 samples/s/p 5:10:39 } +2024-07-25 19:57:39,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 328/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 2.8743872e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:57:39,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.43305 samples/s/p 5:10:59 } +2024-07-25 19:57:42,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 330/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 2.8741335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:42,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.43260 samples/s/p 5:10:57 } +2024-07-25 19:57:45,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 332/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 2.8738794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:45,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.43757 samples/s/p 5:10:37 } +2024-07-25 19:57:48,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 334/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.8736255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:48,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43423 samples/s/p 5:10:46 } +2024-07-25 19:57:51,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 336/ 1625], loss: 1.295, per_step_time: 1473ms, lr: 2.8733708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:51,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43047 samples/s/p 5:10:56 } +2024-07-25 19:57:54,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 338/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 2.8731161e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:54,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43306 samples/s/p 5:10:44 } +2024-07-25 19:57:57,566 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 340/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.8728611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:57,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43132 samples/s/p 5:10:47 } +2024-07-25 19:58:00,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 342/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.872606e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:00,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43757 samples/s/p 5:10:23 } +2024-07-25 19:58:03,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 344/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.8723503e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:03,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.42967 samples/s/p 5:10:47 } +2024-07-25 19:58:06,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 346/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 2.8720948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:06,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43197 samples/s/p 5:10:36 } +2024-07-25 19:58:09,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 348/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 2.871839e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:09,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43035 samples/s/p 5:10:38 } +2024-07-25 19:58:12,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 350/ 1625], loss: 1.091, per_step_time: 1470ms, lr: 2.8715825e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:58:12,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.44027 samples/s/p 5:10:02 } +2024-07-25 19:58:15,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 352/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.8713264e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:15,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43177 samples/s/p 5:10:28 } +2024-07-25 19:58:18,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 354/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 2.8710696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:18,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43722 samples/s/p 5:10:06 } +2024-07-25 19:58:21,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 356/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 2.8708128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:21,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43143 samples/s/p 5:10:23 } +2024-07-25 19:58:24,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 358/ 1625], loss: 1.305, per_step_time: 1471ms, lr: 2.8705555e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:24,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43609 samples/s/p 5:10:04 } +2024-07-25 19:58:27,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 360/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 2.8702983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:27,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43820 samples/s/p 5:09:54 } +2024-07-25 19:58:30,030 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 362/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.8700404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:30,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43782 samples/s/p 5:09:52 } +2024-07-25 19:58:32,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 364/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 2.8697825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:32,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.44007 samples/s/p 5:09:42 } +2024-07-25 19:58:35,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 366/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 2.8695245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:35,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43656 samples/s/p 5:09:51 } +2024-07-25 19:58:38,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 368/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.869266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:38,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43738 samples/s/p 5:09:45 } +2024-07-25 19:58:41,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 370/ 1625], loss: 1.045, per_step_time: 1473ms, lr: 2.8690074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:41,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.42909 samples/s/p 5:10:10 } +2024-07-25 19:58:44,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 372/ 1625], loss: 1.169, per_step_time: 1472ms, lr: 2.8687486e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:58:44,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43330 samples/s/p 5:09:53 } +2024-07-25 19:58:47,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 374/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.8684895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:47,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43773 samples/s/p 5:09:35 } +2024-07-25 19:58:50,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 376/ 1625], loss: 1.363, per_step_time: 1471ms, lr: 2.8682301e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:50,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43679 samples/s/p 5:09:35 } +2024-07-25 19:58:53,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 378/ 1625], loss: 1.099, per_step_time: 1475ms, lr: 2.8679706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:53,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.42096 samples/s/p 5:10:26 } +2024-07-25 19:58:56,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 380/ 1625], loss: 1.299, per_step_time: 1472ms, lr: 2.8677106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:56,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43172 samples/s/p 5:09:47 } +2024-07-25 19:58:59,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 382/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 2.8674505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:59,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43596 samples/s/p 5:09:29 } +2024-07-25 19:59:02,500 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 384/ 1625], loss: 1.025, per_step_time: 1473ms, lr: 2.8671904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:02,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43020 samples/s/p 5:09:46 } +2024-07-25 19:59:05,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 386/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.8669298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:05,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43375 samples/s/p 5:09:31 } +2024-07-25 19:59:08,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 388/ 1625], loss: 1.387, per_step_time: 1473ms, lr: 2.8666691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:08,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43023 samples/s/p 5:09:40 } +2024-07-25 19:59:11,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 390/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.866408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:11,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43425 samples/s/p 5:09:23 } +2024-07-25 19:59:14,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 392/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 2.8661465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:14,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.44098 samples/s/p 5:08:57 } +2024-07-25 19:59:17,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 394/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.865885e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:59:17,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43234 samples/s/p 5:09:24 } +2024-07-25 19:59:20,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 396/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.8656234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:20,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43565 samples/s/p 5:09:10 } +2024-07-25 19:59:23,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 398/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 2.8653612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:23,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43275 samples/s/p 5:09:17 } +2024-07-25 19:59:26,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 400/ 1625], loss: 1.107, per_step_time: 1473ms, lr: 2.865099e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:26,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.42983 samples/s/p 5:09:24 } +2024-07-25 19:59:29,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 402/ 1625], loss: 0.941, per_step_time: 1470ms, lr: 2.8648365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:29,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.44015 samples/s/p 5:08:45 } +2024-07-25 19:59:32,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 404/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.8645738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:32,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43822 samples/s/p 5:08:49 } +2024-07-25 19:59:34,964 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 406/ 1625], loss: 0.998, per_step_time: 1472ms, lr: 2.8643106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:34,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43247 samples/s/p 5:09:06 } +2024-07-25 19:59:37,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 408/ 1625], loss: 1.095, per_step_time: 1474ms, lr: 2.8640474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:37,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.42680 samples/s/p 5:09:22 } +2024-07-25 19:59:40,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 410/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 2.863784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:40,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43537 samples/s/p 5:08:50 } +2024-07-25 19:59:43,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 412/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.8635202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:43,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43429 samples/s/p 5:08:51 } +2024-07-25 19:59:46,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 414/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.8632563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:46,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43173 samples/s/p 5:08:56 } +2024-07-25 19:59:49,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 416/ 1625], loss: 1.040, per_step_time: 1471ms, lr: 2.8629922e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:59:49,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43735 samples/s/p 5:08:34 } +2024-07-25 19:59:52,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 418/ 1625], loss: 1.035, per_step_time: 1472ms, lr: 2.8627277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:52,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43451 samples/s/p 5:08:41 } +2024-07-25 19:59:55,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 420/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 2.8624629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:55,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43801 samples/s/p 5:08:26 } +2024-07-25 19:59:58,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 422/ 1625], loss: 1.160, per_step_time: 1470ms, lr: 2.862198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:58,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43989 samples/s/p 5:08:17 } +2024-07-25 20:00:01,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 424/ 1625], loss: 1.110, per_step_time: 1469ms, lr: 2.8619328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:01,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.44308 samples/s/p 5:08:03 } +2024-07-25 20:00:04,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 426/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.8616674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:04,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43528 samples/s/p 5:08:27 } +2024-07-25 20:00:07,419 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 428/ 1625], loss: 1.231, per_step_time: 1470ms, lr: 2.8614015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:07,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.44027 samples/s/p 5:08:07 } +2024-07-25 20:00:10,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 430/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 2.8611357e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:10,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43444 samples/s/p 5:08:24 } +2024-07-25 20:00:13,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 432/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.8608694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:13,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43731 samples/s/p 5:08:11 } +2024-07-25 20:00:16,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 434/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 2.8606033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:16,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.44045 samples/s/p 5:07:57 } +2024-07-25 20:00:19,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 436/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.8603366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:19,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43268 samples/s/p 5:08:21 } +2024-07-25 20:00:22,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 438/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 2.8600698e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:00:22,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43490 samples/s/p 5:08:10 } +2024-07-25 20:00:25,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 440/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 2.8598026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:25,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43821 samples/s/p 5:07:56 } +2024-07-25 20:00:28,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 442/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 2.8595354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:28,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43303 samples/s/p 5:08:11 } +2024-07-25 20:00:31,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 444/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 2.8592678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:31,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43284 samples/s/p 5:08:09 } +2024-07-25 20:00:33,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 446/ 1625], loss: 1.317, per_step_time: 1473ms, lr: 2.8589999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:33,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.42895 samples/s/p 5:08:19 } +2024-07-25 20:00:36,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 448/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.858732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:36,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.43367 samples/s/p 5:08:00 } +2024-07-25 20:00:39,883 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 450/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 2.8584634e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:39,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.43587 samples/s/p 5:07:49 } +2024-07-25 20:00:42,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 452/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 2.858195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:42,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.42986 samples/s/p 5:08:07 } +2024-07-25 20:00:45,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 454/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 2.8579261e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:45,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.43922 samples/s/p 5:07:32 } +2024-07-25 20:00:48,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 456/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 2.857657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:48,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.42887 samples/s/p 5:08:04 } +2024-07-25 20:00:51,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 458/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 2.8573877e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:51,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.42997 samples/s/p 5:07:58 } +2024-07-25 20:00:54,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 460/ 1625], loss: 1.174, per_step_time: 1473ms, lr: 2.8571181e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:00:54,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.42902 samples/s/p 5:07:58 } +2024-07-25 20:00:57,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 462/ 1625], loss: 1.415, per_step_time: 1471ms, lr: 2.8568486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:57,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.43529 samples/s/p 5:07:34 } +2024-07-25 20:01:00,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 464/ 1625], loss: 1.383, per_step_time: 1473ms, lr: 2.8565784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:00,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.42975 samples/s/p 5:07:50 } +2024-07-25 20:01:03,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 466/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 2.8563083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:03,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.44123 samples/s/p 5:07:08 } +2024-07-25 20:01:06,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 468/ 1625], loss: 1.058, per_step_time: 1471ms, lr: 2.8560375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:06,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.43636 samples/s/p 5:07:21 } +2024-07-25 20:01:09,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 470/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 2.8557668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:09,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.42927 samples/s/p 5:07:42 } +2024-07-25 20:01:12,357 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 472/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 2.855496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:12,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.43160 samples/s/p 5:07:32 } +2024-07-25 20:01:15,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 474/ 1625], loss: 1.054, per_step_time: 1470ms, lr: 2.8552247e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:15,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.43883 samples/s/p 5:07:04 } +2024-07-25 20:01:18,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 476/ 1625], loss: 1.055, per_step_time: 1474ms, lr: 2.8549533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:18,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.42424 samples/s/p 5:07:51 } +2024-07-25 20:01:21,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 478/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.8546816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:21,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.43332 samples/s/p 5:07:17 } +2024-07-25 20:01:24,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 480/ 1625], loss: 0.999, per_step_time: 1471ms, lr: 2.8544096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:24,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43490 samples/s/p 5:07:09 } +2024-07-25 20:01:27,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 482/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 2.8541375e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:01:27,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43475 samples/s/p 5:07:06 } +2024-07-25 20:01:30,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 484/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 2.853865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:30,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43659 samples/s/p 5:06:57 } +2024-07-25 20:01:33,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 486/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.8535924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:33,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43606 samples/s/p 5:06:56 } +2024-07-25 20:01:35,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 488/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.8533195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:35,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43487 samples/s/p 5:06:57 } +2024-07-25 20:01:38,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 490/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 2.8530465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:38,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43188 samples/s/p 5:07:04 } +2024-07-25 20:01:41,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 492/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 2.8527731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:41,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43327 samples/s/p 5:06:56 } +2024-07-25 20:01:44,824 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 494/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 2.8524992e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:44,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43603 samples/s/p 5:06:44 } +2024-07-25 20:01:47,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 496/ 1625], loss: 1.042, per_step_time: 1472ms, lr: 2.8522254e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:47,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43434 samples/s/p 5:06:47 } +2024-07-25 20:01:50,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 498/ 1625], loss: 1.339, per_step_time: 1471ms, lr: 2.8519513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:50,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43609 samples/s/p 5:06:38 } +2024-07-25 20:01:53,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 500/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 2.8516772e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:53,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43629 samples/s/p 5:06:34 } +2024-07-25 20:01:56,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 502/ 1625], loss: 1.412, per_step_time: 1473ms, lr: 2.8514025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:56,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.42836 samples/s/p 5:06:58 } +2024-07-25 20:01:59,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 504/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 2.8511276e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:01:59,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43555 samples/s/p 5:06:31 } +2024-07-25 20:02:02,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 506/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 2.8508526e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:02,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43189 samples/s/p 5:06:40 } +2024-07-25 20:02:05,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 508/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.8505772e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:05,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.44077 samples/s/p 5:06:07 } +2024-07-25 20:02:08,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 510/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.8503016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:08,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43217 samples/s/p 5:06:34 } +2024-07-25 20:02:11,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 512/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 2.8500259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:11,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43831 samples/s/p 5:06:10 } +2024-07-25 20:02:14,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 514/ 1625], loss: 1.138, per_step_time: 1473ms, lr: 2.8497498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:14,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.42857 samples/s/p 5:06:40 } +2024-07-25 20:02:17,289 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 516/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 2.8494736e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:17,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43732 samples/s/p 5:06:07 } +2024-07-25 20:02:20,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 518/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 2.849197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:20,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43147 samples/s/p 5:06:24 } +2024-07-25 20:02:23,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 520/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 2.8489203e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:23,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43656 samples/s/p 5:06:04 } +2024-07-25 20:02:26,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 522/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 2.8486435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:26,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43128 samples/s/p 5:06:19 } +2024-07-25 20:02:29,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 524/ 1625], loss: 1.129, per_step_time: 1470ms, lr: 2.848366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:29,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.44009 samples/s/p 5:05:46 } +2024-07-25 20:02:32,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 526/ 1625], loss: 1.340, per_step_time: 1471ms, lr: 2.8480888e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:02:32,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43570 samples/s/p 5:05:58 } +2024-07-25 20:02:34,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 528/ 1625], loss: 1.487, per_step_time: 1470ms, lr: 2.8478109e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:34,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43998 samples/s/p 5:05:41 } +2024-07-25 20:02:37,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 530/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 2.8475331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:37,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43189 samples/s/p 5:06:05 } +2024-07-25 20:02:40,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 532/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 2.8472548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:40,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43954 samples/s/p 5:05:36 } +2024-07-25 20:02:43,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 534/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.8469765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:43,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43352 samples/s/p 5:05:54 } +2024-07-25 20:02:46,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 536/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 2.8466979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:46,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43675 samples/s/p 5:05:40 } +2024-07-25 20:02:49,745 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 538/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 2.846419e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:49,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43634 samples/s/p 5:05:38 } +2024-07-25 20:02:52,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 540/ 1625], loss: 1.051, per_step_time: 1470ms, lr: 2.84614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:52,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43944 samples/s/p 5:05:25 } +2024-07-25 20:02:55,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 542/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.8458602e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:55,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43795 samples/s/p 5:05:27 } +2024-07-25 20:02:58,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 544/ 1625], loss: 1.299, per_step_time: 1471ms, lr: 2.845581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:58,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43839 samples/s/p 5:05:23 } +2024-07-25 20:03:01,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 546/ 1625], loss: 1.136, per_step_time: 1473ms, lr: 2.8453009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:01,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.42913 samples/s/p 5:05:51 } +2024-07-25 20:03:04,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 548/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 2.845021e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 20:03:04,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43848 samples/s/p 5:05:16 } +2024-07-25 20:03:07,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 550/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 2.8447404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:07,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43508 samples/s/p 5:05:25 } +2024-07-25 20:03:10,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 552/ 1625], loss: 1.030, per_step_time: 1472ms, lr: 2.8444598e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:10,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43261 samples/s/p 5:05:30 } +2024-07-25 20:03:13,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 554/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 2.8441791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:13,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43591 samples/s/p 5:05:16 } +2024-07-25 20:03:16,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 556/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 2.843898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:16,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43831 samples/s/p 5:05:05 } +2024-07-25 20:03:19,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 558/ 1625], loss: 1.013, per_step_time: 1469ms, lr: 2.8436167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:19,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.44374 samples/s/p 5:04:44 } +2024-07-25 20:03:22,199 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 560/ 1625], loss: 1.144, per_step_time: 1473ms, lr: 2.8433353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:22,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43028 samples/s/p 5:05:26 } +2024-07-25 20:03:25,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 562/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 2.8430537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:25,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43166 samples/s/p 5:05:19 } +2024-07-25 20:03:28,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 564/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.8427714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:28,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43822 samples/s/p 5:04:54 } +2024-07-25 20:03:31,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 566/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 2.8424893e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:31,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.44053 samples/s/p 5:04:43 } +2024-07-25 20:03:34,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 568/ 1625], loss: 1.203, per_step_time: 1476ms, lr: 2.8422068e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:34,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.41720 samples/s/p 5:05:59 } +2024-07-25 20:03:36,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 570/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 2.8419241e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:03:36,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43698 samples/s/p 5:04:49 } +2024-07-25 20:03:39,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 572/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 2.841641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:39,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43830 samples/s/p 5:04:42 } +2024-07-25 20:03:42,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 574/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 2.8413579e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:42,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43269 samples/s/p 5:04:58 } +2024-07-25 20:03:45,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 576/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 2.8410743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:45,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43592 samples/s/p 5:04:44 } +2024-07-25 20:03:48,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 578/ 1625], loss: 1.349, per_step_time: 1472ms, lr: 2.8407909e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:48,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43465 samples/s/p 5:04:45 } +2024-07-25 20:03:51,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 580/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.8405067e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:51,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43650 samples/s/p 5:04:36 } +2024-07-25 20:03:54,665 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 582/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 2.8402226e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:54,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43303 samples/s/p 5:04:45 } +2024-07-25 20:03:57,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 584/ 1625], loss: 1.113, per_step_time: 1474ms, lr: 2.8399383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:57,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.42483 samples/s/p 5:05:09 } +2024-07-25 20:04:00,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 586/ 1625], loss: 1.062, per_step_time: 1472ms, lr: 2.8396536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:00,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43152 samples/s/p 5:04:44 } +2024-07-25 20:04:03,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 588/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 2.8393688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:03,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43623 samples/s/p 5:04:25 } +2024-07-25 20:04:06,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 590/ 1625], loss: 1.222, per_step_time: 1469ms, lr: 2.8390838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:06,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.44262 samples/s/p 5:04:01 } +2024-07-25 20:04:09,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 592/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 2.8387982e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:04:09,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43741 samples/s/p 5:04:15 } +2024-07-25 20:04:12,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 594/ 1625], loss: 1.230, per_step_time: 1470ms, lr: 2.8385126e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:12,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43851 samples/s/p 5:04:09 } +2024-07-25 20:04:15,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 596/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 2.8382266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:15,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43376 samples/s/p 5:04:22 } +2024-07-25 20:04:18,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 598/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 2.8379409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:18,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43162 samples/s/p 5:04:26 } +2024-07-25 20:04:21,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 600/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 2.8376546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:21,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43535 samples/s/p 5:04:10 } +2024-07-25 20:04:24,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 602/ 1625], loss: 1.389, per_step_time: 1471ms, lr: 2.8373679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:24,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43585 samples/s/p 5:04:06 } +2024-07-25 20:04:27,126 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 604/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.8370812e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:27,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43797 samples/s/p 5:03:56 } +2024-07-25 20:04:30,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 606/ 1625], loss: 1.035, per_step_time: 1470ms, lr: 2.8367942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:30,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.44129 samples/s/p 5:03:42 } +2024-07-25 20:04:33,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 608/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 2.836507e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:33,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43746 samples/s/p 5:03:52 } +2024-07-25 20:04:35,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 610/ 1625], loss: 1.061, per_step_time: 1470ms, lr: 2.8362196e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:35,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43941 samples/s/p 5:03:42 } +2024-07-25 20:04:38,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 612/ 1625], loss: 1.135, per_step_time: 1474ms, lr: 2.835932e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:38,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.42492 samples/s/p 5:04:28 } +2024-07-25 20:04:41,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 614/ 1625], loss: 1.297, per_step_time: 1473ms, lr: 2.8356437e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:04:41,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.42914 samples/s/p 5:04:11 } +2024-07-25 20:04:44,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 616/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 2.8353556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:44,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43490 samples/s/p 5:03:48 } +2024-07-25 20:04:47,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 618/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 2.8350672e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:47,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43787 samples/s/p 5:03:35 } +2024-07-25 20:04:50,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 620/ 1625], loss: 1.351, per_step_time: 1471ms, lr: 2.8347786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:50,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43762 samples/s/p 5:03:33 } +2024-07-25 20:04:53,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 622/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.8344895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:53,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43800 samples/s/p 5:03:29 } +2024-07-25 20:04:56,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 624/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 2.8342007e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:56,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43930 samples/s/p 5:03:22 } +2024-07-25 20:04:59,583 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 626/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 2.8339113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:59,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.43213 samples/s/p 5:03:43 } +2024-07-25 20:05:02,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 628/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 2.8336215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:02,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.43199 samples/s/p 5:03:40 } +2024-07-25 20:05:05,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 630/ 1625], loss: 1.062, per_step_time: 1473ms, lr: 2.8333317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:05,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.42951 samples/s/p 5:03:46 } +2024-07-25 20:05:08,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 632/ 1625], loss: 1.066, per_step_time: 1474ms, lr: 2.8330414e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:08,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.42707 samples/s/p 5:03:51 } +2024-07-25 20:05:11,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 634/ 1625], loss: 1.235, per_step_time: 1473ms, lr: 2.8327513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:11,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.43012 samples/s/p 5:03:38 } +2024-07-25 20:05:14,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 636/ 1625], loss: 1.156, per_step_time: 1473ms, lr: 2.8324606e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:05:14,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.43058 samples/s/p 5:03:33 } +2024-07-25 20:05:17,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 638/ 1625], loss: 0.975, per_step_time: 1471ms, lr: 2.83217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:17,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.43562 samples/s/p 5:03:14 } +2024-07-25 20:05:20,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 640/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 2.831879e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:20,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.43440 samples/s/p 5:03:15 } +2024-07-25 20:05:23,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 642/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 2.8315875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:23,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.43891 samples/s/p 5:02:57 } +2024-07-25 20:05:26,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 644/ 1625], loss: 1.260, per_step_time: 1473ms, lr: 2.831296e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:26,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.42841 samples/s/p 5:03:29 } +2024-07-25 20:05:29,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 646/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 2.8310042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:29,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.43735 samples/s/p 5:02:56 } +2024-07-25 20:05:32,063 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 648/ 1625], loss: 1.377, per_step_time: 1474ms, lr: 2.8307122e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:32,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.42685 samples/s/p 5:03:28 } +2024-07-25 20:05:35,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 650/ 1625], loss: 1.391, per_step_time: 1470ms, lr: 2.8304199e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:35,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.44165 samples/s/p 5:02:36 } +2024-07-25 20:05:37,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 652/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 2.8301274e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:37,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.43763 samples/s/p 5:02:46 } +2024-07-25 20:05:40,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 654/ 1625], loss: 1.057, per_step_time: 1473ms, lr: 2.8298351e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:40,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.42874 samples/s/p 5:03:13 } +2024-07-25 20:05:43,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 656/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 2.829542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:43,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.43811 samples/s/p 5:02:39 } +2024-07-25 20:05:46,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 658/ 1625], loss: 1.197, per_step_time: 1470ms, lr: 2.829249e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:05:46,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.44065 samples/s/p 5:02:27 } +2024-07-25 20:05:49,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 660/ 1625], loss: 1.343, per_step_time: 1471ms, lr: 2.8289556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:49,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43595 samples/s/p 5:02:40 } +2024-07-25 20:05:52,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 662/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 2.828662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:52,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43626 samples/s/p 5:02:36 } +2024-07-25 20:05:55,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 664/ 1625], loss: 1.308, per_step_time: 1472ms, lr: 2.8283679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:55,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43176 samples/s/p 5:02:48 } +2024-07-25 20:05:58,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 666/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 2.8280738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:58,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43061 samples/s/p 5:02:49 } +2024-07-25 20:06:01,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 668/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 2.8277795e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:01,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43398 samples/s/p 5:02:35 } +2024-07-25 
20:06:04,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 670/ 1625], loss: 1.256, per_step_time: 1470ms, lr: 2.827485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:04,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43966 samples/s/p 5:02:13 } +2024-07-25 20:06:07,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 672/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 2.8271901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:07,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43697 samples/s/p 5:02:19 } +2024-07-25 20:06:10,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 674/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 2.826895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:10,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43740 samples/s/p 5:02:15 } +2024-07-25 20:06:13,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 676/ 1625], loss: 1.134, per_step_time: 1470ms, lr: 2.8265997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:13,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43924 samples/s/p 5:02:06 } +2024-07-25 20:06:16,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 678/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 2.826304e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:16,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43199 samples/s/p 5:02:27 } +2024-07-25 20:06:19,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 680/ 1625], loss: 1.368, per_step_time: 1473ms, lr: 2.8260083e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:06:19,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.42904 samples/s/p 5:02:34 } +2024-07-25 20:06:22,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 682/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 2.8257125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:22,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43478 samples/s/p 5:02:12 } +2024-07-25 20:06:25,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 684/ 1625], loss: 1.144, per_step_time: 1472ms, lr: 2.8254162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:25,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43408 samples/s/p 5:02:11 } +2024-07-25 20:06:28,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 686/ 1625], loss: 0.980, per_step_time: 1469ms, lr: 2.8251197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:28,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.44399 samples/s/p 5:01:35 } +2024-07-25 20:06:31,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 688/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 2.8248229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:31,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43170 samples/s/p 5:02:13 } +2024-07-25 20:06:34,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 690/ 1625], loss: 1.326, per_step_time: 1473ms, lr: 2.824526e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:34,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.42857 samples/s/p 5:02:21 } 
+2024-07-25 20:06:36,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 692/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.8242288e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:36,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43358 samples/s/p 5:02:01 } +2024-07-25 20:06:39,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 694/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.8239314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:39,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43144 samples/s/p 5:02:05 } +2024-07-25 20:06:42,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 696/ 1625], loss: 1.245, per_step_time: 1471ms, lr: 2.8236338e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:42,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43645 samples/s/p 5:01:45 } +2024-07-25 20:06:45,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 698/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.823336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:45,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43136 samples/s/p 5:01:59 } +2024-07-25 20:06:48,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 700/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 2.8230377e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:48,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43362 samples/s/p 5:01:49 } +2024-07-25 20:06:51,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 702/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 
2.8227394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:51,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43259 samples/s/p 5:01:49 } +2024-07-25 20:06:54,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 704/ 1625], loss: 1.274, per_step_time: 1473ms, lr: 2.8224411e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:54,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43005 samples/s/p 5:01:55 } +2024-07-25 20:06:57,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 706/ 1625], loss: 1.317, per_step_time: 1471ms, lr: 2.822142e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:57,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43672 samples/s/p 5:01:30 } +2024-07-25 20:07:00,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 708/ 1625], loss: 1.182, per_step_time: 1474ms, lr: 2.8218434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:00,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.42573 samples/s/p 5:02:03 } +2024-07-25 20:07:03,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 710/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 2.821544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:03,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43038 samples/s/p 5:01:45 } +2024-07-25 20:07:06,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 712/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.8212444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:06,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43488 
samples/s/p 5:01:27 } +2024-07-25 20:07:09,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 714/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.8209444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:09,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43580 samples/s/p 5:01:21 } +2024-07-25 20:07:12,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 716/ 1625], loss: 1.227, per_step_time: 1470ms, lr: 2.8206448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:12,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43965 samples/s/p 5:01:05 } +2024-07-25 20:07:15,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 718/ 1625], loss: 1.190, per_step_time: 1474ms, lr: 2.8203443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:15,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.42635 samples/s/p 5:01:47 } +2024-07-25 20:07:18,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 720/ 1625], loss: 1.027, per_step_time: 1473ms, lr: 2.8200438e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:18,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43094 samples/s/p 5:01:28 } +2024-07-25 20:07:21,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 722/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 2.8197432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:21,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43841 samples/s/p 5:01:01 } +2024-07-25 20:07:24,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 724/ 1625], loss: 1.173, per_step_time: 
1470ms, lr: 2.8194423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:24,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43936 samples/s/p 5:00:55 } +2024-07-25 20:07:27,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 726/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.819141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:27,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43586 samples/s/p 5:01:03 } +2024-07-25 20:07:30,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 728/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 2.8188399e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:30,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43066 samples/s/p 5:01:18 } +2024-07-25 20:07:33,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 730/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 2.818538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:33,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43060 samples/s/p 5:01:15 } +2024-07-25 20:07:36,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 732/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.8182361e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:36,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43752 samples/s/p 5:00:49 } +2024-07-25 20:07:38,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 734/ 1625], loss: 1.320, per_step_time: 1472ms, lr: 2.817934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:38,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 
5.43475 samples/s/p 5:00:55 } +2024-07-25 20:07:41,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 736/ 1625], loss: 1.435, per_step_time: 1471ms, lr: 2.8176317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:41,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43551 samples/s/p 5:00:50 } +2024-07-25 20:07:44,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 738/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 2.817329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:44,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43362 samples/s/p 5:00:53 } +2024-07-25 20:07:47,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 740/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 2.8170265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:47,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43871 samples/s/p 5:00:33 } +2024-07-25 20:07:50,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 742/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 2.8167233e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:50,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43667 samples/s/p 5:00:37 } +2024-07-25 20:07:53,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 744/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 2.8164202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:53,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43309 samples/s/p 5:00:46 } +2024-07-25 20:07:56,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 746/ 1625], loss: 1.239, 
per_step_time: 1471ms, lr: 2.8161166e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:56,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43665 samples/s/p 5:00:31 } +2024-07-25 20:07:59,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 748/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 2.8158129e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:59,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43282 samples/s/p 5:00:41 } +2024-07-25 20:08:02,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 750/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 2.815509e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:02,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43891 samples/s/p 5:00:18 } +2024-07-25 20:08:05,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 752/ 1625], loss: 1.284, per_step_time: 1473ms, lr: 2.8152048e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:05,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.42985 samples/s/p 5:00:45 } +2024-07-25 20:08:08,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 754/ 1625], loss: 1.219, per_step_time: 1470ms, lr: 2.8149003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:08,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43974 samples/s/p 5:00:09 } +2024-07-25 20:08:11,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 756/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.8145956e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:11,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% 
|████████████ | 5.43499 samples/s/p 5:00:22 } +2024-07-25 20:08:14,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 758/ 1625], loss: 1.360, per_step_time: 1471ms, lr: 2.8142907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:14,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43736 samples/s/p 5:00:11 } +2024-07-25 20:08:17,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 760/ 1625], loss: 1.331, per_step_time: 1472ms, lr: 2.8139855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:17,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43153 samples/s/p 5:00:28 } +2024-07-25 20:08:20,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 762/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.8136801e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:20,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43736 samples/s/p 5:00:05 } +2024-07-25 20:08:23,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 764/ 1625], loss: 1.074, per_step_time: 1473ms, lr: 2.8133745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:23,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43055 samples/s/p 5:00:25 } +2024-07-25 20:08:26,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 766/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.8130687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:26,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43805 samples/s/p 4:59:57 } +2024-07-25 20:08:29,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 768/ 1625], loss: 
1.185, per_step_time: 1472ms, lr: 2.8127626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:29,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43252 samples/s/p 5:00:13 } +2024-07-25 20:08:32,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 770/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.8124563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:32,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43241 samples/s/p 5:00:10 } +2024-07-25 20:08:35,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 772/ 1625], loss: 1.004, per_step_time: 1471ms, lr: 2.8121498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:35,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43828 samples/s/p 4:59:48 } +2024-07-25 20:08:37,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 774/ 1625], loss: 1.152, per_step_time: 1469ms, lr: 2.8118431e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:37,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.44304 samples/s/p 4:59:29 } +2024-07-25 20:08:40,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 776/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 2.811536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:40,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43953 samples/s/p 4:59:38 } +2024-07-25 20:08:43,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 778/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 2.8112287e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:43,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
24.8% |████████████ | 5.43915 samples/s/p 4:59:36 } +2024-07-25 20:08:46,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 780/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 2.8109214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:46,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43990 samples/s/p 4:59:30 } +2024-07-25 20:08:49,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 782/ 1625], loss: 1.063, per_step_time: 1473ms, lr: 2.8106135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:49,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43033 samples/s/p 4:59:59 } +2024-07-25 20:08:52,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 784/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 2.8103057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:52,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43224 samples/s/p 4:59:50 } +2024-07-25 20:08:55,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 786/ 1625], loss: 1.206, per_step_time: 1469ms, lr: 2.8099974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:55,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.44543 samples/s/p 4:59:03 } +2024-07-25 20:08:58,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 788/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 2.8096889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:58,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43420 samples/s/p 4:59:37 } +2024-07-25 20:09:01,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 790/ 1625], 
loss: 1.223, per_step_time: 1470ms, lr: 2.8093804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:01,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43936 samples/s/p 4:59:17 } +2024-07-25 20:09:04,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 792/ 1625], loss: 1.290, per_step_time: 1471ms, lr: 2.8090715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:04,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43789 samples/s/p 4:59:19 } +2024-07-25 20:09:07,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 794/ 1625], loss: 1.017, per_step_time: 1471ms, lr: 2.8087625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:07,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43791 samples/s/p 4:59:16 } +2024-07-25 20:09:10,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 796/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.8084534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:10,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43251 samples/s/p 4:59:31 } +2024-07-25 20:09:13,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 798/ 1625], loss: 1.312, per_step_time: 1473ms, lr: 2.8081437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:13,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43045 samples/s/p 4:59:35 } +2024-07-25 20:09:16,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 800/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 2.8078339e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:16,337 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 24.9% |████████████ | 5.43838 samples/s/p 4:59:06 } +2024-07-25 20:09:19,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 802/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 2.8075237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:19,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43186 samples/s/p 4:59:25 } +2024-07-25 20:09:22,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 804/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.8072136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:22,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43120 samples/s/p 4:59:24 } +2024-07-25 20:09:25,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 806/ 1625], loss: 1.049, per_step_time: 1472ms, lr: 2.8069033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:25,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43396 samples/s/p 4:59:12 } +2024-07-25 20:09:28,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 808/ 1625], loss: 1.130, per_step_time: 1469ms, lr: 2.8065924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:28,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.44254 samples/s/p 4:58:41 } +2024-07-25 20:09:31,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 810/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 2.8062814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:31,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43449 samples/s/p 4:59:04 } +2024-07-25 20:09:34,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 812/ 
1625], loss: 1.173, per_step_time: 1470ms, lr: 2.8059701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:34,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43888 samples/s/p 4:58:47 } +2024-07-25 20:09:36,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 814/ 1625], loss: 1.341, per_step_time: 1471ms, lr: 2.8056587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:36,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43647 samples/s/p 4:58:52 } +2024-07-25 20:09:39,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 816/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 2.8053471e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:39,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43846 samples/s/p 4:58:42 } +2024-07-25 20:09:42,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 818/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 2.8050354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:42,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43007 samples/s/p 4:59:07 } +2024-07-25 20:09:45,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 820/ 1625], loss: 1.054, per_step_time: 1470ms, lr: 2.8047232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:45,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.44159 samples/s/p 4:58:26 } +2024-07-25 20:09:48,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 822/ 1625], loss: 1.267, per_step_time: 1474ms, lr: 2.8044109e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:48,798 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.42696 samples/s/p 4:59:11 } +2024-07-25 20:09:51,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 824/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 2.8040982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:51,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43407 samples/s/p 4:58:45 } +2024-07-25 20:09:54,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 826/ 1625], loss: 1.193, per_step_time: 1471ms, lr: 2.8037857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:54,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43682 samples/s/p 4:58:33 } +2024-07-25 20:09:57,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 828/ 1625], loss: 1.145, per_step_time: 1470ms, lr: 2.8034725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:57,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43931 samples/s/p 4:58:22 } +2024-07-25 20:10:00,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 830/ 1625], loss: 1.069, per_step_time: 1473ms, lr: 2.8031593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:00,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.42883 samples/s/p 4:58:53 } +2024-07-25 20:10:03,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 832/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 2.8028457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:03,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43793 samples/s/p 4:58:20 } +2024-07-25 20:10:06,500 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 834/ 1625], loss: 1.221, per_step_time: 1470ms, lr: 2.802532e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:06,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.44001 samples/s/p 4:58:11 } +2024-07-25 20:10:09,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 836/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.8022181e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:09,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43159 samples/s/p 4:58:35 } +2024-07-25 20:10:12,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 838/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 2.8019038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:12,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.42771 samples/s/p 4:58:45 } +2024-07-25 20:10:15,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 840/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.8015895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:15,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.43772 samples/s/p 4:58:09 } +2024-07-25 20:10:18,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 842/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 2.8012748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:18,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.43552 samples/s/p 4:58:14 } +2024-07-25 20:10:21,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 844/ 1625], loss: 1.199, per_step_time: 1469ms, lr: 2.80096e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:10:21,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.44292 samples/s/p 4:57:46 } +2024-07-25 20:10:24,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 846/ 1625], loss: 1.312, per_step_time: 1470ms, lr: 2.8006447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:24,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.43974 samples/s/p 4:57:54 } +2024-07-25 20:10:27,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 848/ 1625], loss: 1.213, per_step_time: 1473ms, lr: 2.8003293e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:27,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.42941 samples/s/p 4:58:25 } +2024-07-25 20:10:30,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 850/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.8000139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:30,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.43290 samples/s/p 4:58:10 } +2024-07-25 20:10:33,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 852/ 1625], loss: 1.193, per_step_time: 1469ms, lr: 2.799698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:33,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.44220 samples/s/p 4:57:37 } +2024-07-25 20:10:36,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 854/ 1625], loss: 1.300, per_step_time: 1470ms, lr: 2.7993821e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:36,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.44060 samples/s/p 4:57:39 } +2024-07-25 
20:10:38,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 856/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 2.7990658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:38,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43371 samples/s/p 4:57:59 } +2024-07-25 20:10:41,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 858/ 1625], loss: 1.109, per_step_time: 1471ms, lr: 2.7987491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:41,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43495 samples/s/p 4:57:52 } +2024-07-25 20:10:44,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 860/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.7984324e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:44,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43269 samples/s/p 4:57:56 } +2024-07-25 20:10:47,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 862/ 1625], loss: 1.279, per_step_time: 1469ms, lr: 2.7981154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:47,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.44231 samples/s/p 4:57:22 } +2024-07-25 20:10:50,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 864/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.7977982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:50,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43490 samples/s/p 4:57:43 } +2024-07-25 20:10:53,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 866/ 1625], loss: 0.923, per_step_time: 1470ms, lr: 2.7974807e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:10:53,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.44056 samples/s/p 4:57:22 } +2024-07-25 20:10:56,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 868/ 1625], loss: 1.200, per_step_time: 1473ms, lr: 2.7971631e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:56,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.42815 samples/s/p 4:58:00 } +2024-07-25 20:10:59,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 870/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 2.7968452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:59,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.42998 samples/s/p 4:57:51 } +2024-07-25 20:11:02,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 872/ 1625], loss: 1.453, per_step_time: 1471ms, lr: 2.7965272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:02,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43502 samples/s/p 4:57:31 } +2024-07-25 20:11:05,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 874/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.7962087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:05,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43310 samples/s/p 4:57:34 } +2024-07-25 20:11:08,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 876/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.7958902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:08,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43377 samples/s/p 4:57:29 } 
+2024-07-25 20:11:11,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 878/ 1625], loss: 1.262, per_step_time: 1472ms, lr: 2.7955713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:11,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43114 samples/s/p 4:57:35 } +2024-07-25 20:11:14,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 880/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 2.7952523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:14,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43595 samples/s/p 4:57:16 } +2024-07-25 20:11:17,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 882/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 2.794933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:17,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43782 samples/s/p 4:57:07 } +2024-07-25 20:11:20,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 884/ 1625], loss: 1.304, per_step_time: 1476ms, lr: 2.7946136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:20,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.41678 samples/s/p 4:58:14 } +2024-07-25 20:11:23,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 886/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.7942939e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:23,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43816 samples/s/p 4:57:00 } +2024-07-25 20:11:26,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 888/ 1625], loss: 1.280, per_step_time: 1473ms, lr: 
2.7939739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:26,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.42946 samples/s/p 4:57:26 } +2024-07-25 20:11:29,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 890/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.7936538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:29,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43492 samples/s/p 4:57:05 } +2024-07-25 20:11:32,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 892/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.7933336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:32,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43290 samples/s/p 4:57:09 } +2024-07-25 20:11:35,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 894/ 1625], loss: 1.138, per_step_time: 1469ms, lr: 2.7930128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:35,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.44319 samples/s/p 4:56:32 } +2024-07-25 20:11:37,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 896/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.7926919e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:37,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43247 samples/s/p 4:57:04 } +2024-07-25 20:11:40,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 898/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 2.7923708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:40,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43164 
samples/s/p 4:57:04 } +2024-07-25 20:11:43,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 900/ 1625], loss: 1.450, per_step_time: 1472ms, lr: 2.7920494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:43,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43453 samples/s/p 4:56:52 } +2024-07-25 20:11:46,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 902/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.7917278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:46,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43696 samples/s/p 4:56:41 } +2024-07-25 20:11:49,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 904/ 1625], loss: 1.411, per_step_time: 1472ms, lr: 2.791406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:49,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43334 samples/s/p 4:56:50 } +2024-07-25 20:11:52,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 906/ 1625], loss: 1.151, per_step_time: 1470ms, lr: 2.791084e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:52,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43964 samples/s/p 4:56:26 } +2024-07-25 20:11:55,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 908/ 1625], loss: 1.329, per_step_time: 1471ms, lr: 2.7907618e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:55,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43762 samples/s/p 4:56:30 } +2024-07-25 20:11:58,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 910/ 1625], loss: 1.191, per_step_time: 
1470ms, lr: 2.7904392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:58,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.44018 samples/s/p 4:56:18 } +2024-07-25 20:12:01,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 912/ 1625], loss: 1.255, per_step_time: 1473ms, lr: 2.7901167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:01,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.42915 samples/s/p 4:56:51 } +2024-07-25 20:12:04,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 914/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.7897937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:04,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43737 samples/s/p 4:56:22 } +2024-07-25 20:12:07,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 916/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.7894706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:07,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43169 samples/s/p 4:56:37 } +2024-07-25 20:12:10,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 918/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 2.7891474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:10,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43285 samples/s/p 4:56:31 } +2024-07-25 20:12:13,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 920/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 2.7888234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:13,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 
5.43959 samples/s/p 4:56:06 } +2024-07-25 20:12:16,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 922/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 2.7884998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:16,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43207 samples/s/p 4:56:27 } +2024-07-25 20:12:19,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 924/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 2.7881757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:19,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43809 samples/s/p 4:56:05 } +2024-07-25 20:12:22,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 926/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.7878514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:22,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43802 samples/s/p 4:56:02 } +2024-07-25 20:12:25,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 928/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 2.7875269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:25,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43592 samples/s/p 4:56:06 } +2024-07-25 20:12:28,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 930/ 1625], loss: 1.020, per_step_time: 1471ms, lr: 2.7872022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:28,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43665 samples/s/p 4:56:00 } +2024-07-25 20:12:31,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 932/ 1625], loss: 1.220, 
per_step_time: 1471ms, lr: 2.7868771e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:31,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43554 samples/s/p 4:56:01 } +2024-07-25 20:12:34,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 934/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 2.7865519e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:34,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43994 samples/s/p 4:55:44 } +2024-07-25 20:12:36,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 936/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 2.7862265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:36,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43821 samples/s/p 4:55:47 } +2024-07-25 20:12:39,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 938/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 2.7859009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:39,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43363 samples/s/p 4:55:59 } +2024-07-25 20:12:42,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 940/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.7855749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:42,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43798 samples/s/p 4:55:41 } +2024-07-25 20:12:45,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 942/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 2.7852488e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:45,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% 
|████████████ | 5.43577 samples/s/p 4:55:46 } +2024-07-25 20:12:48,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 944/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 2.7849223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:48,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43668 samples/s/p 4:55:40 } +2024-07-25 20:12:51,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 946/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 2.7845957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:51,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.44074 samples/s/p 4:55:24 } +2024-07-25 20:12:54,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 948/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 2.7842689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:54,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43159 samples/s/p 4:55:50 } +2024-07-25 20:12:57,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 950/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.7839418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:57,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43802 samples/s/p 4:55:27 } +2024-07-25 20:12:57,652 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 20:13:33,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 952/ 1625], loss: 1.211, per_step_time: 1813ms, lr: 2.7836148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:33,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 4.41132 samples/s/p 6:04:09 } +2024-07-25 20:13:35,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 954/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.783287e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:35,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43442 samples/s/p 4:55:32 } +2024-07-25 20:13:38,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 956/ 1625], loss: 1.364, per_step_time: 1472ms, lr: 2.7829592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:38,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43343 samples/s/p 4:55:33 } +2024-07-25 20:13:41,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 958/ 1625], loss: 1.083, per_step_time: 1470ms, lr: 2.7826314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:41,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43997 samples/s/p 4:55:08 } +2024-07-25 20:13:44,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 960/ 1625], loss: 1.353, per_step_time: 1471ms, lr: 2.7823033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:44,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43486 samples/s/p 4:55:22 } +2024-07-25 20:13:47,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 962/ 1625], loss: 1.129, per_step_time: 1470ms, lr: 
2.7819746e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:47,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43909 samples/s/p 4:55:05 } +2024-07-25 20:13:50,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 964/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 2.7816463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:50,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43198 samples/s/p 4:55:26 } +2024-07-25 20:13:53,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 966/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 2.7813174e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:53,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43667 samples/s/p 4:55:07 } +2024-07-25 20:13:56,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 968/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 2.780988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:56,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.43978 samples/s/p 4:54:54 } +2024-07-25 20:13:59,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 970/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.7806589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:59,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.43630 samples/s/p 4:55:03 } +2024-07-25 20:14:02,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 972/ 1625], loss: 1.335, per_step_time: 1472ms, lr: 2.7803293e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:02,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.43220 
samples/s/p 4:55:13 } +2024-07-25 20:14:05,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 974/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 2.7799997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:05,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.43231 samples/s/p 4:55:10 } +2024-07-25 20:14:08,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 976/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 2.7796697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:08,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.43353 samples/s/p 4:55:03 } +2024-07-25 20:14:11,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 978/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.7793394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:11,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.43456 samples/s/p 4:54:57 } +2024-07-25 20:14:14,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 980/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 2.7790089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:14,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.43675 samples/s/p 4:54:47 } +2024-07-25 20:14:17,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 982/ 1625], loss: 0.806, per_step_time: 1471ms, lr: 2.7786784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:17,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.43538 samples/s/p 4:54:48 } +2024-07-25 20:14:20,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 984/ 1625], loss: 1.072, 
per_step_time: 1471ms, lr: 2.7783473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:20,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43696 samples/s/p 4:54:40 } +2024-07-25 20:14:23,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 986/ 1625], loss: 1.046, per_step_time: 1470ms, lr: 2.7780163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:23,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43988 samples/s/p 4:54:28 } +2024-07-25 20:14:26,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 988/ 1625], loss: 1.323, per_step_time: 1471ms, lr: 2.7776849e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:26,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43701 samples/s/p 4:54:34 } +2024-07-25 20:14:29,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 990/ 1625], loss: 1.321, per_step_time: 1470ms, lr: 2.7773533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:29,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43950 samples/s/p 4:54:23 } +2024-07-25 20:14:32,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 992/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.7770213e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:32,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43112 samples/s/p 4:54:47 } +2024-07-25 20:14:35,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 994/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.7766893e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:35,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
26.1% |█████████████ | 5.43422 samples/s/p 4:54:34 } +2024-07-25 20:14:37,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 996/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 2.7763572e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:37,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43493 samples/s/p 4:54:29 } +2024-07-25 20:14:40,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 998/ 1625], loss: 0.991, per_step_time: 1470ms, lr: 2.7760247e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:40,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43884 samples/s/p 4:54:13 } +2024-07-25 20:14:43,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1000/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.7756918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:43,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43283 samples/s/p 4:54:30 } +2024-07-25 20:14:46,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1002/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 2.775359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:46,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43894 samples/s/p 4:54:07 } +2024-07-25 20:14:49,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1004/ 1625], loss: 1.410, per_step_time: 1470ms, lr: 2.775026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:49,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.44069 samples/s/p 4:53:58 } +2024-07-25 20:14:52,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 
1006/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 2.7746924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:52,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43995 samples/s/p 4:53:58 } +2024-07-25 20:14:55,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1008/ 1625], loss: 1.236, per_step_time: 1473ms, lr: 2.7743588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:55,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.42777 samples/s/p 4:54:35 } +2024-07-25 20:14:58,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1010/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 2.774025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:58,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43938 samples/s/p 4:53:54 } +2024-07-25 20:15:01,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1012/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 2.7736909e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:01,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43372 samples/s/p 4:54:09 } +2024-07-25 20:15:04,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1014/ 1625], loss: 1.027, per_step_time: 1470ms, lr: 2.7733566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:04,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43929 samples/s/p 4:53:48 } +2024-07-25 20:15:07,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1016/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 2.7730222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:07,459 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43104 samples/s/p 4:54:12 } +2024-07-25 20:15:10,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1018/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 2.7726874e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:10,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43414 samples/s/p 4:53:59 } +2024-07-25 20:15:13,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1020/ 1625], loss: 0.972, per_step_time: 1470ms, lr: 2.7723525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:13,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43983 samples/s/p 4:53:38 } +2024-07-25 20:15:16,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1022/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.7720173e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:16,310 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43433 samples/s/p 4:53:53 } +2024-07-25 20:15:19,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1024/ 1625], loss: 1.382, per_step_time: 1474ms, lr: 2.7716818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:19,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.42586 samples/s/p 4:54:17 } +2024-07-25 20:15:22,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1026/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 2.771346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:22,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43144 samples/s/p 4:53:56 } +2024-07-25 20:15:25,170 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1028/ 1625], loss: 1.029, per_step_time: 1472ms, lr: 2.7710103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:25,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43453 samples/s/p 4:53:43 } +2024-07-25 20:15:28,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1030/ 1625], loss: 1.203, per_step_time: 1473ms, lr: 2.7706741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:28,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43082 samples/s/p 4:53:52 } +2024-07-25 20:15:31,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1032/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 2.7703378e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:31,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.44181 samples/s/p 4:53:14 } +2024-07-25 20:15:34,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1034/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.7700013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:34,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43606 samples/s/p 4:53:29 } +2024-07-25 20:15:36,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1036/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 2.7696644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:36,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.44020 samples/s/p 4:53:13 } +2024-07-25 20:15:39,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1038/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 2.7693275e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:15:39,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43545 samples/s/p 4:53:25 } +2024-07-25 20:15:42,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1040/ 1625], loss: 1.193, per_step_time: 1474ms, lr: 2.7689903e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:42,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.42495 samples/s/p 4:53:57 } +2024-07-25 20:15:45,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1042/ 1625], loss: 0.997, per_step_time: 1471ms, lr: 2.7686527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:45,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43783 samples/s/p 4:53:12 } +2024-07-25 20:15:48,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1044/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 2.768315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:48,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.42967 samples/s/p 4:53:35 } +2024-07-25 20:15:51,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1046/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.7679771e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:51,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43633 samples/s/p 4:53:11 } +2024-07-25 20:15:54,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1048/ 1625], loss: 1.017, per_step_time: 1471ms, lr: 2.7676391e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:54,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43737 samples/s/p 4:53:04 
} +2024-07-25 20:15:57,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1050/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.7673008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:57,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43619 samples/s/p 4:53:05 } +2024-07-25 20:16:00,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1052/ 1625], loss: 1.420, per_step_time: 1472ms, lr: 2.766962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:00,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43332 samples/s/p 4:53:12 } +2024-07-25 20:16:03,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1054/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.7666232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:03,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43826 samples/s/p 4:52:53 } +2024-07-25 20:16:06,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1056/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.766284e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:06,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43015 samples/s/p 4:53:16 } +2024-07-25 20:16:09,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1058/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.765945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:09,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43810 samples/s/p 4:52:47 } +2024-07-25 20:16:12,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1060/ 1625], loss: 1.163, per_step_time: 1473ms, lr: 
2.7656057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:12,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.42843 samples/s/p 4:53:16 } +2024-07-25 20:16:15,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1062/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 2.7652659e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:15,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43197 samples/s/p 4:53:01 } +2024-07-25 20:16:18,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1064/ 1625], loss: 1.122, per_step_time: 1473ms, lr: 2.764926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:18,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43004 samples/s/p 4:53:05 } +2024-07-25 20:16:21,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1066/ 1625], loss: 1.355, per_step_time: 1471ms, lr: 2.764586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:21,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43680 samples/s/p 4:52:40 } +2024-07-25 20:16:24,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1068/ 1625], loss: 1.314, per_step_time: 1473ms, lr: 2.7642454e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:24,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.42952 samples/s/p 4:53:00 } +2024-07-25 20:16:27,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1070/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 2.763905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:27,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 
5.43717 samples/s/p 4:52:33 } +2024-07-25 20:16:30,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1072/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.763564e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:30,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43204 samples/s/p 4:52:46 } +2024-07-25 20:16:33,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1074/ 1625], loss: 1.086, per_step_time: 1481ms, lr: 2.7632228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:33,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.39821 samples/s/p 4:54:34 } +2024-07-25 20:16:36,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1076/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 2.7628816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:36,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43452 samples/s/p 4:52:32 } +2024-07-25 20:16:38,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1078/ 1625], loss: 1.014, per_step_time: 1471ms, lr: 2.7625401e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:38,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43790 samples/s/p 4:52:19 } +2024-07-25 20:16:41,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1080/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 2.7621985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:41,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43717 samples/s/p 4:52:18 } +2024-07-25 20:16:44,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1082/ 1625], loss: 
1.135, per_step_time: 1471ms, lr: 2.7618566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:44,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.43640 samples/s/p 4:52:18 } +2024-07-25 20:16:47,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1084/ 1625], loss: 1.050, per_step_time: 1473ms, lr: 2.7615144e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:47,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.43005 samples/s/p 4:52:35 } +2024-07-25 20:16:50,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1086/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 2.7611719e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:50,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.44020 samples/s/p 4:51:59 } +2024-07-25 20:16:53,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1088/ 1625], loss: 1.078, per_step_time: 1474ms, lr: 2.7608294e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:53,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.42635 samples/s/p 4:52:41 } +2024-07-25 20:16:56,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1090/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 2.7604865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:56,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.43694 samples/s/p 4:52:04 } +2024-07-25 20:16:59,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1092/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 2.7601433e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:59,639 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 26.7% |█████████████ | 5.43510 samples/s/p 4:52:07 } +2024-07-25 20:17:02,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1094/ 1625], loss: 1.117, per_step_time: 1475ms, lr: 2.7598004e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:02,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.42252 samples/s/p 4:52:45 } +2024-07-25 20:17:05,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1096/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 2.7594568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:05,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.43479 samples/s/p 4:52:02 } +2024-07-25 20:17:08,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1098/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 2.759113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:08,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43471 samples/s/p 4:51:59 } +2024-07-25 20:17:11,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1100/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 2.758769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:11,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43736 samples/s/p 4:51:48 } +2024-07-25 20:17:14,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1102/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 2.7584249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:14,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43138 samples/s/p 4:52:04 } +2024-07-25 20:17:17,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], 
step:[ 1104/ 1625], loss: 1.382, per_step_time: 1471ms, lr: 2.7580805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:17,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43576 samples/s/p 4:51:47 } +2024-07-25 20:17:20,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1106/ 1625], loss: 1.127, per_step_time: 1483ms, lr: 2.7577358e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:20,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.39376 samples/s/p 4:54:01 } +2024-07-25 20:17:23,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1108/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 2.7573911e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:23,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43113 samples/s/p 4:51:56 } +2024-07-25 20:17:26,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1110/ 1625], loss: 1.201, per_step_time: 1471ms, lr: 2.7570459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:26,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43693 samples/s/p 4:51:35 } +2024-07-25 20:17:29,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1112/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 2.7567006e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:29,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43614 samples/s/p 4:51:34 } +2024-07-25 20:17:32,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1114/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 2.756355e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:32,131 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.43695 samples/s/p 4:51:29 } +2024-07-25 20:17:35,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1116/ 1625], loss: 1.316, per_step_time: 1470ms, lr: 2.7560092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:35,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.44137 samples/s/p 4:51:12 } +2024-07-25 20:17:38,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1118/ 1625], loss: 1.126, per_step_time: 1473ms, lr: 2.7556633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:38,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.43104 samples/s/p 4:51:42 } +2024-07-25 20:17:40,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1120/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 2.7553173e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:40,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.43290 samples/s/p 4:51:33 } +2024-07-25 20:17:43,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1122/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 2.7549708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:43,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.42755 samples/s/p 4:51:47 } +2024-07-25 20:17:46,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1124/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.754624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:46,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.43041 samples/s/p 4:51:35 } +2024-07-25 20:17:49,847 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1126/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 2.7542774e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:49,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.42991 samples/s/p 4:51:34 } +2024-07-25 20:17:52,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1128/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.7539303e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:52,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.43430 samples/s/p 4:51:17 } +2024-07-25 20:17:55,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1130/ 1625], loss: 1.198, per_step_time: 1470ms, lr: 2.7535827e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:55,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43982 samples/s/p 4:50:56 } +2024-07-25 20:17:58,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1132/ 1625], loss: 1.112, per_step_time: 1469ms, lr: 2.7532353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:58,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.44308 samples/s/p 4:50:43 } +2024-07-25 20:18:01,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1134/ 1625], loss: 1.421, per_step_time: 1471ms, lr: 2.7528875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:01,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43786 samples/s/p 4:50:56 } +2024-07-25 20:18:04,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1136/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.7525399e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:18:04,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43390 samples/s/p 4:51:06 } +2024-07-25 20:18:07,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1138/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 2.7521915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:07,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43411 samples/s/p 4:51:03 } +2024-07-25 20:18:10,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1140/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.751843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:10,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43562 samples/s/p 4:50:55 } +2024-07-25 20:18:13,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1142/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 2.7514943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:13,448 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43679 samples/s/p 4:50:48 } +2024-07-25 20:18:16,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1144/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.7511456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:16,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43277 samples/s/p 4:50:58 } +2024-07-25 20:18:19,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1146/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 2.7507964e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:19,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.44029 samples/s/p 4:50:31 
} +2024-07-25 20:18:22,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1148/ 1625], loss: 1.348, per_step_time: 1471ms, lr: 2.7504475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:22,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43528 samples/s/p 4:50:44 } +2024-07-25 20:18:25,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1150/ 1625], loss: 1.358, per_step_time: 1473ms, lr: 2.7500977e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:25,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43103 samples/s/p 4:50:55 } +2024-07-25 20:18:28,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1152/ 1625], loss: 1.253, per_step_time: 1470ms, lr: 2.7497483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:28,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.44120 samples/s/p 4:50:19 } +2024-07-25 20:18:31,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1154/ 1625], loss: 1.227, per_step_time: 1470ms, lr: 2.749398e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:31,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.44129 samples/s/p 4:50:16 } +2024-07-25 20:18:34,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1156/ 1625], loss: 1.280, per_step_time: 1470ms, lr: 2.7490478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:34,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43993 samples/s/p 4:50:17 } +2024-07-25 20:18:37,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1158/ 1625], loss: 1.337, per_step_time: 1473ms, lr: 
2.7486976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:37,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.42949 samples/s/p 4:50:48 } +2024-07-25 20:18:40,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1160/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 2.7483471e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:40,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43803 samples/s/p 4:50:18 } +2024-07-25 20:18:42,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1162/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.7479962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:42,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43320 samples/s/p 4:50:30 } +2024-07-25 20:18:45,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1164/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 2.747645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:45,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43033 samples/s/p 4:50:36 } +2024-07-25 20:18:48,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1166/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.7472937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:48,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43537 samples/s/p 4:50:17 } +2024-07-25 20:18:51,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1168/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 2.7469421e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:51,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 
5.42798 samples/s/p 4:50:38 } +2024-07-25 20:18:54,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1170/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 2.7465905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:54,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43622 samples/s/p 4:50:09 } +2024-07-25 20:18:57,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1172/ 1625], loss: 1.286, per_step_time: 1475ms, lr: 2.7462385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:57,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.42321 samples/s/p 4:50:47 } +2024-07-25 20:19:00,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1174/ 1625], loss: 1.341, per_step_time: 1473ms, lr: 2.7458864e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:00,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43024 samples/s/p 4:50:22 } +2024-07-25 20:19:03,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1176/ 1625], loss: 1.062, per_step_time: 1473ms, lr: 2.745534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:03,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.42859 samples/s/p 4:50:24 } +2024-07-25 20:19:06,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1178/ 1625], loss: 1.042, per_step_time: 1472ms, lr: 2.7451813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:06,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43119 samples/s/p 4:50:13 } +2024-07-25 20:19:09,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1180/ 1625], loss: 
1.292, per_step_time: 1472ms, lr: 2.7448285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:09,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43435 samples/s/p 4:50:00 } +2024-07-25 20:19:12,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1182/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.7444756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:12,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43178 samples/s/p 4:50:05 } +2024-07-25 20:19:15,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1184/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 2.7441221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:15,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43606 samples/s/p 4:49:49 } +2024-07-25 20:19:18,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1186/ 1625], loss: 1.384, per_step_time: 1471ms, lr: 2.7437689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:18,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43664 samples/s/p 4:49:44 } +2024-07-25 20:19:21,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1188/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 2.7434153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:21,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43727 samples/s/p 4:49:39 } +2024-07-25 20:19:24,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1190/ 1625], loss: 1.260, per_step_time: 1469ms, lr: 2.7430611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:24,284 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 27.3% |█████████████ | 5.44233 samples/s/p 4:49:20 } +2024-07-25 20:19:27,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1192/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.742707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:27,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43158 samples/s/p 4:49:51 } +2024-07-25 20:19:30,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1194/ 1625], loss: 1.374, per_step_time: 1473ms, lr: 2.7423526e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:30,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43006 samples/s/p 4:49:53 } +2024-07-25 20:19:33,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1196/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.7419981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:33,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43255 samples/s/p 4:49:42 } +2024-07-25 20:19:36,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1198/ 1625], loss: 1.360, per_step_time: 1474ms, lr: 2.7416432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:36,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.42633 samples/s/p 4:49:59 } +2024-07-25 20:19:39,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1200/ 1625], loss: 1.175, per_step_time: 1473ms, lr: 2.7412882e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:39,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43099 samples/s/p 4:49:41 } +2024-07-25 20:19:42,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], 
step:[ 1202/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 2.740933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:42,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43507 samples/s/p 4:49:25 } +2024-07-25 20:19:44,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1204/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.7405775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:44,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43590 samples/s/p 4:49:20 } +2024-07-25 20:19:47,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1206/ 1625], loss: 1.005, per_step_time: 1472ms, lr: 2.7402219e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:47,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43192 samples/s/p 4:49:29 } +2024-07-25 20:19:50,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1208/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 2.7398659e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:50,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43403 samples/s/p 4:49:20 } +2024-07-25 20:19:53,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1210/ 1625], loss: 1.316, per_step_time: 1473ms, lr: 2.7395097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:53,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.42973 samples/s/p 4:49:31 } +2024-07-25 20:19:56,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1212/ 1625], loss: 0.947, per_step_time: 1471ms, lr: 2.7391534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:56,761 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43765 samples/s/p 4:49:02 } +2024-07-25 20:19:59,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1214/ 1625], loss: 1.312, per_step_time: 1473ms, lr: 2.7387967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:59,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.42770 samples/s/p 4:49:31 } +2024-07-25 20:20:02,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1216/ 1625], loss: 0.958, per_step_time: 1469ms, lr: 2.73844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:02,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.44460 samples/s/p 4:48:34 } +2024-07-25 20:20:05,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1218/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.7380831e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:05,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43611 samples/s/p 4:48:58 } +2024-07-25 20:20:08,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1220/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.7377257e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:08,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43750 samples/s/p 4:48:51 } +2024-07-25 20:20:11,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1222/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 2.7373682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:11,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43310 samples/s/p 4:49:02 } +2024-07-25 20:20:14,465 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1224/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 2.7370106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:14,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43688 samples/s/p 4:48:47 } +2024-07-25 20:20:17,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1226/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 2.7366526e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:17,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43229 samples/s/p 4:48:59 } +2024-07-25 20:20:20,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1228/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 2.7362947e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:20,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43578 samples/s/p 4:48:45 } +2024-07-25 20:20:23,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1230/ 1625], loss: 1.338, per_step_time: 1469ms, lr: 2.7359361e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:23,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.44302 samples/s/p 4:48:19 } +2024-07-25 20:20:26,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1232/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 2.7355776e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:26,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43291 samples/s/p 4:48:48 } +2024-07-25 20:20:29,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1234/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 2.735219e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:20:29,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43899 samples/s/p 4:48:26 } +2024-07-25 20:20:32,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1236/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 2.73486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:32,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43598 samples/s/p 4:48:32 } +2024-07-25 20:20:35,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1238/ 1625], loss: 1.128, per_step_time: 1474ms, lr: 2.734501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:35,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.42688 samples/s/p 4:48:58 } +2024-07-25 20:20:38,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1240/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 2.7341417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:38,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43408 samples/s/p 4:48:32 } +2024-07-25 20:20:41,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1242/ 1625], loss: 1.274, per_step_time: 1471ms, lr: 2.733782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:41,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43726 samples/s/p 4:48:19 } +2024-07-25 20:20:43,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1244/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 2.7334221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:43,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43247 samples/s/p 4:48:32 } 
+2024-07-25 20:20:46,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1246/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.733062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:46,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43643 samples/s/p 4:48:16 } +2024-07-25 20:20:49,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1248/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 2.7327018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:49,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43082 samples/s/p 4:48:31 } +2024-07-25 20:20:52,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1250/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.732341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:52,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43223 samples/s/p 4:48:24 } +2024-07-25 20:20:55,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1252/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.7319802e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:55,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43789 samples/s/p 4:48:03 } +2024-07-25 20:20:58,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1254/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 2.7316195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:58,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43474 samples/s/p 4:48:10 } +2024-07-25 20:21:01,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1256/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 
2.7312582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:01,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43658 samples/s/p 4:48:01 } +2024-07-25 20:21:04,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1258/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.7308968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:04,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43764 samples/s/p 4:47:55 } +2024-07-25 20:21:07,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1260/ 1625], loss: 1.322, per_step_time: 1470ms, lr: 2.7305352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:07,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.44016 samples/s/p 4:47:44 } +2024-07-25 20:21:10,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1262/ 1625], loss: 0.940, per_step_time: 1470ms, lr: 2.7301734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:10,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.44001 samples/s/p 4:47:41 } +2024-07-25 20:21:13,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1264/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 2.7298112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:13,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.43915 samples/s/p 4:47:41 } +2024-07-25 20:21:16,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1266/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.729449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:16,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 
5.43769 samples/s/p 4:47:43 } +2024-07-25 20:21:19,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1268/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 2.729087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:19,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.43813 samples/s/p 4:47:38 } +2024-07-25 20:21:22,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1270/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.728724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:22,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.43340 samples/s/p 4:47:50 } +2024-07-25 20:21:25,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1272/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 2.7283611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:25,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.43604 samples/s/p 4:47:39 } +2024-07-25 20:21:28,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1274/ 1625], loss: 1.105, per_step_time: 1482ms, lr: 2.727998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:28,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.39494 samples/s/p 4:49:48 } +2024-07-25 20:21:31,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1276/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 2.7276346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:31,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43553 samples/s/p 4:47:35 } +2024-07-25 20:21:34,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1278/ 1625], loss: 1.097, 
per_step_time: 1471ms, lr: 2.7272712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:34,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43499 samples/s/p 4:47:34 } +2024-07-25 20:21:37,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1280/ 1625], loss: 1.093, per_step_time: 1472ms, lr: 2.7269074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:37,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43396 samples/s/p 4:47:34 } +2024-07-25 20:21:40,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1282/ 1625], loss: 0.872, per_step_time: 1471ms, lr: 2.7265432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:40,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43757 samples/s/p 4:47:20 } +2024-07-25 20:21:43,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1284/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 2.7261793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:43,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43695 samples/s/p 4:47:19 } +2024-07-25 20:21:45,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1286/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.725815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:45,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43195 samples/s/p 4:47:32 } +2024-07-25 20:21:48,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1288/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 2.7254502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:48,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
27.9% |█████████████ | 5.43082 samples/s/p 4:47:32 } +2024-07-25 20:21:51,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1290/ 1625], loss: 1.158, per_step_time: 1470ms, lr: 2.7250853e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:51,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.44117 samples/s/p 4:46:56 } +2024-07-25 20:21:54,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1292/ 1625], loss: 1.108, per_step_time: 1474ms, lr: 2.72472e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:54,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.42699 samples/s/p 4:47:38 } +2024-07-25 20:21:57,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1294/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 2.7243548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:57,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.43169 samples/s/p 4:47:21 } +2024-07-25 20:22:00,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1296/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.7239892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:00,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.43487 samples/s/p 4:47:08 } +2024-07-25 20:22:03,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1298/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 2.7236234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:03,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.43974 samples/s/p 4:46:49 } +2024-07-25 20:22:06,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 
1300/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 2.7232578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:06,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.43427 samples/s/p 4:47:04 } +2024-07-25 20:22:09,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1302/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 2.7228914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:09,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.43791 samples/s/p 4:46:49 } +2024-07-25 20:22:12,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1304/ 1625], loss: 1.342, per_step_time: 1476ms, lr: 2.7225251e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:12,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.41771 samples/s/p 4:47:50 } +2024-07-25 20:22:15,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1306/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 2.7221586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:15,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.43559 samples/s/p 4:46:50 } +2024-07-25 20:22:18,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1308/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.7217915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:18,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.43394 samples/s/p 4:46:53 } +2024-07-25 20:22:21,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1310/ 1625], loss: 1.328, per_step_time: 1471ms, lr: 2.7214248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:21,384 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43574 samples/s/p 4:46:44 } +2024-07-25 20:22:24,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1312/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 2.7210575e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:24,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43364 samples/s/p 4:46:48 } +2024-07-25 20:22:27,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1314/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 2.7206897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:27,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43988 samples/s/p 4:46:25 } +2024-07-25 20:22:30,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1316/ 1625], loss: 1.173, per_step_time: 1474ms, lr: 2.7203223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:30,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.42438 samples/s/p 4:47:11 } +2024-07-25 20:22:33,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1318/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 2.7199543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:33,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43727 samples/s/p 4:46:28 } +2024-07-25 20:22:36,140 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1320/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 2.7195862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:36,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43765 samples/s/p 4:46:23 } +2024-07-25 20:22:39,093 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1322/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 2.7192178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:39,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43286 samples/s/p 4:46:36 } +2024-07-25 20:22:42,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1324/ 1625], loss: 1.350, per_step_time: 1473ms, lr: 2.7188493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:42,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.42768 samples/s/p 4:46:49 } +2024-07-25 20:22:44,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1326/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 2.7184808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:44,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43769 samples/s/p 4:46:14 } +2024-07-25 20:22:47,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1328/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 2.7181119e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:47,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43834 samples/s/p 4:46:09 } +2024-07-25 20:22:50,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1330/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 2.7177426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:50,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43400 samples/s/p 4:46:20 } +2024-07-25 20:22:53,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1332/ 1625], loss: 1.136, per_step_time: 1470ms, lr: 2.7173732e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:53,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.44098 samples/s/p 4:45:55 } +2024-07-25 20:22:56,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1334/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 2.7170036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:56,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43803 samples/s/p 4:46:02 } +2024-07-25 20:22:59,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1336/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 2.7166338e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:59,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43639 samples/s/p 4:46:04 } +2024-07-25 20:23:02,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1338/ 1625], loss: 1.249, per_step_time: 1473ms, lr: 2.7162638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:02,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.42765 samples/s/p 4:46:29 } +2024-07-25 20:23:05,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1340/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 2.7158934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:05,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43750 samples/s/p 4:45:54 } +2024-07-25 20:23:08,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1342/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.7155229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:08,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43765 
samples/s/p 4:45:51 } +2024-07-25 20:23:11,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1344/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 2.7151524e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:11,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43726 samples/s/p 4:45:49 } +2024-07-25 20:23:14,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1346/ 1625], loss: 0.929, per_step_time: 1471ms, lr: 2.7147813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:14,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43549 samples/s/p 4:45:52 } +2024-07-25 20:23:17,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1348/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 2.7144102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:17,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43554 samples/s/p 4:45:49 } +2024-07-25 20:23:20,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1350/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.7140388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:20,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43382 samples/s/p 4:45:51 } +2024-07-25 20:23:23,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1352/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 2.7136673e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:23,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43458 samples/s/p 4:45:46 } +2024-07-25 20:23:26,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1354/ 1625], loss: 1.323, 
per_step_time: 1471ms, lr: 2.7132955e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:26,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43684 samples/s/p 4:45:36 } +2024-07-25 20:23:29,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1356/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 2.7129236e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:29,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43201 samples/s/p 4:45:48 } +2024-07-25 20:23:32,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1358/ 1625], loss: 1.182, per_step_time: 1470ms, lr: 2.7125512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:32,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.44092 samples/s/p 4:45:17 } +2024-07-25 20:23:35,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1360/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 2.712179e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:35,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.43081 samples/s/p 4:45:46 } +2024-07-25 20:23:38,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1362/ 1625], loss: 1.262, per_step_time: 1473ms, lr: 2.7118065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:38,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.43086 samples/s/p 4:45:43 } +2024-07-25 20:23:41,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1364/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 2.7114334e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:41,070 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 28.4% |██████████████ | 5.43122 samples/s/p 4:45:39 } +2024-07-25 20:23:44,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1366/ 1625], loss: 1.283, per_step_time: 1473ms, lr: 2.7110606e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:44,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.42896 samples/s/p 4:45:43 } +2024-07-25 20:23:46,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1368/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.7106873e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:46,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.43252 samples/s/p 4:45:29 } +2024-07-25 20:23:49,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1370/ 1625], loss: 1.202, per_step_time: 1481ms, lr: 2.7103139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:49,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.40044 samples/s/p 4:47:08 } +2024-07-25 20:23:52,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1372/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 2.70994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:52,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.43677 samples/s/p 4:45:10 } +2024-07-25 20:23:55,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1374/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.709566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:55,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43646 samples/s/p 4:45:08 } +2024-07-25 20:23:58,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 
10], step:[ 1376/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 2.7091919e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:58,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.42968 samples/s/p 4:45:26 } +2024-07-25 20:24:01,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1378/ 1625], loss: 1.026, per_step_time: 1471ms, lr: 2.7088177e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:01,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43589 samples/s/p 4:45:04 } +2024-07-25 20:24:04,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1380/ 1625], loss: 1.158, per_step_time: 1484ms, lr: 2.7084432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:04,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.38744 samples/s/p 4:47:34 } +2024-07-25 20:24:07,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1382/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 2.7080683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:07,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43395 samples/s/p 4:45:04 } +2024-07-25 20:24:10,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1384/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 2.7076932e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:10,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43464 samples/s/p 4:44:59 } +2024-07-25 20:24:13,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1386/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.7073182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:13,583 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43600 samples/s/p 4:44:51 } +2024-07-25 20:24:16,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1388/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.7069427e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:16,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43264 samples/s/p 4:44:59 } +2024-07-25 20:24:19,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1390/ 1625], loss: 1.202, per_step_time: 1473ms, lr: 2.706567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:19,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43103 samples/s/p 4:45:01 } +2024-07-25 20:24:22,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1392/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 2.7061913e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:22,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43064 samples/s/p 4:45:00 } +2024-07-25 20:24:25,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1394/ 1625], loss: 1.308, per_step_time: 1474ms, lr: 2.7058151e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:25,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.42649 samples/s/p 4:45:10 } +2024-07-25 20:24:28,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1396/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 2.705439e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:28,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43481 samples/s/p 4:44:41 } +2024-07-25 20:24:31,304 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1398/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 2.7050624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:31,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43046 samples/s/p 4:44:51 } +2024-07-25 20:24:34,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1400/ 1625], loss: 1.187, per_step_time: 1470ms, lr: 2.7046857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:34,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43995 samples/s/p 4:44:18 } +2024-07-25 20:24:37,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1402/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 2.7043088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:37,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43544 samples/s/p 4:44:30 } +2024-07-25 20:24:40,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1404/ 1625], loss: 1.051, per_step_time: 1470ms, lr: 2.7039318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:40,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43876 samples/s/p 4:44:16 } +2024-07-25 20:24:43,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1406/ 1625], loss: 1.244, per_step_time: 1473ms, lr: 2.7035543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:43,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.42880 samples/s/p 4:44:45 } +2024-07-25 20:24:46,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1408/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 2.703177e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:24:46,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43182 samples/s/p 4:44:32 } +2024-07-25 20:24:49,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1410/ 1625], loss: 1.049, per_step_time: 1473ms, lr: 2.702799e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:49,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.42767 samples/s/p 4:44:42 } +2024-07-25 20:24:51,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1412/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 2.7024213e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:51,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43322 samples/s/p 4:44:22 } +2024-07-25 20:24:54,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1414/ 1625], loss: 1.319, per_step_time: 1471ms, lr: 2.702043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:54,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43833 samples/s/p 4:44:03 } +2024-07-25 20:24:57,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1416/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 2.7016647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:57,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43581 samples/s/p 4:44:08 } +2024-07-25 20:25:00,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1418/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.7012862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:00,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43688 samples/s/p 
4:44:02 } +2024-07-25 20:25:03,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1420/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 2.7009073e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:03,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43060 samples/s/p 4:44:18 } +2024-07-25 20:25:06,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1422/ 1625], loss: 1.319, per_step_time: 1472ms, lr: 2.7005282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:06,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43345 samples/s/p 4:44:07 } +2024-07-25 20:25:09,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1424/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 2.700149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:09,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43427 samples/s/p 4:44:01 } +2024-07-25 20:25:12,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1426/ 1625], loss: 1.124, per_step_time: 1470ms, lr: 2.6997694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:12,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43904 samples/s/p 4:43:43 } +2024-07-25 20:25:15,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1428/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 2.6993897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:15,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43215 samples/s/p 4:44:02 } +2024-07-25 20:25:18,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1430/ 1625], loss: 1.155, 
per_step_time: 1471ms, lr: 2.69901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:18,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43621 samples/s/p 4:43:46 } +2024-07-25 20:25:21,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1432/ 1625], loss: 1.159, per_step_time: 1475ms, lr: 2.69863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:21,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.42195 samples/s/p 4:44:28 } +2024-07-25 20:25:24,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1434/ 1625], loss: 1.324, per_step_time: 1472ms, lr: 2.6982496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:24,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43290 samples/s/p 4:43:51 } +2024-07-25 20:25:27,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1436/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 2.697869e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:27,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.42855 samples/s/p 4:44:01 } +2024-07-25 20:25:30,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1438/ 1625], loss: 1.206, per_step_time: 1470ms, lr: 2.6974883e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:30,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.44098 samples/s/p 4:43:19 } +2024-07-25 20:25:33,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1440/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 2.6971074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:33,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 28.9% |██████████████ | 5.43332 samples/s/p 4:43:40 } +2024-07-25 20:25:36,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1442/ 1625], loss: 1.039, per_step_time: 1471ms, lr: 2.6967262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:36,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43765 samples/s/p 4:43:24 } +2024-07-25 20:25:39,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1444/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 2.6963447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:39,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43196 samples/s/p 4:43:39 } +2024-07-25 20:25:42,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1446/ 1625], loss: 1.299, per_step_time: 1472ms, lr: 2.6959635e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:42,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43274 samples/s/p 4:43:33 } +2024-07-25 20:25:45,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1448/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 2.6955817e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:45,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43561 samples/s/p 4:43:21 } +2024-07-25 20:25:48,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1450/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.6951997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:48,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43669 samples/s/p 4:43:15 } +2024-07-25 20:25:50,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], 
step:[ 1452/ 1625], loss: 1.267, per_step_time: 1470ms, lr: 2.6948175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:50,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.44044 samples/s/p 4:43:00 } +2024-07-25 20:25:53,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1454/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 2.6944352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:53,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43648 samples/s/p 4:43:10 } +2024-07-25 20:25:56,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1456/ 1625], loss: 1.285, per_step_time: 1469ms, lr: 2.6940525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:56,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.44304 samples/s/p 4:42:46 } +2024-07-25 20:25:59,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1458/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.6936696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:59,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43268 samples/s/p 4:43:16 } +2024-07-25 20:26:02,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1460/ 1625], loss: 1.337, per_step_time: 1471ms, lr: 2.6932865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:02,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43628 samples/s/p 4:43:02 } +2024-07-25 20:26:05,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1462/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 2.6929032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:05,745 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43846 samples/s/p 4:42:52 } +2024-07-25 20:26:08,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1464/ 1625], loss: 1.191, per_step_time: 1474ms, lr: 2.69252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:08,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.42708 samples/s/p 4:43:25 } +2024-07-25 20:26:11,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1466/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 2.6921361e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:11,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.42957 samples/s/p 4:43:14 } +2024-07-25 20:26:14,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1468/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 2.6917522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:14,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43464 samples/s/p 4:42:55 } +2024-07-25 20:26:17,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1470/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 2.691368e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:17,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43427 samples/s/p 4:42:53 } +2024-07-25 20:26:20,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1472/ 1625], loss: 1.258, per_step_time: 1473ms, lr: 2.6909836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:20,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43086 samples/s/p 4:43:01 } +2024-07-25 20:26:23,460 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1474/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 2.6905991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:23,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43697 samples/s/p 4:42:39 } +2024-07-25 20:26:26,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1476/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 2.6902144e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:26,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43335 samples/s/p 4:42:47 } +2024-07-25 20:26:29,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1478/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 2.6898295e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:29,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43127 samples/s/p 4:42:51 } +2024-07-25 20:26:32,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1480/ 1625], loss: 1.109, per_step_time: 1469ms, lr: 2.6894442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:32,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.44298 samples/s/p 4:42:11 } +2024-07-25 20:26:35,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1482/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.689059e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:35,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43504 samples/s/p 4:42:33 } +2024-07-25 20:26:38,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1484/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 2.6886732e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:26:38,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43486 samples/s/p 4:42:31 } +2024-07-25 20:26:41,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1486/ 1625], loss: 1.278, per_step_time: 1470ms, lr: 2.6882875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:41,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43955 samples/s/p 4:42:13 } +2024-07-25 20:26:44,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1488/ 1625], loss: 1.294, per_step_time: 1472ms, lr: 2.6879015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:44,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43429 samples/s/p 4:42:27 } +2024-07-25 20:26:47,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1490/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 2.6875154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:47,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43397 samples/s/p 4:42:25 } +2024-07-25 20:26:50,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1492/ 1625], loss: 1.266, per_step_time: 1473ms, lr: 2.687129e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:50,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43003 samples/s/p 4:42:34 } +2024-07-25 20:26:52,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1494/ 1625], loss: 1.088, per_step_time: 1471ms, lr: 2.6867421e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:52,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43653 samples/s/p 
4:42:11 } +2024-07-25 20:26:55,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1496/ 1625], loss: 1.056, per_step_time: 1470ms, lr: 2.6863554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:55,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43987 samples/s/p 4:41:58 } +2024-07-25 20:26:58,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1498/ 1625], loss: 1.029, per_step_time: 1472ms, lr: 2.6859683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:58,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43389 samples/s/p 4:42:13 } +2024-07-25 20:27:01,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1500/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 2.685581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:01,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43718 samples/s/p 4:42:00 } +2024-07-25 20:27:04,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1502/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 2.6851938e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:04,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43626 samples/s/p 4:42:00 } +2024-07-25 20:27:07,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1504/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 2.6848062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:07,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43361 samples/s/p 4:42:05 } +2024-07-25 20:27:10,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1506/ 1625], loss: 1.120, 
per_step_time: 1471ms, lr: 2.6844182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:10,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43599 samples/s/p 4:41:55 } +2024-07-25 20:27:13,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1508/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 2.68403e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:13,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43740 samples/s/p 4:41:48 } +2024-07-25 20:27:16,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1510/ 1625], loss: 1.010, per_step_time: 1473ms, lr: 2.6836418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:16,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43025 samples/s/p 4:42:07 } +2024-07-25 20:27:19,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1512/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.6832533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:19,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43239 samples/s/p 4:41:57 } +2024-07-25 20:27:22,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1514/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 2.6828646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:22,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43591 samples/s/p 4:41:43 } +2024-07-25 20:27:25,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1516/ 1625], loss: 1.383, per_step_time: 1469ms, lr: 2.6824755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:25,426 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 29.3% |██████████████ | 5.44341 samples/s/p 4:41:17 } +2024-07-25 20:27:28,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1518/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 2.6820864e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:28,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43850 samples/s/p 4:41:29 } +2024-07-25 20:27:31,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1520/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 2.6816972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:31,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.43167 samples/s/p 4:41:48 } +2024-07-25 20:27:34,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1522/ 1625], loss: 1.282, per_step_time: 1473ms, lr: 2.6813075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:34,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.42901 samples/s/p 4:41:53 } +2024-07-25 20:27:37,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1524/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 2.6809177e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:37,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.42784 samples/s/p 4:41:54 } +2024-07-25 20:27:40,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1526/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.6805277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:40,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.43348 samples/s/p 4:41:33 } +2024-07-25 20:27:43,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 
10], step:[ 1528/ 1625], loss: 1.012, per_step_time: 1470ms, lr: 2.6801375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:43,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.44020 samples/s/p 4:41:09 } +2024-07-25 20:27:46,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1530/ 1625], loss: 1.238, per_step_time: 1473ms, lr: 2.679747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:46,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.42875 samples/s/p 4:41:42 } +2024-07-25 20:27:49,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1532/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 2.6793565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:49,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.43456 samples/s/p 4:41:21 } +2024-07-25 20:27:51,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1534/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 2.6789658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:51,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.43530 samples/s/p 4:41:16 } +2024-07-25 20:27:54,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1536/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 2.6785747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:54,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43261 samples/s/p 4:41:21 } +2024-07-25 20:27:57,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1538/ 1625], loss: 1.277, per_step_time: 1474ms, lr: 2.6781836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:57,904 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.42503 samples/s/p 4:41:42 } +2024-07-25 20:28:00,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1540/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.6777923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:00,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43763 samples/s/p 4:41:00 } +2024-07-25 20:28:03,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1542/ 1625], loss: 1.245, per_step_time: 1470ms, lr: 2.6774005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:03,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43951 samples/s/p 4:40:51 } +2024-07-25 20:28:06,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1544/ 1625], loss: 1.035, per_step_time: 1470ms, lr: 2.6770087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:06,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43875 samples/s/p 4:40:50 } +2024-07-25 20:28:09,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1546/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 2.6766167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:09,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43249 samples/s/p 4:41:07 } +2024-07-25 20:28:12,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1548/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 2.6762244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:12,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43335 samples/s/p 4:41:01 } +2024-07-25 20:28:15,607 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1550/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 2.675832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:15,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43427 samples/s/p 4:40:55 } +2024-07-25 20:28:18,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1552/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 2.6754393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:18,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43737 samples/s/p 4:40:43 } +2024-07-25 20:28:21,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1554/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 2.6750464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:21,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.42956 samples/s/p 4:41:04 } +2024-07-25 20:28:24,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1556/ 1625], loss: 1.202, per_step_time: 1470ms, lr: 2.6746531e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:24,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43911 samples/s/p 4:40:32 } +2024-07-25 20:28:27,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1558/ 1625], loss: 1.379, per_step_time: 1471ms, lr: 2.67426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:27,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43599 samples/s/p 4:40:38 } +2024-07-25 20:28:30,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1560/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 2.6738662e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:28:30,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43815 samples/s/p 4:40:29 } +2024-07-25 20:28:33,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1562/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 2.6734724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:33,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43972 samples/s/p 4:40:21 } +2024-07-25 20:28:36,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1564/ 1625], loss: 1.164, per_step_time: 1470ms, lr: 2.6730788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:36,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43959 samples/s/p 4:40:18 } +2024-07-25 20:28:39,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1566/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 2.6726846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:39,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43581 samples/s/p 4:40:27 } +2024-07-25 20:28:42,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1568/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 2.67229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:42,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43821 samples/s/p 4:40:17 } +2024-07-25 20:28:45,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1570/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 2.6718957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:45,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43391 samples/s/p 
4:40:27 } +2024-07-25 20:28:48,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1572/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.671501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:48,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43170 samples/s/p 4:40:31 } +2024-07-25 20:28:51,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1574/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 2.6711057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:51,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43726 samples/s/p 4:40:11 } +2024-07-25 20:28:53,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1576/ 1625], loss: 1.196, per_step_time: 1474ms, lr: 2.6707106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:53,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.42733 samples/s/p 4:40:39 } +2024-07-25 20:28:56,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1578/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.6703154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:56,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43819 samples/s/p 4:40:02 } +2024-07-25 20:28:59,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1580/ 1625], loss: 1.318, per_step_time: 1471ms, lr: 2.6699196e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:59,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43541 samples/s/p 4:40:08 } +2024-07-25 20:29:02,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1582/ 1625], loss: 1.154, 
per_step_time: 1470ms, lr: 2.6695237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:02,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.44147 samples/s/p 4:39:46 } +2024-07-25 20:29:05,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1584/ 1625], loss: 1.021, per_step_time: 1470ms, lr: 2.669128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:05,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.44029 samples/s/p 4:39:47 } +2024-07-25 20:29:08,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1586/ 1625], loss: 1.047, per_step_time: 1471ms, lr: 2.6687318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:08,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43542 samples/s/p 4:39:59 } +2024-07-25 20:29:11,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1588/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 2.6683352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:11,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43402 samples/s/p 4:40:00 } +2024-07-25 20:29:14,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1590/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.6679389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:14,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43810 samples/s/p 4:39:45 } +2024-07-25 20:29:17,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1592/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.667542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:17,564 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 29.8% |██████████████ | 5.43364 samples/s/p 4:39:56 } +2024-07-25 20:29:20,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1594/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 2.667145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:20,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43320 samples/s/p 4:39:54 } +2024-07-25 20:29:23,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1596/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 2.6667478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:23,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43321 samples/s/p 4:39:51 } +2024-07-25 20:29:26,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1598/ 1625], loss: 1.318, per_step_time: 1471ms, lr: 2.6663502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:26,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43568 samples/s/p 4:39:40 } +2024-07-25 20:29:29,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1600/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 2.6659527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:29,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43799 samples/s/p 4:39:30 } +2024-07-25 20:29:32,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1602/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.6655547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:32,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43157 samples/s/p 4:39:47 } +2024-07-25 20:29:35,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 
10], step:[ 1604/ 1625], loss: 1.150, per_step_time: 1481ms, lr: 2.6651567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:35,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.39861 samples/s/p 4:41:27 } +2024-07-25 20:29:38,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1606/ 1625], loss: 1.109, per_step_time: 1473ms, lr: 2.6647582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:38,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.42818 samples/s/p 4:39:52 } +2024-07-25 20:29:41,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1608/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.66436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:41,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43343 samples/s/p 4:39:33 } +2024-07-25 20:29:44,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1610/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 2.6639615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:44,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43570 samples/s/p 4:39:23 } +2024-07-25 20:29:47,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1612/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 2.6635624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:47,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43792 samples/s/p 4:39:13 } +2024-07-25 20:29:50,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1614/ 1625], loss: 1.079, per_step_time: 1472ms, lr: 2.6631631e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:50,051 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43206 samples/s/p 4:39:28 } +2024-07-25 20:29:53,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1616/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 2.6627638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:53,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43332 samples/s/p 4:39:21 } +2024-07-25 20:29:55,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1618/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 2.6623644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:55,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.43829 samples/s/p 4:39:03 } +2024-07-25 20:29:58,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1620/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 2.6619646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:58,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.43111 samples/s/p 4:39:22 } +2024-07-25 20:30:01,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1622/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 2.6615648e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:01,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.43409 samples/s/p 4:39:10 } +2024-07-25 20:30:04,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1624/ 1625], loss: 1.268, per_step_time: 1471ms, lr: 2.661165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:04,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.43777 samples/s/p 4:38:56 } +2024-07-25 20:30:07,756 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 2.6607646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:07,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.43462 samples/s/p 4:39:03 } +2024-07-25 20:30:10,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 3/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.660364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:10,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.43728 samples/s/p 4:38:51 } +2024-07-25 20:30:13,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 5/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 2.6599633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:13,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.43757 samples/s/p 4:38:48 } +2024-07-25 20:30:16,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 7/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 2.6595622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:16,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.44006 samples/s/p 4:38:37 } +2024-07-25 20:30:19,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 9/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.6591613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:19,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43721 samples/s/p 4:38:43 } +2024-07-25 20:30:22,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 11/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 2.6587599e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 20:30:22,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43833 samples/s/p 4:38:36 } +2024-07-25 20:30:25,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 13/ 1625], loss: 1.118, per_step_time: 1473ms, lr: 2.6583582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:25,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.42901 samples/s/p 4:39:02 } +2024-07-25 20:30:28,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 15/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 2.6579564e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:28,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43840 samples/s/p 4:38:30 } +2024-07-25 20:30:31,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 17/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 2.6575546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:31,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43355 samples/s/p 4:38:42 } +2024-07-25 20:30:34,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 19/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 2.6571523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:34,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43504 samples/s/p 4:38:35 } +2024-07-25 20:30:37,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 21/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.6567499e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:37,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43808 samples/s/p 4:38:22 } 
+2024-07-25 20:30:40,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 23/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 2.6563475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:40,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43399 samples/s/p 4:38:32 } +2024-07-25 20:30:43,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 25/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 2.6559446e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:43,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43346 samples/s/p 4:38:31 } +2024-07-25 20:30:46,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 27/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 2.6555417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:46,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43604 samples/s/p 4:38:20 } +2024-07-25 20:30:49,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 29/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 2.6551385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:49,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43457 samples/s/p 4:38:21 } +2024-07-25 20:30:52,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 31/ 1625], loss: 1.000, per_step_time: 1471ms, lr: 2.654735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:52,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43780 samples/s/p 4:38:09 } +2024-07-25 20:30:54,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 33/ 1625], loss: 0.991, per_step_time: 1471ms, lr: 
2.6543314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:54,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43718 samples/s/p 4:38:08 } +2024-07-25 20:30:57,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 35/ 1625], loss: 1.309, per_step_time: 1471ms, lr: 2.6539275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:57,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43622 samples/s/p 4:38:08 } +2024-07-25 20:31:00,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 37/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.6535236e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:00,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43431 samples/s/p 4:38:10 } +2024-07-25 20:31:03,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 39/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.6531194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:03,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43460 samples/s/p 4:38:07 } +2024-07-25 20:31:06,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 41/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.652715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:06,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43313 samples/s/p 4:38:08 } +2024-07-25 20:31:09,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 43/ 1625], loss: 1.054, per_step_time: 1473ms, lr: 2.6523103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:09,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 
5.42962 samples/s/p 4:38:16 } +2024-07-25 20:31:12,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 45/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.6519056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:12,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43591 samples/s/p 4:37:54 } +2024-07-25 20:31:15,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 47/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 2.6515005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:15,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43563 samples/s/p 4:37:52 } +2024-07-25 20:31:18,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 49/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 2.6510952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:18,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43176 samples/s/p 4:38:01 } +2024-07-25 20:31:21,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 51/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 2.6506901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:21,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43587 samples/s/p 4:37:45 } +2024-07-25 20:31:24,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 53/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 2.6502841e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:24,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43949 samples/s/p 4:37:31 } +2024-07-25 20:31:27,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 55/ 1625], loss: 1.330, 
per_step_time: 1473ms, lr: 2.6498787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:27,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43080 samples/s/p 4:37:55 } +2024-07-25 20:31:30,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 57/ 1625], loss: 1.054, per_step_time: 1472ms, lr: 2.6494725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:30,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43307 samples/s/p 4:37:45 } +2024-07-25 20:31:33,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 59/ 1625], loss: 1.363, per_step_time: 1472ms, lr: 2.6490663e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:33,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43260 samples/s/p 4:37:43 } +2024-07-25 20:31:36,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 61/ 1625], loss: 1.154, per_step_time: 1470ms, lr: 2.64866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:36,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.44091 samples/s/p 4:37:15 } +2024-07-25 20:31:39,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 63/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.6482532e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:39,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43261 samples/s/p 4:37:37 } +2024-07-25 20:31:42,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 65/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 2.6478463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:42,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
30.4% |███████████████ | 5.43627 samples/s/p 4:37:23 } +2024-07-25 20:31:45,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 67/ 1625], loss: 1.040, per_step_time: 1473ms, lr: 2.6474394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:45,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43069 samples/s/p 4:37:37 } +2024-07-25 20:31:48,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 69/ 1625], loss: 0.995, per_step_time: 1470ms, lr: 2.6470321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:48,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43910 samples/s/p 4:37:09 } +2024-07-25 20:31:51,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 71/ 1625], loss: 1.243, per_step_time: 1469ms, lr: 2.6466245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:51,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.44229 samples/s/p 4:36:56 } +2024-07-25 20:31:53,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 73/ 1625], loss: 0.988, per_step_time: 1470ms, lr: 2.6462169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:53,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43917 samples/s/p 4:37:03 } +2024-07-25 20:31:56,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 75/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 2.645809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:56,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43845 samples/s/p 4:37:02 } +2024-07-25 20:31:59,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 
77/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 2.645401e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:59,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43596 samples/s/p 4:37:07 } +2024-07-25 20:32:02,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 79/ 1625], loss: 1.144, per_step_time: 1472ms, lr: 2.6449929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:02,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43271 samples/s/p 4:37:14 } +2024-07-25 20:32:05,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 81/ 1625], loss: 1.022, per_step_time: 1472ms, lr: 2.6445841e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:05,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43447 samples/s/p 4:37:05 } +2024-07-25 20:32:08,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 83/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.6441756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:08,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43828 samples/s/p 4:36:51 } +2024-07-25 20:32:11,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 85/ 1625], loss: 0.944, per_step_time: 1471ms, lr: 2.6437665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:11,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43538 samples/s/p 4:36:57 } +2024-07-25 20:32:14,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 87/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 2.6433578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:14,636 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43447 samples/s/p 4:36:56 } +2024-07-25 20:32:17,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 89/ 1625], loss: 0.988, per_step_time: 1472ms, lr: 2.6429483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:17,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43368 samples/s/p 4:36:56 } +2024-07-25 20:32:20,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 91/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 2.642539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:20,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43562 samples/s/p 4:36:47 } +2024-07-25 20:32:23,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 93/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 2.6421292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:23,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43341 samples/s/p 4:36:51 } +2024-07-25 20:32:26,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 95/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.6417194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:26,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43823 samples/s/p 4:36:33 } +2024-07-25 20:32:29,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 97/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 2.6413092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:29,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43344 samples/s/p 4:36:45 } +2024-07-25 20:32:32,340 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 99/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 2.640899e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:32,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43812 samples/s/p 4:36:28 } +2024-07-25 20:32:35,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 101/ 1625], loss: 1.247, per_step_time: 1470ms, lr: 2.6404885e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:35,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.44132 samples/s/p 4:36:15 } +2024-07-25 20:32:38,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 103/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.640078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:38,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43262 samples/s/p 4:36:38 } +2024-07-25 20:32:41,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 105/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 2.639667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:41,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43241 samples/s/p 4:36:36 } +2024-07-25 20:32:44,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 107/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 2.639256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:44,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43794 samples/s/p 4:36:16 } +2024-07-25 20:32:47,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 109/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.6388447e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:32:47,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43694 samples/s/p 4:36:16 } +2024-07-25 20:32:50,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 111/ 1625], loss: 1.150, per_step_time: 1469ms, lr: 2.6384332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:50,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.44261 samples/s/p 4:35:56 } +2024-07-25 20:32:52,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 113/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 2.6380214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:52,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43749 samples/s/p 4:36:09 } +2024-07-25 20:32:55,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 115/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.6376096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:55,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43290 samples/s/p 4:36:20 } +2024-07-25 20:32:58,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 117/ 1625], loss: 1.172, per_step_time: 1474ms, lr: 2.6371974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:58,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.42526 samples/s/p 4:36:40 } +2024-07-25 20:33:01,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 119/ 1625], loss: 1.298, per_step_time: 1474ms, lr: 2.6367852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:01,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.42528 samples/s/p 
4:36:37 } +2024-07-25 20:33:04,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 121/ 1625], loss: 1.315, per_step_time: 1471ms, lr: 2.6363727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:04,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43485 samples/s/p 4:36:05 } +2024-07-25 20:33:07,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 123/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 2.63596e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:07,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43780 samples/s/p 4:35:53 } +2024-07-25 20:33:10,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 125/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 2.635547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:10,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43622 samples/s/p 4:35:55 } +2024-07-25 20:33:13,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 127/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 2.635134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:13,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43166 samples/s/p 4:36:06 } +2024-07-25 20:33:16,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 129/ 1625], loss: 1.027, per_step_time: 1470ms, lr: 2.6347207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:16,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.44017 samples/s/p 4:35:37 } +2024-07-25 20:33:19,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 131/ 1625], loss: 1.065, per_step_time: 
1471ms, lr: 2.6343072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:19,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43631 samples/s/p 4:35:46 } +2024-07-25 20:33:22,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 133/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.6338936e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:22,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43759 samples/s/p 4:35:39 } +2024-07-25 20:33:25,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 135/ 1625], loss: 1.212, per_step_time: 1473ms, lr: 2.6334796e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:25,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43022 samples/s/p 4:35:59 } +2024-07-25 20:33:28,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 137/ 1625], loss: 1.146, per_step_time: 1470ms, lr: 2.6330656e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:28,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43910 samples/s/p 4:35:29 } +2024-07-25 20:33:31,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 139/ 1625], loss: 1.209, per_step_time: 1474ms, lr: 2.632651e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:31,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.42509 samples/s/p 4:36:08 } +2024-07-25 20:33:34,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 141/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 2.6322365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:34,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% 
|███████████████ | 5.43817 samples/s/p 4:35:26 } +2024-07-25 20:33:37,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 143/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 2.6318221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:37,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43726 samples/s/p 4:35:25 } +2024-07-25 20:33:40,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 145/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 2.631407e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:40,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43152 samples/s/p 4:35:40 } +2024-07-25 20:33:43,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 147/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 2.6309921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:43,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43291 samples/s/p 4:35:33 } +2024-07-25 20:33:46,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 149/ 1625], loss: 1.344, per_step_time: 1471ms, lr: 2.6305768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:46,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43605 samples/s/p 4:35:20 } +2024-07-25 20:33:49,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 151/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 2.6301614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:49,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43849 samples/s/p 4:35:10 } +2024-07-25 20:33:52,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 
153/ 1625], loss: 1.080, per_step_time: 1469ms, lr: 2.6297457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:52,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.44360 samples/s/p 4:34:52 } +2024-07-25 20:33:54,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 155/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 2.6293299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:54,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.43941 samples/s/p 4:35:01 } +2024-07-25 20:33:57,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 157/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 2.6289135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:57,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.43820 samples/s/p 4:35:02 } +2024-07-25 20:34:00,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 159/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.6284974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:00,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.43671 samples/s/p 4:35:04 } +2024-07-25 20:34:03,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 161/ 1625], loss: 1.036, per_step_time: 1472ms, lr: 2.6280808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:03,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.43171 samples/s/p 4:35:16 } +2024-07-25 20:34:06,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 163/ 1625], loss: 1.125, per_step_time: 1474ms, lr: 2.6276643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:06,770 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.42404 samples/s/p 4:35:36 } +2024-07-25 20:34:09,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 165/ 1625], loss: 1.003, per_step_time: 1469ms, lr: 2.6272473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:09,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.44274 samples/s/p 4:34:37 } +2024-07-25 20:34:12,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 167/ 1625], loss: 1.246, per_step_time: 1474ms, lr: 2.6268302e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:12,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.42471 samples/s/p 4:35:28 } +2024-07-25 20:34:15,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 169/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 2.6264128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:15,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.42861 samples/s/p 4:35:13 } +2024-07-25 20:34:18,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 171/ 1625], loss: 1.268, per_step_time: 1471ms, lr: 2.6259953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:18,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43519 samples/s/p 4:34:51 } +2024-07-25 20:34:21,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 173/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 2.6255777e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:21,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43504 samples/s/p 4:34:48 } +2024-07-25 20:34:24,484 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 175/ 1625], loss: 1.049, per_step_time: 1473ms, lr: 2.6251599e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:24,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43107 samples/s/p 4:34:57 } +2024-07-25 20:34:27,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 177/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 2.624742e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:27,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43465 samples/s/p 4:34:43 } +2024-07-25 20:34:30,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 179/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.6243237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:30,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43163 samples/s/p 4:34:50 } +2024-07-25 20:34:33,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 181/ 1625], loss: 1.385, per_step_time: 1471ms, lr: 2.6239051e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:33,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43609 samples/s/p 4:34:33 } +2024-07-25 20:34:36,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 183/ 1625], loss: 1.328, per_step_time: 1471ms, lr: 2.6234866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:36,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43783 samples/s/p 4:34:25 } +2024-07-25 20:34:39,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 185/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.6230677e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:34:39,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43216 samples/s/p 4:34:39 } +2024-07-25 20:34:42,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 187/ 1625], loss: 1.128, per_step_time: 1474ms, lr: 2.6226486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:42,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.42465 samples/s/p 4:34:59 } +2024-07-25 20:34:45,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 189/ 1625], loss: 1.125, per_step_time: 1469ms, lr: 2.6222293e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:45,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.44478 samples/s/p 4:33:55 } +2024-07-25 20:34:48,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 191/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 2.6218097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:48,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.43247 samples/s/p 4:34:29 } +2024-07-25 20:34:51,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 193/ 1625], loss: 1.006, per_step_time: 1472ms, lr: 2.6213902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:51,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.43182 samples/s/p 4:34:28 } +2024-07-25 20:34:54,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 195/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 2.6209704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:54,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.43359 samples/s/p 
4:34:20 } +2024-07-25 20:34:56,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 197/ 1625], loss: 1.094, per_step_time: 1473ms, lr: 2.6205502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:56,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.42883 samples/s/p 4:34:32 } +2024-07-25 20:34:59,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 199/ 1625], loss: 1.157, per_step_time: 1474ms, lr: 2.6201298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:59,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.42380 samples/s/p 4:34:44 } +2024-07-25 20:35:02,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 201/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 2.6197094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:02,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.43082 samples/s/p 4:34:20 } +2024-07-25 20:35:05,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 203/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 2.6192887e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:05,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.42891 samples/s/p 4:34:22 } +2024-07-25 20:35:08,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 205/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 2.618868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:08,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43566 samples/s/p 4:33:59 } +2024-07-25 20:35:11,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 207/ 1625], loss: 1.182, per_step_time: 
1471ms, lr: 2.618447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:11,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43584 samples/s/p 4:33:56 } +2024-07-25 20:35:14,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 209/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.6180256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:14,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43803 samples/s/p 4:33:46 } +2024-07-25 20:35:17,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 211/ 1625], loss: 1.353, per_step_time: 1471ms, lr: 2.6176042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:17,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43650 samples/s/p 4:33:48 } +2024-07-25 20:35:20,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 213/ 1625], loss: 1.308, per_step_time: 1470ms, lr: 2.6171825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:20,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.44014 samples/s/p 4:33:34 } +2024-07-25 20:35:23,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 215/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 2.6167607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:23,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43506 samples/s/p 4:33:46 } +2024-07-25 20:35:26,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 217/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.6163387e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:26,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% 
|███████████████ | 5.43294 samples/s/p 4:33:50 } +2024-07-25 20:35:29,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 219/ 1625], loss: 1.017, per_step_time: 1471ms, lr: 2.6159165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:29,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43628 samples/s/p 4:33:37 } +2024-07-25 20:35:32,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 221/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 2.615494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:32,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43724 samples/s/p 4:33:31 } +2024-07-25 20:35:35,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 223/ 1625], loss: 0.978, per_step_time: 1471ms, lr: 2.6150716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:35,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43804 samples/s/p 4:33:25 } +2024-07-25 20:35:38,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 225/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 2.6146485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:38,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.42977 samples/s/p 4:33:47 } +2024-07-25 20:35:41,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 227/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 2.6142256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:41,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43830 samples/s/p 4:33:19 } +2024-07-25 20:35:44,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 
229/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 2.6138026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:44,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43695 samples/s/p 4:33:20 } +2024-07-25 20:35:47,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 231/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.613379e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:47,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43645 samples/s/p 4:33:18 } +2024-07-25 20:35:50,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 233/ 1625], loss: 1.043, per_step_time: 1472ms, lr: 2.6129554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:50,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43439 samples/s/p 4:33:22 } +2024-07-25 20:35:53,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 235/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.6125317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:53,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43695 samples/s/p 4:33:11 } +2024-07-25 20:35:55,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 237/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 2.6121077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:55,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43680 samples/s/p 4:33:09 } +2024-07-25 20:35:58,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 239/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.6116835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:58,928 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43483 samples/s/p 4:33:12 } +2024-07-25 20:36:01,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 241/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.611259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:01,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43691 samples/s/p 4:33:02 } +2024-07-25 20:36:04,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 243/ 1625], loss: 1.141, per_step_time: 1473ms, lr: 2.6108346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:04,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.42955 samples/s/p 4:33:22 } +2024-07-25 20:36:07,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 245/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 2.6104097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:07,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43657 samples/s/p 4:32:57 } +2024-07-25 20:36:10,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 247/ 1625], loss: 1.326, per_step_time: 1473ms, lr: 2.6099848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:10,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43059 samples/s/p 4:33:13 } +2024-07-25 20:36:13,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 249/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 2.6095595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:13,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.44078 samples/s/p 4:32:39 } +2024-07-25 20:36:16,633 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 251/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 2.6091344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:16,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43609 samples/s/p 4:32:50 } +2024-07-25 20:36:19,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 253/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 2.6087086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:19,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43702 samples/s/p 4:32:44 } +2024-07-25 20:36:22,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 255/ 1625], loss: 1.192, per_step_time: 1474ms, lr: 2.608283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:22,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.42514 samples/s/p 4:33:17 } +2024-07-25 20:36:25,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 257/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 2.607857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:25,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43769 samples/s/p 4:32:36 } +2024-07-25 20:36:28,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 259/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 2.6074307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:28,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.44081 samples/s/p 4:32:24 } +2024-07-25 20:36:31,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 261/ 1625], loss: 1.327, per_step_time: 1473ms, lr: 2.6070044e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:36:31,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43103 samples/s/p 4:32:51 } +2024-07-25 20:36:34,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 263/ 1625], loss: 1.043, per_step_time: 1473ms, lr: 2.6065778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:34,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.42843 samples/s/p 4:32:56 } +2024-07-25 20:36:37,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 265/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 2.6061514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:37,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43694 samples/s/p 4:32:27 } +2024-07-25 20:36:40,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 267/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 2.6057243e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:40,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43667 samples/s/p 4:32:25 } +2024-07-25 20:36:43,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 269/ 1625], loss: 1.081, per_step_time: 1469ms, lr: 2.6052974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:43,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.44220 samples/s/p 4:32:05 } +2024-07-25 20:36:46,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 271/ 1625], loss: 1.017, per_step_time: 1473ms, lr: 2.6048701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:46,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43101 samples/s/p 
4:32:36 } +2024-07-25 20:36:49,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 273/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.6044425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:49,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43789 samples/s/p 4:32:12 } +2024-07-25 20:36:52,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 275/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 2.6040148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:52,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43686 samples/s/p 4:32:12 } +2024-07-25 20:36:54,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 277/ 1625], loss: 1.050, per_step_time: 1470ms, lr: 2.6035868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:54,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.44201 samples/s/p 4:31:54 } +2024-07-25 20:36:57,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 279/ 1625], loss: 1.148, per_step_time: 1474ms, lr: 2.6031588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:57,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.42706 samples/s/p 4:32:36 } +2024-07-25 20:37:00,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 281/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.6027305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:00,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43453 samples/s/p 4:32:11 } +2024-07-25 20:37:03,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 283/ 1625], loss: 1.271, 
per_step_time: 1472ms, lr: 2.6023019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:03,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43459 samples/s/p 4:32:08 } +2024-07-25 20:37:06,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 285/ 1625], loss: 1.024, per_step_time: 1472ms, lr: 2.6018733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:06,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43371 samples/s/p 4:32:07 } +2024-07-25 20:37:09,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 287/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 2.6014444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:09,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43086 samples/s/p 4:32:13 } +2024-07-25 20:37:12,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 289/ 1625], loss: 1.329, per_step_time: 1470ms, lr: 2.6010153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:12,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43965 samples/s/p 4:31:43 } +2024-07-25 20:37:15,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 291/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 2.600586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:15,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43093 samples/s/p 4:32:07 } +2024-07-25 20:37:18,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 293/ 1625], loss: 1.119, per_step_time: 1473ms, lr: 2.6001566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:18,610 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 31.8% |███████████████ | 5.43061 samples/s/p 4:32:05 } +2024-07-25 20:37:21,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 295/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 2.599727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:21,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43588 samples/s/p 4:31:46 } +2024-07-25 20:37:24,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 297/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 2.5992971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:24,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43541 samples/s/p 4:31:44 } +2024-07-25 20:37:27,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 299/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.5988671e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:27,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43777 samples/s/p 4:31:34 } +2024-07-25 20:37:30,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 301/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.5984367e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:30,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43466 samples/s/p 4:31:41 } +2024-07-25 20:37:33,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 303/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 2.5980064e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:33,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43241 samples/s/p 4:31:45 } +2024-07-25 20:37:36,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 
10], step:[ 305/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 2.5975756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:36,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43614 samples/s/p 4:31:30 } +2024-07-25 20:37:39,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 307/ 1625], loss: 1.409, per_step_time: 1473ms, lr: 2.5971449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:39,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.42979 samples/s/p 4:31:47 } +2024-07-25 20:37:42,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 309/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.596714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:42,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43727 samples/s/p 4:31:21 } +2024-07-25 20:37:45,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 311/ 1625], loss: 1.245, per_step_time: 1470ms, lr: 2.5962827e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:45,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43971 samples/s/p 4:31:11 } +2024-07-25 20:37:48,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 313/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 2.5958512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:48,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43556 samples/s/p 4:31:20 } +2024-07-25 20:37:51,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 315/ 1625], loss: 1.389, per_step_time: 1472ms, lr: 2.5954198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:51,068 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43445 samples/s/p 4:31:21 } +2024-07-25 20:37:54,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 317/ 1625], loss: 0.957, per_step_time: 1472ms, lr: 2.594988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:54,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.43468 samples/s/p 4:31:17 } +2024-07-25 20:37:56,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 319/ 1625], loss: 1.002, per_step_time: 1470ms, lr: 2.594556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:56,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.43883 samples/s/p 4:31:02 } +2024-07-25 20:37:59,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 321/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 2.594124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:59,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.43015 samples/s/p 4:31:25 } +2024-07-25 20:38:02,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 323/ 1625], loss: 1.226, per_step_time: 1470ms, lr: 2.5936914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:02,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.44063 samples/s/p 4:30:51 } +2024-07-25 20:38:05,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 325/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 2.5932592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:05,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.43747 samples/s/p 4:30:57 } +2024-07-25 20:38:08,767 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 327/ 1625], loss: 1.130, per_step_time: 1470ms, lr: 2.5928262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:08,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.44160 samples/s/p 4:30:42 } +2024-07-25 20:38:11,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 329/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 2.5923935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:11,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.43431 samples/s/p 4:31:01 } +2024-07-25 20:38:14,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 331/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 2.5919602e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:14,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.43828 samples/s/p 4:30:46 } +2024-07-25 20:38:17,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 333/ 1625], loss: 1.221, per_step_time: 1469ms, lr: 2.591527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:17,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.44498 samples/s/p 4:30:23 } +2024-07-25 20:38:20,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 335/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 2.5910935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:20,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43249 samples/s/p 4:30:57 } +2024-07-25 20:38:23,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 337/ 1625], loss: 1.077, per_step_time: 1471ms, lr: 2.5906598e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:23,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43713 samples/s/p 4:30:40 } +2024-07-25 20:38:26,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 339/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 2.5902258e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:26,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43638 samples/s/p 4:30:40 } +2024-07-25 20:38:29,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 341/ 1625], loss: 1.068, per_step_time: 1473ms, lr: 2.5897916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:29,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.42977 samples/s/p 4:30:57 } +2024-07-25 20:38:32,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 343/ 1625], loss: 0.974, per_step_time: 1470ms, lr: 2.5893574e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:32,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43995 samples/s/p 4:30:23 } +2024-07-25 20:38:35,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 345/ 1625], loss: 1.065, per_step_time: 1472ms, lr: 2.5889229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:35,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43474 samples/s/p 4:30:36 } +2024-07-25 20:38:38,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 347/ 1625], loss: 1.033, per_step_time: 1472ms, lr: 2.5884883e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:38,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 
5.43475 samples/s/p 4:30:33 } +2024-07-25 20:38:41,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 349/ 1625], loss: 1.139, per_step_time: 1473ms, lr: 2.5880534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:41,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43000 samples/s/p 4:30:44 } +2024-07-25 20:38:44,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 351/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.5876187e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:44,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43509 samples/s/p 4:30:26 } +2024-07-25 20:38:47,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 353/ 1625], loss: 1.186, per_step_time: 1475ms, lr: 2.5871832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:47,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.42279 samples/s/p 4:31:00 } +2024-07-25 20:38:50,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 355/ 1625], loss: 1.323, per_step_time: 1472ms, lr: 2.5867479e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:50,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43321 samples/s/p 4:30:26 } +2024-07-25 20:38:53,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 357/ 1625], loss: 1.193, per_step_time: 1470ms, lr: 2.5863124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:53,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.44075 samples/s/p 4:30:00 } +2024-07-25 20:38:55,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 359/ 1625], 
loss: 1.200, per_step_time: 1471ms, lr: 2.5858766e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:55,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43620 samples/s/p 4:30:11 } +2024-07-25 20:38:58,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 361/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 2.5854404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:58,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43587 samples/s/p 4:30:09 } +2024-07-25 20:39:01,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 363/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.5850044e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:01,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43542 samples/s/p 4:30:07 } +2024-07-25 20:39:04,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 365/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 2.5845678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:04,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43711 samples/s/p 4:29:59 } +2024-07-25 20:39:07,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 367/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 2.5841315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:07,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43662 samples/s/p 4:29:58 } +2024-07-25 20:39:10,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 369/ 1625], loss: 1.177, per_step_time: 1469ms, lr: 2.5836945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:10,732 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.44288 samples/s/p 4:29:36 } +2024-07-25 20:39:13,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 371/ 1625], loss: 1.035, per_step_time: 1472ms, lr: 2.5832576e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:13,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43217 samples/s/p 4:30:05 } +2024-07-25 20:39:16,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 373/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.5828205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:16,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43403 samples/s/p 4:29:57 } +2024-07-25 20:39:19,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 375/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.5823832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:19,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43264 samples/s/p 4:29:58 } +2024-07-25 20:39:22,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 377/ 1625], loss: 0.949, per_step_time: 1468ms, lr: 2.5819456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:22,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.44643 samples/s/p 4:29:14 } +2024-07-25 20:39:25,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 379/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 2.581508e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:25,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43054 samples/s/p 4:29:58 } +2024-07-25 20:39:28,436 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 381/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 2.58107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:28,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43584 samples/s/p 4:29:40 } +2024-07-25 20:39:31,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 383/ 1625], loss: 1.367, per_step_time: 1472ms, lr: 2.580632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:31,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43225 samples/s/p 4:29:47 } +2024-07-25 20:39:34,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 385/ 1625], loss: 1.238, per_step_time: 1469ms, lr: 2.5801935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:34,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.44260 samples/s/p 4:29:14 } +2024-07-25 20:39:37,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 387/ 1625], loss: 1.083, per_step_time: 1470ms, lr: 2.5797552e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:37,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.44215 samples/s/p 4:29:12 } +2024-07-25 20:39:40,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 389/ 1625], loss: 1.197, per_step_time: 1475ms, lr: 2.5793164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:40,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.42274 samples/s/p 4:30:07 } +2024-07-25 20:39:43,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 391/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 2.5788773e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:43,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43460 samples/s/p 4:29:28 } +2024-07-25 20:39:46,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 393/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 2.5784384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:46,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43366 samples/s/p 4:29:28 } +2024-07-25 20:39:49,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 395/ 1625], loss: 1.324, per_step_time: 1472ms, lr: 2.5779993e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:49,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43252 samples/s/p 4:29:29 } +2024-07-25 20:39:52,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 397/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 2.5775596e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:52,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43278 samples/s/p 4:29:25 } +2024-07-25 20:39:55,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 399/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 2.5771202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:55,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43380 samples/s/p 4:29:19 } +2024-07-25 20:39:57,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 401/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.5766803e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:57,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 
5.43146 samples/s/p 4:29:23 } +2024-07-25 20:40:00,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 403/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.5762403e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:00,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43434 samples/s/p 4:29:12 } +2024-07-25 20:40:03,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 405/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 2.5758001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:03,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43708 samples/s/p 4:29:01 } +2024-07-25 20:40:06,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 407/ 1625], loss: 1.285, per_step_time: 1473ms, lr: 2.57536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:06,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.42932 samples/s/p 4:29:21 } +2024-07-25 20:40:09,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 409/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.5749192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:09,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43681 samples/s/p 4:28:55 } +2024-07-25 20:40:12,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 411/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.5744786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:12,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43810 samples/s/p 4:28:49 } +2024-07-25 20:40:15,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 413/ 1625], 
loss: 1.131, per_step_time: 1473ms, lr: 2.5740377e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:15,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.42850 samples/s/p 4:29:14 } +2024-07-25 20:40:18,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 415/ 1625], loss: 1.131, per_step_time: 1470ms, lr: 2.5735966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:18,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43885 samples/s/p 4:28:41 } +2024-07-25 20:40:21,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 417/ 1625], loss: 1.315, per_step_time: 1471ms, lr: 2.5731553e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:21,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43715 samples/s/p 4:28:43 } +2024-07-25 20:40:24,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 419/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 2.5727139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:24,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43740 samples/s/p 4:28:39 } +2024-07-25 20:40:27,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 421/ 1625], loss: 1.060, per_step_time: 1471ms, lr: 2.572272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:27,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43490 samples/s/p 4:28:43 } +2024-07-25 20:40:30,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 423/ 1625], loss: 1.060, per_step_time: 1472ms, lr: 2.5718302e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:30,416 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43129 samples/s/p 4:28:51 } +2024-07-25 20:40:33,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 425/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 2.571388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:33,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43456 samples/s/p 4:28:39 } +2024-07-25 20:40:36,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 427/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 2.5709458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:36,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43033 samples/s/p 4:28:48 } +2024-07-25 20:40:39,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 429/ 1625], loss: 1.340, per_step_time: 1471ms, lr: 2.5705032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:39,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43639 samples/s/p 4:28:27 } +2024-07-25 20:40:42,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 431/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 2.5700607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:42,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.42744 samples/s/p 4:28:51 } +2024-07-25 20:40:45,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 433/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.5696178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:45,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43665 samples/s/p 4:28:21 } +2024-07-25 20:40:48,128 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 435/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.5691748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:48,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43259 samples/s/p 4:28:30 } +2024-07-25 20:40:51,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 437/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 2.5687315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:51,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43241 samples/s/p 4:28:27 } +2024-07-25 20:40:54,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 439/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 2.5682884e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:54,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43561 samples/s/p 4:28:15 } +2024-07-25 20:40:56,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 441/ 1625], loss: 1.161, per_step_time: 1470ms, lr: 2.5678448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:56,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43940 samples/s/p 4:28:01 } +2024-07-25 20:40:59,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 443/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.5674008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:59,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43833 samples/s/p 4:28:01 } +2024-07-25 20:41:02,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 445/ 1625], loss: 1.059, per_step_time: 1472ms, lr: 2.5669571e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:02,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43330 samples/s/p 4:28:13 } +2024-07-25 20:41:05,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 447/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 2.5665127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:05,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43611 samples/s/p 4:28:02 } +2024-07-25 20:41:08,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 449/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 2.5660685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:08,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43900 samples/s/p 4:27:50 } +2024-07-25 20:41:11,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 451/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 2.565624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:11,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43399 samples/s/p 4:28:02 } +2024-07-25 20:41:14,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 453/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.5651794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:14,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43779 samples/s/p 4:27:48 } +2024-07-25 20:41:17,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 455/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 2.5647345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:17,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 
5.43503 samples/s/p 4:27:53 } +2024-07-25 20:41:20,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 457/ 1625], loss: 1.050, per_step_time: 1472ms, lr: 2.5642892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:20,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43235 samples/s/p 4:27:58 } +2024-07-25 20:41:23,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 459/ 1625], loss: 1.033, per_step_time: 1470ms, lr: 2.563844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:23,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43936 samples/s/p 4:27:34 } +2024-07-25 20:41:26,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 461/ 1625], loss: 1.362, per_step_time: 1472ms, lr: 2.5633986e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:26,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43323 samples/s/p 4:27:50 } +2024-07-25 20:41:29,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 463/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 2.562953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:29,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43683 samples/s/p 4:27:36 } +2024-07-25 20:41:32,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 465/ 1625], loss: 1.100, per_step_time: 1470ms, lr: 2.5625071e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:32,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.44014 samples/s/p 4:27:23 } +2024-07-25 20:41:35,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 467/ 1625], 
loss: 1.282, per_step_time: 1469ms, lr: 2.5620611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:35,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.44340 samples/s/p 4:27:11 } +2024-07-25 20:41:38,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 469/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 2.561615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:38,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43011 samples/s/p 4:27:47 } +2024-07-25 20:41:41,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 471/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 2.5611685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:41,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43700 samples/s/p 4:27:24 } +2024-07-25 20:41:44,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 473/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.5607218e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:44,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43534 samples/s/p 4:27:26 } +2024-07-25 20:41:47,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 475/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 2.560275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:47,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43289 samples/s/p 4:27:30 } +2024-07-25 20:41:50,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 477/ 1625], loss: 0.968, per_step_time: 1471ms, lr: 2.5598283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:50,086 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43805 samples/s/p 4:27:12 } +2024-07-25 20:41:53,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 479/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.559381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:53,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43317 samples/s/p 4:27:23 } +2024-07-25 20:41:55,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 481/ 1625], loss: 1.331, per_step_time: 1472ms, lr: 2.5589337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:55,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43367 samples/s/p 4:27:19 } +2024-07-25 20:41:58,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 483/ 1625], loss: 0.845, per_step_time: 1472ms, lr: 2.5584863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:58,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43378 samples/s/p 4:27:15 } +2024-07-25 20:42:01,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 485/ 1625], loss: 1.327, per_step_time: 1472ms, lr: 2.5580384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:01,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43397 samples/s/p 4:27:12 } +2024-07-25 20:42:04,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 487/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.5575904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:04,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43715 samples/s/p 4:27:00 } +2024-07-25 20:42:07,794 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 489/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.5571424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:07,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43478 samples/s/p 4:27:04 } +2024-07-25 20:42:10,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 491/ 1625], loss: 0.914, per_step_time: 1471ms, lr: 2.5566942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:10,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43809 samples/s/p 4:26:51 } +2024-07-25 20:42:13,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 493/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 2.5562456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:13,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43651 samples/s/p 4:26:53 } +2024-07-25 20:42:16,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 495/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.5557973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:16,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43366 samples/s/p 4:26:58 } +2024-07-25 20:42:19,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 497/ 1625], loss: 1.239, per_step_time: 1470ms, lr: 2.5553481e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:19,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.44145 samples/s/p 4:26:32 } +2024-07-25 20:42:22,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 499/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 2.5548994e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:22,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.43789 samples/s/p 4:26:40 } +2024-07-25 20:42:25,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 501/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 2.5544505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:25,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.43517 samples/s/p 4:26:45 } +2024-07-25 20:42:28,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 503/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.554001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:28,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.43958 samples/s/p 4:26:29 } +2024-07-25 20:42:31,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 505/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 2.5535512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:31,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.43257 samples/s/p 4:26:47 } +2024-07-25 20:42:34,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 507/ 1625], loss: 1.000, per_step_time: 1473ms, lr: 2.5531017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:34,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.42970 samples/s/p 4:26:52 } +2024-07-25 20:42:37,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 509/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 2.5526517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:37,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 
5.43157 samples/s/p 4:26:44 } +2024-07-25 20:42:40,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 511/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 2.5522017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:40,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.43544 samples/s/p 4:26:29 } +2024-07-25 20:42:43,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 513/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 2.5517515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:43,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43407 samples/s/p 4:26:30 } +2024-07-25 20:42:46,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 515/ 1625], loss: 1.039, per_step_time: 1470ms, lr: 2.5513009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:46,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43877 samples/s/p 4:26:14 } +2024-07-25 20:42:49,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 517/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 2.5508501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:49,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43228 samples/s/p 4:26:30 } +2024-07-25 20:42:52,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 519/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.5503994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:52,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43460 samples/s/p 4:26:20 } +2024-07-25 20:42:55,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 521/ 1625], 
loss: 1.062, per_step_time: 1483ms, lr: 2.5499483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:55,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.39346 samples/s/p 4:28:19 } +2024-07-25 20:42:57,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 523/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.5494972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:57,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43346 samples/s/p 4:26:18 } +2024-07-25 20:43:00,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 525/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 2.5490457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:00,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43480 samples/s/p 4:26:11 } +2024-07-25 20:43:03,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 527/ 1625], loss: 1.051, per_step_time: 1473ms, lr: 2.548594e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:03,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43010 samples/s/p 4:26:22 } +2024-07-25 20:43:06,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 529/ 1625], loss: 1.331, per_step_time: 1470ms, lr: 2.5481426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:06,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43907 samples/s/p 4:25:52 } +2024-07-25 20:43:09,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 531/ 1625], loss: 1.348, per_step_time: 1471ms, lr: 2.5476902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:09,784 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43843 samples/s/p 4:25:51 } +2024-07-25 20:43:12,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 533/ 1625], loss: 1.260, per_step_time: 1470ms, lr: 2.5472384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:12,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43857 samples/s/p 4:25:48 } +2024-07-25 20:43:15,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 535/ 1625], loss: 1.051, per_step_time: 1470ms, lr: 2.5467862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:15,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43974 samples/s/p 4:25:41 } +2024-07-25 20:43:18,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 537/ 1625], loss: 1.013, per_step_time: 1471ms, lr: 2.5463336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:18,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43524 samples/s/p 4:25:52 } +2024-07-25 20:43:21,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 539/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 2.5458809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:21,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43697 samples/s/p 4:25:44 } +2024-07-25 20:43:24,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 541/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.545428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:24,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43354 samples/s/p 4:25:51 } +2024-07-25 20:43:27,482 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 543/ 1625], loss: 1.039, per_step_time: 1470ms, lr: 2.544975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:27,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43893 samples/s/p 4:25:32 } +2024-07-25 20:43:30,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 545/ 1625], loss: 1.357, per_step_time: 1473ms, lr: 2.5445217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:30,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.42849 samples/s/p 4:26:00 } +2024-07-25 20:43:33,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 547/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 2.5440682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:33,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43320 samples/s/p 4:25:43 } +2024-07-25 20:43:36,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 549/ 1625], loss: 1.143, per_step_time: 1473ms, lr: 2.5436146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:36,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43009 samples/s/p 4:25:49 } +2024-07-25 20:43:39,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 551/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 2.543161e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:39,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43618 samples/s/p 4:25:28 } +2024-07-25 20:43:42,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 553/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 2.5427067e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:42,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43146 samples/s/p 4:25:39 } +2024-07-25 20:43:45,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 555/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.5422527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:45,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43788 samples/s/p 4:25:17 } +2024-07-25 20:43:48,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 557/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 2.5417983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:48,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43647 samples/s/p 4:25:19 } +2024-07-25 20:43:51,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 559/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 2.5413437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:51,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43065 samples/s/p 4:25:33 } +2024-07-25 20:43:54,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 561/ 1625], loss: 1.231, per_step_time: 1469ms, lr: 2.540889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:54,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.44380 samples/s/p 4:24:51 } +2024-07-25 20:43:57,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 563/ 1625], loss: 1.052, per_step_time: 1474ms, lr: 2.540434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:57,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 
5.42699 samples/s/p 4:25:38 } +2024-07-25 20:43:59,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 565/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.5399791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:59,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.43329 samples/s/p 4:25:16 } +2024-07-25 20:44:02,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 567/ 1625], loss: 1.009, per_step_time: 1473ms, lr: 2.5395238e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:02,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.42903 samples/s/p 4:25:26 } +2024-07-25 20:44:05,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 569/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.5390684e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:05,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.43485 samples/s/p 4:25:06 } +2024-07-25 20:44:08,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 571/ 1625], loss: 1.050, per_step_time: 1470ms, lr: 2.5386127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:08,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.44048 samples/s/p 4:24:46 } +2024-07-25 20:44:11,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 573/ 1625], loss: 1.245, per_step_time: 1471ms, lr: 2.5381569e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:11,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.43581 samples/s/p 4:24:57 } +2024-07-25 20:44:14,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 575/ 1625], 
loss: 1.235, per_step_time: 1472ms, lr: 2.5377009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:14,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.43337 samples/s/p 4:25:01 } +2024-07-25 20:44:17,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 577/ 1625], loss: 1.130, per_step_time: 1470ms, lr: 2.5372448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:17,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43854 samples/s/p 4:24:43 } +2024-07-25 20:44:20,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 579/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 2.5367885e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:20,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43937 samples/s/p 4:24:38 } +2024-07-25 20:44:23,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 581/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.5363319e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:23,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43508 samples/s/p 4:24:47 } +2024-07-25 20:44:26,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 583/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.5358753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:26,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43398 samples/s/p 4:24:48 } +2024-07-25 20:44:29,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 585/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 2.5354186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:29,459 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43600 samples/s/p 4:24:39 } +2024-07-25 20:44:32,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 587/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 2.5349613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:32,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43312 samples/s/p 4:24:44 } +2024-07-25 20:44:35,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 589/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.5345042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:35,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43185 samples/s/p 4:24:45 } +2024-07-25 20:44:38,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 591/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 2.5340469e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:38,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43180 samples/s/p 4:24:42 } +2024-07-25 20:44:41,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 593/ 1625], loss: 1.069, per_step_time: 1473ms, lr: 2.533589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:41,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.42914 samples/s/p 4:24:47 } +2024-07-25 20:44:44,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 595/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 2.5331314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:44,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43261 samples/s/p 4:24:34 } +2024-07-25 20:44:47,171 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 597/ 1625], loss: 1.238, per_step_time: 1470ms, lr: 2.5326734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:47,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43988 samples/s/p 4:24:10 } +2024-07-25 20:44:50,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 599/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.5322151e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:50,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43346 samples/s/p 4:24:26 } +2024-07-25 20:44:53,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 601/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 2.5317566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:53,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.44035 samples/s/p 4:24:03 } +2024-07-25 20:44:56,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 603/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.531298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:56,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.44018 samples/s/p 4:24:00 } +2024-07-25 20:44:58,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 605/ 1625], loss: 1.079, per_step_time: 1472ms, lr: 2.5308394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:58,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43467 samples/s/p 4:24:13 } +2024-07-25 20:45:01,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 607/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.5303805e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:01,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43693 samples/s/p 4:24:04 } +2024-07-25 20:45:04,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 609/ 1625], loss: 1.196, per_step_time: 1470ms, lr: 2.5299214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:04,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43929 samples/s/p 4:23:54 } +2024-07-25 20:45:07,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 611/ 1625], loss: 1.042, per_step_time: 1471ms, lr: 2.5294623e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:07,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.43544 samples/s/p 4:24:02 } +2024-07-25 20:45:10,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 613/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 2.5290028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:10,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.43284 samples/s/p 4:24:07 } +2024-07-25 20:45:13,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 615/ 1625], loss: 1.175, per_step_time: 1470ms, lr: 2.5285432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:13,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.43904 samples/s/p 4:23:46 } +2024-07-25 20:45:16,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 617/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 2.5280837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:16,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 
5.44045 samples/s/p 4:23:39 } +2024-07-25 20:45:19,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 619/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 2.5276235e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:19,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.43547 samples/s/p 4:23:50 } +2024-07-25 20:45:22,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 621/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 2.527163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:22,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.44087 samples/s/p 4:23:32 } +2024-07-25 20:45:25,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 623/ 1625], loss: 1.220, per_step_time: 1469ms, lr: 2.526703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:25,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.44286 samples/s/p 4:23:23 } +2024-07-25 20:45:28,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 625/ 1625], loss: 1.311, per_step_time: 1469ms, lr: 2.5262425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:28,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.44500 samples/s/p 4:23:14 } +2024-07-25 20:45:31,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 627/ 1625], loss: 1.193, per_step_time: 1471ms, lr: 2.525782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:31,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.43775 samples/s/p 4:23:32 } +2024-07-25 20:45:34,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 629/ 1625], 
loss: 1.081, per_step_time: 1473ms, lr: 2.525321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:34,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.42793 samples/s/p 4:23:58 } +2024-07-25 20:45:37,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 631/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 2.52486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:37,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.43576 samples/s/p 4:23:32 } +2024-07-25 20:45:40,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 633/ 1625], loss: 1.220, per_step_time: 1473ms, lr: 2.5243986e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:40,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.43019 samples/s/p 4:23:45 } +2024-07-25 20:45:43,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 635/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 2.5239373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:43,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.43881 samples/s/p 4:23:17 } +2024-07-25 20:45:46,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 637/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 2.5234756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:46,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.43893 samples/s/p 4:23:14 } +2024-07-25 20:45:49,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 639/ 1625], loss: 1.307, per_step_time: 1470ms, lr: 2.523014e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:49,115 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.44068 samples/s/p 4:23:06 } +2024-07-25 20:45:52,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 641/ 1625], loss: 1.284, per_step_time: 1474ms, lr: 2.522552e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:52,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.42697 samples/s/p 4:23:43 } +2024-07-25 20:45:55,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 643/ 1625], loss: 0.997, per_step_time: 1473ms, lr: 2.5220897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:55,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.42967 samples/s/p 4:23:32 } +2024-07-25 20:45:57,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 645/ 1625], loss: 1.323, per_step_time: 1473ms, lr: 2.5216274e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:57,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.43052 samples/s/p 4:23:26 } +2024-07-25 20:46:00,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 647/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.521165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:00,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.43373 samples/s/p 4:23:14 } +2024-07-25 20:46:03,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 649/ 1625], loss: 1.322, per_step_time: 1472ms, lr: 2.5207022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:03,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.43255 samples/s/p 4:23:15 } +2024-07-25 20:46:06,829 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 651/ 1625], loss: 1.077, per_step_time: 1470ms, lr: 2.5202393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:06,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.43972 samples/s/p 4:22:51 } +2024-07-25 20:46:09,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 653/ 1625], loss: 1.238, per_step_time: 1473ms, lr: 2.5197764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:09,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.42996 samples/s/p 4:23:16 } +2024-07-25 20:46:12,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 655/ 1625], loss: 1.119, per_step_time: 1470ms, lr: 2.519313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:12,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.44034 samples/s/p 4:22:43 } +2024-07-25 20:46:15,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 657/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 2.5188498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:15,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.44096 samples/s/p 4:22:38 } +2024-07-25 20:46:18,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 659/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.5183861e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:18,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43513 samples/s/p 4:22:52 } +2024-07-25 20:46:21,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 661/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.5179223e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:21,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43544 samples/s/p 4:22:49 } +2024-07-25 20:46:24,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 663/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 2.5174584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:24,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.44065 samples/s/p 4:22:31 } +2024-07-25 20:46:27,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 665/ 1625], loss: 1.260, per_step_time: 1470ms, lr: 2.5169942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:27,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.44131 samples/s/p 4:22:26 } +2024-07-25 20:46:30,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 667/ 1625], loss: 1.393, per_step_time: 1471ms, lr: 2.51653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:30,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43498 samples/s/p 4:22:41 } +2024-07-25 20:46:33,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 669/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 2.5160656e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:33,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43125 samples/s/p 4:22:49 } +2024-07-25 20:46:36,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 671/ 1625], loss: 1.085, per_step_time: 1473ms, lr: 2.5156009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:36,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 
5.42813 samples/s/p 4:22:55 } +2024-07-25 20:46:39,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 673/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.5151363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:39,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43392 samples/s/p 4:22:35 } +2024-07-25 20:46:42,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 675/ 1625], loss: 1.232, per_step_time: 1470ms, lr: 2.5146714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:42,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43990 samples/s/p 4:22:15 } +2024-07-25 20:46:45,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 677/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 2.514206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:45,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43780 samples/s/p 4:22:18 } +2024-07-25 20:46:48,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 679/ 1625], loss: 1.325, per_step_time: 1473ms, lr: 2.5137408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:48,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.42935 samples/s/p 4:22:40 } +2024-07-25 20:46:51,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 681/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 2.5132751e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:51,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43830 samples/s/p 4:22:11 } +2024-07-25 20:46:54,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 683/ 
1625], loss: 1.275, per_step_time: 1473ms, lr: 2.5128094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:54,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.42811 samples/s/p 4:22:37 } +2024-07-25 20:46:56,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 685/ 1625], loss: 0.983, per_step_time: 1472ms, lr: 2.5123436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:56,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43266 samples/s/p 4:22:21 } +2024-07-25 20:46:59,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 687/ 1625], loss: 1.293, per_step_time: 1472ms, lr: 2.5118774e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:59,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43188 samples/s/p 4:22:21 } +2024-07-25 20:47:02,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 689/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 2.5114114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:02,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.44059 samples/s/p 4:21:52 } +2024-07-25 20:47:05,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 691/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 2.510945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:05,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43527 samples/s/p 4:22:05 } +2024-07-25 20:47:08,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 693/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 2.5104782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:08,798 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43431 samples/s/p 4:22:05 } +2024-07-25 20:47:11,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 695/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 2.5100115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:11,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43116 samples/s/p 4:22:11 } +2024-07-25 20:47:14,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 697/ 1625], loss: 1.333, per_step_time: 1471ms, lr: 2.5095445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:14,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43650 samples/s/p 4:21:53 } +2024-07-25 20:47:17,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 699/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 2.5090774e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:17,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43671 samples/s/p 4:21:49 } +2024-07-25 20:47:20,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 701/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 2.50861e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:20,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43519 samples/s/p 4:21:50 } +2024-07-25 20:47:23,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 703/ 1625], loss: 1.254, per_step_time: 1470ms, lr: 2.5081426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:23,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43957 samples/s/p 4:21:35 } +2024-07-25 20:47:26,500 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 705/ 1625], loss: 1.310, per_step_time: 1471ms, lr: 2.5076748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:26,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43641 samples/s/p 4:21:41 } +2024-07-25 20:47:29,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 707/ 1625], loss: 0.862, per_step_time: 1472ms, lr: 2.5072073e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:29,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43262 samples/s/p 4:21:49 } +2024-07-25 20:47:32,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 709/ 1625], loss: 1.267, per_step_time: 1474ms, lr: 2.5067391e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:32,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.42684 samples/s/p 4:22:03 } +2024-07-25 20:47:35,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 711/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 2.506271e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:35,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43909 samples/s/p 4:21:24 } +2024-07-25 20:47:38,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 713/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.5058027e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:38,310 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.42970 samples/s/p 4:21:49 } +2024-07-25 20:47:41,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 715/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 2.5053341e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:41,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43395 samples/s/p 4:21:33 } +2024-07-25 20:47:44,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 717/ 1625], loss: 1.304, per_step_time: 1471ms, lr: 2.5048654e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:44,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43721 samples/s/p 4:21:21 } +2024-07-25 20:47:47,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 719/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.5043966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:47,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43100 samples/s/p 4:21:36 } +2024-07-25 20:47:50,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 721/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 2.5039275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:50,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43264 samples/s/p 4:21:28 } +2024-07-25 20:47:53,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 723/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 2.5034584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:53,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43195 samples/s/p 4:21:27 } +2024-07-25 20:47:56,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 725/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.5029889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:56,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ 
| 5.42985 samples/s/p 4:21:31 } +2024-07-25 20:47:56,025 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-25 20:48:31,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 727/ 1625], loss: 1.002, per_step_time: 1470ms, lr: 2.5025192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:31,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.44119 samples/s/p 4:20:55 } +2024-07-25 20:48:34,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 729/ 1625], loss: 0.904, per_step_time: 1472ms, lr: 2.5020494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:34,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43458 samples/s/p 4:21:11 } +2024-07-25 20:48:37,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 731/ 1625], loss: 1.289, per_step_time: 1470ms, lr: 2.5015794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:37,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.44099 samples/s/p 4:20:50 } +2024-07-25 20:48:40,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 733/ 1625], loss: 1.201, per_step_time: 1471ms, lr: 2.5011092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:40,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43516 samples/s/p 4:21:03 } +2024-07-25 20:48:42,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 735/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.5006391e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:42,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43596 samples/s/p 4:20:58 } 
+2024-07-25 20:48:45,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 737/ 1625], loss: 1.286, per_step_time: 1471ms, lr: 2.5001686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:45,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43498 samples/s/p 4:20:58 } +2024-07-25 20:48:48,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 739/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 2.4996976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:48,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43646 samples/s/p 4:20:51 } +2024-07-25 20:48:51,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 741/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 2.499227e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:51,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43302 samples/s/p 4:20:58 } +2024-07-25 20:48:54,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 743/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 2.498756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:54,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43994 samples/s/p 4:20:35 } +2024-07-25 20:48:57,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 745/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 2.4982848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:57,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43129 samples/s/p 4:20:57 } +2024-07-25 20:49:00,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 747/ 1625], loss: 1.195, per_step_time: 
1470ms, lr: 2.4978135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:00,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43968 samples/s/p 4:20:30 } +2024-07-25 20:49:03,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 749/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 2.4973418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:03,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43692 samples/s/p 4:20:35 } +2024-07-25 20:49:06,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 751/ 1625], loss: 1.225, per_step_time: 1470ms, lr: 2.4968702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:06,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43870 samples/s/p 4:20:27 } +2024-07-25 20:49:09,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 753/ 1625], loss: 1.045, per_step_time: 1473ms, lr: 2.4963983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:09,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43029 samples/s/p 4:20:48 } +2024-07-25 20:49:12,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 755/ 1625], loss: 0.919, per_step_time: 1471ms, lr: 2.4959261e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:12,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43650 samples/s/p 4:20:27 } +2024-07-25 20:49:15,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 757/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 2.495454e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:15,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
34.7% |█████████████████ | 5.42825 samples/s/p 4:20:48 } +2024-07-25 20:49:18,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 759/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 2.4949815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:18,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.43772 samples/s/p 4:20:18 } +2024-07-25 20:49:21,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 761/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 2.4945093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:21,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.44094 samples/s/p 4:20:06 } +2024-07-25 20:49:24,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 763/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 2.4940364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:25,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.43730 samples/s/p 4:20:13 } +2024-07-25 20:49:28,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 765/ 1625], loss: 1.161, per_step_time: 1468ms, lr: 2.4935633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:28,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.44602 samples/s/p 4:19:45 } +2024-07-25 20:49:30,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 767/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 2.4930905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:30,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.43664 samples/s/p 4:20:09 } +2024-07-25 20:49:33,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 4/ 10], step:[ 769/ 1625], loss: 1.214, per_step_time: 1470ms, lr: 2.4926172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:33,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.44065 samples/s/p 4:19:55 } +2024-07-25 20:49:36,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 771/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 2.4921437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:36,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.43472 samples/s/p 4:20:09 } +2024-07-25 20:49:39,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 773/ 1625], loss: 1.381, per_step_time: 1471ms, lr: 2.49167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:39,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43566 samples/s/p 4:20:03 } +2024-07-25 20:49:42,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 775/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.4911962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:42,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43360 samples/s/p 4:20:06 } +2024-07-25 20:49:45,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 777/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.4907225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:45,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43773 samples/s/p 4:19:51 } +2024-07-25 20:49:48,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 779/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 2.4902482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:48,681 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43371 samples/s/p 4:20:00 } +2024-07-25 20:49:51,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 781/ 1625], loss: 1.067, per_step_time: 1471ms, lr: 2.4897738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:51,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43617 samples/s/p 4:19:50 } +2024-07-25 20:49:54,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 783/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 2.4892994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:54,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43693 samples/s/p 4:19:45 } +2024-07-25 20:49:57,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 785/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 2.4888246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:57,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.44083 samples/s/p 4:19:31 } +2024-07-25 20:50:00,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 787/ 1625], loss: 1.217, per_step_time: 1473ms, lr: 2.4883499e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:00,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43081 samples/s/p 4:19:56 } +2024-07-25 20:50:03,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 789/ 1625], loss: 1.126, per_step_time: 1470ms, lr: 2.4878751e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:03,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.44108 samples/s/p 4:19:24 } +2024-07-25 20:50:06,380 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 791/ 1625], loss: 1.425, per_step_time: 1471ms, lr: 2.4873994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:06,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.43717 samples/s/p 4:19:32 } +2024-07-25 20:50:09,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 793/ 1625], loss: 1.053, per_step_time: 1473ms, lr: 2.4869241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:09,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.42979 samples/s/p 4:19:51 } +2024-07-25 20:50:12,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 795/ 1625], loss: 1.160, per_step_time: 1470ms, lr: 2.486449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:12,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.43878 samples/s/p 4:19:22 } +2024-07-25 20:50:16,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 797/ 1625], loss: 1.012, per_step_time: 1863ms, lr: 2.4859732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:16,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 4.29193 samples/s/p 5:28:36 } +2024-07-25 20:50:18,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 799/ 1625], loss: 1.219, per_step_time: 1469ms, lr: 2.4854971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:18,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.44262 samples/s/p 4:19:05 } +2024-07-25 20:50:21,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 801/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 2.4850215e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:21,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.43589 samples/s/p 4:19:21 } +2024-07-25 20:50:24,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 803/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.484545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:24,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.43349 samples/s/p 4:19:25 } +2024-07-25 20:50:27,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 805/ 1625], loss: 1.381, per_step_time: 1471ms, lr: 2.4840687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:27,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.43616 samples/s/p 4:19:15 } +2024-07-25 20:50:30,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 807/ 1625], loss: 1.324, per_step_time: 1474ms, lr: 2.4835923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:30,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.42599 samples/s/p 4:19:41 } +2024-07-25 20:50:33,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 809/ 1625], loss: 1.281, per_step_time: 1473ms, lr: 2.4831155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:33,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.42949 samples/s/p 4:19:28 } +2024-07-25 20:50:36,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 811/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.4826384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:36,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 
5.42749 samples/s/p 4:19:31 } +2024-07-25 20:50:39,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 813/ 1625], loss: 1.053, per_step_time: 1473ms, lr: 2.4821613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:39,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.42796 samples/s/p 4:19:26 } +2024-07-25 20:50:42,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 815/ 1625], loss: 1.077, per_step_time: 1471ms, lr: 2.4816842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:42,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.43615 samples/s/p 4:19:00 } +2024-07-25 20:50:45,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 817/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 2.4812067e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:45,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.42814 samples/s/p 4:19:20 } +2024-07-25 20:50:48,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 819/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 2.480729e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:48,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.43406 samples/s/p 4:19:00 } +2024-07-25 20:50:51,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 821/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 2.4802514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:51,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43545 samples/s/p 4:18:53 } +2024-07-25 20:50:54,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 823/ 
1625], loss: 1.107, per_step_time: 1471ms, lr: 2.4797733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:54,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43828 samples/s/p 4:18:42 } +2024-07-25 20:50:57,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 825/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.4792951e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:57,347 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43123 samples/s/p 4:18:59 } +2024-07-25 20:51:00,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 827/ 1625], loss: 1.134, per_step_time: 1470ms, lr: 2.478817e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:00,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43941 samples/s/p 4:18:33 } +2024-07-25 20:51:03,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 829/ 1625], loss: 1.320, per_step_time: 1473ms, lr: 2.4783385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:03,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.42920 samples/s/p 4:18:59 } +2024-07-25 20:51:06,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 831/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 2.4778597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:06,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43326 samples/s/p 4:18:45 } +2024-07-25 20:51:09,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 833/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.477381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:09,155 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43252 samples/s/p 4:18:44 } +2024-07-25 20:51:12,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 835/ 1625], loss: 1.034, per_step_time: 1472ms, lr: 2.476902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:12,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43311 samples/s/p 4:18:39 } +2024-07-25 20:51:15,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 837/ 1625], loss: 1.244, per_step_time: 1471ms, lr: 2.476423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:15,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.43657 samples/s/p 4:18:26 } +2024-07-25 20:51:18,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 839/ 1625], loss: 1.308, per_step_time: 1471ms, lr: 2.4759434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:18,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.43743 samples/s/p 4:18:21 } +2024-07-25 20:51:20,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 841/ 1625], loss: 1.088, per_step_time: 1471ms, lr: 2.4754641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:20,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.43572 samples/s/p 4:18:23 } +2024-07-25 20:51:23,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 843/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 2.4749845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:23,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.43536 samples/s/p 4:18:21 } +2024-07-25 20:51:26,869 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 845/ 1625], loss: 1.298, per_step_time: 1473ms, lr: 2.474505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:26,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.42777 samples/s/p 4:18:40 } +2024-07-25 20:51:29,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 847/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 2.4740246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:29,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.43556 samples/s/p 4:18:14 } +2024-07-25 20:51:32,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 849/ 1625], loss: 1.202, per_step_time: 1470ms, lr: 2.4735444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:32,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.44080 samples/s/p 4:17:57 } +2024-07-25 20:51:35,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 851/ 1625], loss: 1.151, per_step_time: 1474ms, lr: 2.4730645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:35,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.42698 samples/s/p 4:18:33 } +2024-07-25 20:51:38,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 853/ 1625], loss: 1.191, per_step_time: 1473ms, lr: 2.472584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:38,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.42973 samples/s/p 4:18:22 } +2024-07-25 20:51:41,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 855/ 1625], loss: 0.942, per_step_time: 1470ms, lr: 2.472103e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:41,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43910 samples/s/p 4:17:53 } +2024-07-25 20:51:44,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 857/ 1625], loss: 1.369, per_step_time: 1470ms, lr: 2.4716222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:44,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43938 samples/s/p 4:17:49 } +2024-07-25 20:51:47,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 859/ 1625], loss: 1.313, per_step_time: 1470ms, lr: 2.4711413e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:47,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43955 samples/s/p 4:17:45 } +2024-07-25 20:51:50,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 861/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 2.47066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:50,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43574 samples/s/p 4:17:53 } +2024-07-25 20:51:53,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 863/ 1625], loss: 1.164, per_step_time: 1472ms, lr: 2.4701789e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:53,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43428 samples/s/p 4:17:55 } +2024-07-25 20:51:56,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 865/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 2.4696972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:56,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 
5.43622 samples/s/p 4:17:46 } +2024-07-25 20:51:59,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 867/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 2.4692155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:59,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43696 samples/s/p 4:17:41 } +2024-07-25 20:52:02,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 869/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 2.4687335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:02,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43558 samples/s/p 4:17:42 } +2024-07-25 20:52:05,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 871/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 2.4682515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:05,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43134 samples/s/p 4:17:51 } +2024-07-25 20:52:08,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 873/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 2.4677693e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:08,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43243 samples/s/p 4:17:45 } +2024-07-25 20:52:11,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 875/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 2.467287e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:11,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43284 samples/s/p 4:17:41 } +2024-07-25 20:52:14,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 877/ 
1625], loss: 1.386, per_step_time: 1473ms, lr: 2.4668043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:14,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43048 samples/s/p 4:17:45 } +2024-07-25 20:52:17,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 879/ 1625], loss: 1.280, per_step_time: 1473ms, lr: 2.4663217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:17,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.42940 samples/s/p 4:17:45 } +2024-07-25 20:52:19,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 881/ 1625], loss: 1.165, per_step_time: 1470ms, lr: 2.4658388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:19,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.44198 samples/s/p 4:17:06 } +2024-07-25 20:52:22,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 883/ 1625], loss: 1.088, per_step_time: 1475ms, lr: 2.4653558e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:22,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.42344 samples/s/p 4:17:56 } +2024-07-25 20:52:25,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 885/ 1625], loss: 1.289, per_step_time: 1471ms, lr: 2.4648729e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:25,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43563 samples/s/p 4:17:18 } +2024-07-25 20:52:28,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 887/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 2.4643892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:28,860 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43271 samples/s/p 4:17:24 } +2024-07-25 20:52:31,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 889/ 1625], loss: 1.345, per_step_time: 1473ms, lr: 2.463906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:31,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.42956 samples/s/p 4:17:30 } +2024-07-25 20:52:34,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 891/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 2.4634222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:34,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43631 samples/s/p 4:17:08 } +2024-07-25 20:52:37,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 893/ 1625], loss: 1.260, per_step_time: 1470ms, lr: 2.4629384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:37,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43939 samples/s/p 4:16:56 } +2024-07-25 20:52:40,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 895/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 2.4624542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:40,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43731 samples/s/p 4:16:59 } +2024-07-25 20:52:43,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 897/ 1625], loss: 1.246, per_step_time: 1473ms, lr: 2.46197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:43,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.42929 samples/s/p 4:17:19 } +2024-07-25 20:52:46,568 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 899/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 2.4614856e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:46,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43498 samples/s/p 4:17:00 } +2024-07-25 20:52:49,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 901/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 2.461001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:49,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43266 samples/s/p 4:17:03 } +2024-07-25 20:52:52,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 903/ 1625], loss: 1.062, per_step_time: 1473ms, lr: 2.4605162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:52,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43043 samples/s/p 4:17:07 } +2024-07-25 20:52:55,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 905/ 1625], loss: 1.334, per_step_time: 1472ms, lr: 2.4600313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:55,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43311 samples/s/p 4:16:56 } +2024-07-25 20:52:58,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 907/ 1625], loss: 1.172, per_step_time: 1483ms, lr: 2.4595463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:58,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.39190 samples/s/p 4:18:51 } +2024-07-25 20:53:01,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 909/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.4590609e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:01,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43588 samples/s/p 4:16:42 } +2024-07-25 20:53:04,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 911/ 1625], loss: 1.374, per_step_time: 1473ms, lr: 2.4585755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:04,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43070 samples/s/p 4:16:54 } +2024-07-25 20:53:07,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 913/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 2.45809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:07,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43355 samples/s/p 4:16:43 } +2024-07-25 20:53:10,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 915/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.4576042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:10,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43614 samples/s/p 4:16:33 } +2024-07-25 20:53:13,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 917/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 2.4571184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:13,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43257 samples/s/p 4:16:40 } +2024-07-25 20:53:16,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 919/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 2.4566321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:16,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 
5.43061 samples/s/p 4:16:43 } +2024-07-25 20:53:19,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 921/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 2.456146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:19,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43401 samples/s/p 4:16:30 } +2024-07-25 20:53:22,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 923/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 2.4556595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:22,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43563 samples/s/p 4:16:22 } +2024-07-25 20:53:24,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 925/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.4551731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:24,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43595 samples/s/p 4:16:19 } +2024-07-25 20:53:27,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 927/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 2.4546864e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:27,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43753 samples/s/p 4:16:11 } +2024-07-25 20:53:30,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 929/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 2.4541992e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:30,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43902 samples/s/p 4:16:04 } +2024-07-25 20:53:33,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 931/ 
1625], loss: 1.181, per_step_time: 1469ms, lr: 2.4537121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:33,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.44230 samples/s/p 4:15:52 } +2024-07-25 20:53:36,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 933/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 2.453225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:36,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43815 samples/s/p 4:16:01 } +2024-07-25 20:53:39,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 935/ 1625], loss: 1.415, per_step_time: 1471ms, lr: 2.4527375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:39,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43510 samples/s/p 4:16:06 } +2024-07-25 20:53:42,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 937/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 2.45225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:42,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43374 samples/s/p 4:16:07 } +2024-07-25 20:53:45,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 939/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.4517623e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:45,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43398 samples/s/p 4:16:04 } +2024-07-25 20:53:48,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 941/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 2.4512745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:48,564 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43671 samples/s/p 4:15:53 } +2024-07-25 20:53:51,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 943/ 1625], loss: 1.144, per_step_time: 1470ms, lr: 2.450786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:51,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43939 samples/s/p 4:15:42 } +2024-07-25 20:53:54,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 945/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 2.4502982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:54,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43289 samples/s/p 4:15:58 } +2024-07-25 20:53:57,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 947/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 2.4498098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:57,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43808 samples/s/p 4:15:40 } +2024-07-25 20:54:00,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 949/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.449321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:00,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43313 samples/s/p 4:15:51 } +2024-07-25 20:54:03,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 951/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 2.4488325e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:03,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43264 samples/s/p 4:15:50 } +2024-07-25 20:54:06,269 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 953/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.4483435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:06,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43522 samples/s/p 4:15:39 } +2024-07-25 20:54:09,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 955/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 2.4478544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:09,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43351 samples/s/p 4:15:41 } +2024-07-25 20:54:12,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 957/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.4473653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:12,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43751 samples/s/p 4:15:27 } +2024-07-25 20:54:15,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 959/ 1625], loss: 1.230, per_step_time: 1470ms, lr: 2.4468758e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:15,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43857 samples/s/p 4:15:21 } +2024-07-25 20:54:18,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 961/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.4463863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:18,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43296 samples/s/p 4:15:34 } +2024-07-25 20:54:21,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 963/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 
2.4458963e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:21,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43119 samples/s/p 4:15:36 } +2024-07-25 20:54:23,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 965/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 2.4454064e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:23,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.42985 samples/s/p 4:15:37 } +2024-07-25 20:54:26,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 967/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 2.4449166e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:26,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.42853 samples/s/p 4:15:38 } +2024-07-25 20:54:29,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 969/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 2.444426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:29,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.43251 samples/s/p 4:15:24 } +2024-07-25 20:54:32,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 971/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 2.443936e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:32,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.43467 samples/s/p 4:15:15 } +2024-07-25 20:54:35,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 973/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 2.4434456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:35,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% 
|█████████████████ | 5.42831 samples/s/p 4:15:29 } +2024-07-25 20:54:38,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 975/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.4429548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:38,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.43767 samples/s/p 4:15:00 } +2024-07-25 20:54:41,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 977/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 2.4424635e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:41,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.44180 samples/s/p 4:14:46 } +2024-07-25 20:54:44,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 979/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 2.4419727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:44,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.43117 samples/s/p 4:15:13 } +2024-07-25 20:54:47,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 981/ 1625], loss: 1.095, per_step_time: 1469ms, lr: 2.4414816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:47,589 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.44339 samples/s/p 4:14:35 } +2024-07-25 20:54:50,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 983/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 2.4409901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:50,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.44009 samples/s/p 4:14:42 } +2024-07-25 20:54:53,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 4/ 10], step:[ 985/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 2.4404984e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:53,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43641 samples/s/p 4:14:49 } +2024-07-25 20:54:56,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 987/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 2.440007e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:56,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43381 samples/s/p 4:14:53 } +2024-07-25 20:54:59,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 989/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.4395149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:59,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43472 samples/s/p 4:14:48 } +2024-07-25 20:55:02,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 991/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.4390229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:02,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43699 samples/s/p 4:14:39 } +2024-07-25 20:55:05,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 993/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.4385306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:05,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43655 samples/s/p 4:14:37 } +2024-07-25 20:55:08,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 995/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 2.4380382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
20:55:08,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43241 samples/s/p 4:14:46 } +2024-07-25 20:55:11,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 997/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 2.4375458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:11,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43339 samples/s/p 4:14:40 } +2024-07-25 20:55:14,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 999/ 1625], loss: 1.207, per_step_time: 1474ms, lr: 2.437053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:14,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.42677 samples/s/p 4:14:56 } +2024-07-25 20:55:17,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1001/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 2.4365601e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:17,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43330 samples/s/p 4:14:34 } +2024-07-25 20:55:20,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1003/ 1625], loss: 0.955, per_step_time: 1471ms, lr: 2.4360672e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:20,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43532 samples/s/p 4:14:26 } +2024-07-25 20:55:23,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1005/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.4355739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:23,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43318 samples/s/p 4:14:29 } 
+2024-07-25 20:55:25,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1007/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 2.4350806e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:25,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43478 samples/s/p 4:14:21 } +2024-07-25 20:55:28,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1009/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.434587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:28,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43111 samples/s/p 4:14:29 } +2024-07-25 20:55:31,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1011/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 2.4340932e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:31,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43946 samples/s/p 4:14:02 } +2024-07-25 20:55:34,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1013/ 1625], loss: 1.297, per_step_time: 1474ms, lr: 2.4335995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:34,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.42674 samples/s/p 4:14:35 } +2024-07-25 20:55:37,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1015/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 2.4331055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:37,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43481 samples/s/p 4:14:09 } +2024-07-25 20:55:40,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1017/ 1625], loss: 1.134, 
per_step_time: 1471ms, lr: 2.4326111e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:40,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43602 samples/s/p 4:14:03 } +2024-07-25 20:55:43,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1019/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 2.432117e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:43,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43221 samples/s/p 4:14:11 } +2024-07-25 20:55:46,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1021/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 2.4316225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:46,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43189 samples/s/p 4:14:09 } +2024-07-25 20:55:49,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1023/ 1625], loss: 1.379, per_step_time: 1470ms, lr: 2.431128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:49,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43921 samples/s/p 4:13:45 } +2024-07-25 20:55:52,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1025/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 2.4306331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:52,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43536 samples/s/p 4:13:53 } +2024-07-25 20:55:55,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1027/ 1625], loss: 1.276, per_step_time: 1472ms, lr: 2.430138e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:55,472 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43343 samples/s/p 4:13:56 } +2024-07-25 20:55:58,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1029/ 1625], loss: 1.533, per_step_time: 1471ms, lr: 2.4296429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:58,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43482 samples/s/p 4:13:49 } +2024-07-25 20:56:01,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1031/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 2.4291478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:01,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43595 samples/s/p 4:13:43 } +2024-07-25 20:56:04,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1033/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 2.428652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:04,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.43541 samples/s/p 4:13:41 } +2024-07-25 20:56:07,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1035/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 2.4281568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:07,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.43833 samples/s/p 4:13:30 } +2024-07-25 20:56:10,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1037/ 1625], loss: 1.027, per_step_time: 1471ms, lr: 2.427661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:10,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.43660 samples/s/p 4:13:32 } +2024-07-25 20:56:13,177 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1039/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 2.4271649e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:13,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.42794 samples/s/p 4:13:53 } +2024-07-25 20:56:16,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1041/ 1625], loss: 1.168, per_step_time: 1473ms, lr: 2.4266688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:16,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.42861 samples/s/p 4:13:48 } +2024-07-25 20:56:19,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1043/ 1625], loss: 1.024, per_step_time: 1471ms, lr: 2.4261724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:19,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.43685 samples/s/p 4:13:22 } +2024-07-25 20:56:22,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1045/ 1625], loss: 1.225, per_step_time: 1470ms, lr: 2.425676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:22,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.43950 samples/s/p 4:13:12 } +2024-07-25 20:56:24,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1047/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 2.4251794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:24,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.42896 samples/s/p 4:13:39 } +2024-07-25 20:56:27,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1049/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 
2.4246825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:27,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43955 samples/s/p 4:13:06 } +2024-07-25 20:56:30,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1051/ 1625], loss: 0.981, per_step_time: 1472ms, lr: 2.4241855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:30,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43225 samples/s/p 4:13:24 } +2024-07-25 20:56:33,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1053/ 1625], loss: 1.028, per_step_time: 1471ms, lr: 2.4236884e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:33,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43581 samples/s/p 4:13:11 } +2024-07-25 20:56:36,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1055/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.4231913e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:36,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43583 samples/s/p 4:13:08 } +2024-07-25 20:56:39,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1057/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 2.422694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:39,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43681 samples/s/p 4:13:02 } +2024-07-25 20:56:42,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1059/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.4221965e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:42,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
36.5% |██████████████████ | 5.43516 samples/s/p 4:13:04 } +2024-07-25 20:56:45,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1061/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 2.421699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:45,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43639 samples/s/p 4:12:57 } +2024-07-25 20:56:48,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1063/ 1625], loss: 1.396, per_step_time: 1471ms, lr: 2.421201e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:48,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43775 samples/s/p 4:12:50 } +2024-07-25 20:56:51,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1065/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 2.4207025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:51,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43247 samples/s/p 4:13:02 } +2024-07-25 20:56:54,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1067/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 2.4202047e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:54,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43285 samples/s/p 4:12:58 } +2024-07-25 20:56:57,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1069/ 1625], loss: 1.090, per_step_time: 1470ms, lr: 2.4197063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:57,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43895 samples/s/p 4:12:38 } +2024-07-25 20:57:00,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 4/ 10], step:[ 1071/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 2.4192077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:00,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43724 samples/s/p 4:12:40 } +2024-07-25 20:57:03,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1073/ 1625], loss: 1.272, per_step_time: 1470ms, lr: 2.418709e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:03,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43921 samples/s/p 4:12:32 } +2024-07-25 20:57:06,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1075/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.4182102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:06,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43400 samples/s/p 4:12:43 } +2024-07-25 20:57:09,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1077/ 1625], loss: 1.091, per_step_time: 1482ms, lr: 2.4177112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:09,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.39512 samples/s/p 4:14:30 } +2024-07-25 20:57:12,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1079/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.417212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:12,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43474 samples/s/p 4:12:35 } +2024-07-25 20:57:15,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1081/ 1625], loss: 1.162, per_step_time: 1470ms, lr: 2.4167124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
20:57:15,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.44122 samples/s/p 4:12:14 } +2024-07-25 20:57:18,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1083/ 1625], loss: 1.202, per_step_time: 1470ms, lr: 2.4162131e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:18,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43952 samples/s/p 4:12:16 } +2024-07-25 20:57:21,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1085/ 1625], loss: 1.123, per_step_time: 1470ms, lr: 2.4157134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:21,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.44186 samples/s/p 4:12:07 } +2024-07-25 20:57:24,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1087/ 1625], loss: 1.035, per_step_time: 1471ms, lr: 2.4152136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:24,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43684 samples/s/p 4:12:18 } +2024-07-25 20:57:26,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1089/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 2.4147135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:26,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43235 samples/s/p 4:12:27 } +2024-07-25 20:57:29,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1091/ 1625], loss: 0.914, per_step_time: 1472ms, lr: 2.4142133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:29,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43241 samples/s/p 4:12:24 } 
+2024-07-25 20:57:32,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1093/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 2.413713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:32,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43297 samples/s/p 4:12:20 } +2024-07-25 20:57:35,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1095/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 2.4132125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:35,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43755 samples/s/p 4:12:04 } +2024-07-25 20:57:38,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1097/ 1625], loss: 1.011, per_step_time: 1471ms, lr: 2.412712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:38,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43529 samples/s/p 4:12:07 } +2024-07-25 20:57:41,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1099/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.4122113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:41,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43321 samples/s/p 4:12:10 } +2024-07-25 20:57:44,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1101/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 2.4117102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:44,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.44038 samples/s/p 4:11:47 } +2024-07-25 20:57:47,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1103/ 1625], loss: 0.950, 
per_step_time: 1471ms, lr: 2.4112092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:47,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43810 samples/s/p 4:11:51 } +2024-07-25 20:57:50,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1105/ 1625], loss: 1.175, per_step_time: 1473ms, lr: 2.410708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:50,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.42999 samples/s/p 4:12:10 } +2024-07-25 20:57:53,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1107/ 1625], loss: 1.089, per_step_time: 1469ms, lr: 2.4102066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:53,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.44230 samples/s/p 4:11:33 } +2024-07-25 20:57:56,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1109/ 1625], loss: 1.166, per_step_time: 1475ms, lr: 2.409705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:56,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.42327 samples/s/p 4:12:23 } +2024-07-25 20:57:59,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1111/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.4092036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:59,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43346 samples/s/p 4:11:52 } +2024-07-25 20:58:02,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1113/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 2.4087014e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:02,377 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43713 samples/s/p 4:11:39 } +2024-07-25 20:58:05,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1115/ 1625], loss: 1.393, per_step_time: 1471ms, lr: 2.4081994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:05,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.43614 samples/s/p 4:11:38 } +2024-07-25 20:58:08,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1117/ 1625], loss: 1.232, per_step_time: 1484ms, lr: 2.4076973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:08,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.39061 samples/s/p 4:13:43 } +2024-07-25 20:58:11,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1119/ 1625], loss: 1.217, per_step_time: 1473ms, lr: 2.407195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:11,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.43056 samples/s/p 4:11:48 } +2024-07-25 20:58:14,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1121/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.4066921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:14,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.43312 samples/s/p 4:11:38 } +2024-07-25 20:58:17,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1123/ 1625], loss: 1.187, per_step_time: 1473ms, lr: 2.40619e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:17,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.43018 samples/s/p 4:11:43 } +2024-07-25 20:58:20,115 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1125/ 1625], loss: 1.255, per_step_time: 1473ms, lr: 2.4056868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:20,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.42891 samples/s/p 4:11:44 } +2024-07-25 20:58:23,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1127/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 2.4051838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:23,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.43582 samples/s/p 4:11:22 } +2024-07-25 20:58:26,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1129/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 2.4046809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:26,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.44139 samples/s/p 4:11:03 } +2024-07-25 20:58:28,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1131/ 1625], loss: 1.193, per_step_time: 1471ms, lr: 2.4041776e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:28,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43675 samples/s/p 4:11:13 } +2024-07-25 20:58:31,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1133/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 2.4036739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:31,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43591 samples/s/p 4:11:13 } +2024-07-25 20:58:34,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1135/ 1625], loss: 1.205, per_step_time: 1469ms, lr: 
2.4031702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:34,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.44268 samples/s/p 4:10:51 } +2024-07-25 20:58:37,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1137/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 2.4026664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:37,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43945 samples/s/p 4:10:57 } +2024-07-25 20:58:40,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1139/ 1625], loss: 1.038, per_step_time: 1470ms, lr: 2.4021625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:40,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43985 samples/s/p 4:10:53 } +2024-07-25 20:58:43,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1141/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 2.4016585e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:43,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43776 samples/s/p 4:10:56 } +2024-07-25 20:58:46,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1143/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.4011542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:46,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43297 samples/s/p 4:11:06 } +2024-07-25 20:58:49,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1145/ 1625], loss: 1.056, per_step_time: 1471ms, lr: 2.40065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:49,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
37.0% |██████████████████ | 5.43808 samples/s/p 4:10:49 } +2024-07-25 20:58:52,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1147/ 1625], loss: 1.273, per_step_time: 1472ms, lr: 2.4001452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:52,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43406 samples/s/p 4:10:57 } +2024-07-25 20:58:55,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1149/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.3996405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:55,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43684 samples/s/p 4:10:46 } +2024-07-25 20:58:58,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1151/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.3991359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:58,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43137 samples/s/p 4:10:59 } +2024-07-25 20:59:01,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1153/ 1625], loss: 1.233, per_step_time: 1470ms, lr: 2.3986307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:01,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.44059 samples/s/p 4:10:30 } +2024-07-25 20:59:04,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1155/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.3981253e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:04,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43355 samples/s/p 4:10:47 } +2024-07-25 20:59:07,316 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 4/ 10], step:[ 1157/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 2.3976201e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:07,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43228 samples/s/p 4:10:47 } +2024-07-25 20:59:10,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1159/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 2.3971146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:10,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43921 samples/s/p 4:10:25 } +2024-07-25 20:59:13,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1161/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.3966091e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:13,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43150 samples/s/p 4:10:44 } +2024-07-25 20:59:16,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1163/ 1625], loss: 0.920, per_step_time: 1473ms, lr: 2.396103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:16,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43082 samples/s/p 4:10:43 } +2024-07-25 20:59:19,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1165/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 2.3955972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:19,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43501 samples/s/p 4:10:28 } +2024-07-25 20:59:22,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1167/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 2.3950912e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 20:59:22,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43767 samples/s/p 4:10:18 } +2024-07-25 20:59:25,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1169/ 1625], loss: 0.966, per_step_time: 1470ms, lr: 2.3945848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:25,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.44117 samples/s/p 4:10:05 } +2024-07-25 20:59:27,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1171/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 2.3940784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:27,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.44081 samples/s/p 4:10:03 } +2024-07-25 20:59:30,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1173/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 2.3935718e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:30,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43740 samples/s/p 4:10:10 } +2024-07-25 20:59:33,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1175/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.393065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:33,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43467 samples/s/p 4:10:14 } +2024-07-25 20:59:36,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1177/ 1625], loss: 1.247, per_step_time: 1470ms, lr: 2.3925579e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43920 samples/s/p 
4:09:59 } +2024-07-25 20:59:39,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1179/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.392051e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:39,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43312 samples/s/p 4:10:13 } +2024-07-25 20:59:42,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1181/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.3915436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:42,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43498 samples/s/p 4:10:05 } +2024-07-25 20:59:45,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1183/ 1625], loss: 1.230, per_step_time: 1473ms, lr: 2.3910365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:45,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.42998 samples/s/p 4:10:15 } +2024-07-25 20:59:48,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1185/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 2.3905288e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:48,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43808 samples/s/p 4:09:50 } +2024-07-25 20:59:51,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1187/ 1625], loss: 1.158, per_step_time: 1470ms, lr: 2.3900211e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:51,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43895 samples/s/p 4:09:45 } +2024-07-25 20:59:54,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1189/ 1625], loss: 
1.161, per_step_time: 1470ms, lr: 2.3895132e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:54,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43980 samples/s/p 4:09:39 } +2024-07-25 20:59:57,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1191/ 1625], loss: 1.297, per_step_time: 1473ms, lr: 2.3890052e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:57,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.42841 samples/s/p 4:10:08 } +2024-07-25 21:00:00,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1193/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 2.3884972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:00,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43593 samples/s/p 4:09:44 } +2024-07-25 21:00:03,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1195/ 1625], loss: 1.229, per_step_time: 1470ms, lr: 2.3879888e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:03,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43866 samples/s/p 4:09:34 } +2024-07-25 21:00:06,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1197/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 2.3874802e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:06,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43585 samples/s/p 4:09:39 } +2024-07-25 21:00:09,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1199/ 1625], loss: 1.037, per_step_time: 1471ms, lr: 2.3869716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:09,278 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43573 samples/s/p 4:09:36 } +2024-07-25 21:00:12,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1201/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 2.3864632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:12,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43214 samples/s/p 4:09:43 } +2024-07-25 21:00:15,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1203/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.3859538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:15,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43677 samples/s/p 4:09:27 } +2024-07-25 21:00:18,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1205/ 1625], loss: 1.304, per_step_time: 1471ms, lr: 2.3854449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:18,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43582 samples/s/p 4:09:27 } +2024-07-25 21:00:21,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1207/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 2.3849358e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:21,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43500 samples/s/p 4:09:26 } +2024-07-25 21:00:24,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1209/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 2.3844266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:24,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43649 samples/s/p 4:09:19 } +2024-07-25 
21:00:26,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1211/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 2.3839166e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:26,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43778 samples/s/p 4:09:13 } +2024-07-25 21:00:29,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1213/ 1625], loss: 1.367, per_step_time: 1472ms, lr: 2.3834073e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:29,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43165 samples/s/p 4:09:27 } +2024-07-25 21:00:32,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1215/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.3828976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:32,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43520 samples/s/p 4:09:14 } +2024-07-25 21:00:35,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1217/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 2.3823872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:35,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43398 samples/s/p 4:09:14 } +2024-07-25 21:00:38,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1219/ 1625], loss: 1.324, per_step_time: 1470ms, lr: 2.3818773e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:38,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.44132 samples/s/p 4:08:51 } +2024-07-25 21:00:41,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1221/ 1625], loss: 1.435, per_step_time: 
1473ms, lr: 2.3813669e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:41,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43077 samples/s/p 4:09:17 } +2024-07-25 21:00:44,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1223/ 1625], loss: 1.302, per_step_time: 1470ms, lr: 2.3808565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:44,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43984 samples/s/p 4:08:49 } +2024-07-25 21:00:47,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1225/ 1625], loss: 1.394, per_step_time: 1472ms, lr: 2.3803459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:47,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43315 samples/s/p 4:09:05 } +2024-07-25 21:00:50,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1227/ 1625], loss: 1.141, per_step_time: 1470ms, lr: 2.3798351e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:50,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.44162 samples/s/p 4:08:39 } +2024-07-25 21:00:53,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1229/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 2.379324e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:53,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43450 samples/s/p 4:08:55 } +2024-07-25 21:00:56,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1231/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.378813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:56,489 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 37.6% |██████████████████ | 5.43524 samples/s/p 4:08:50 } +2024-07-25 21:00:59,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1233/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 2.3783017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:59,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43964 samples/s/p 4:08:35 } +2024-07-25 21:01:02,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1235/ 1625], loss: 1.003, per_step_time: 1470ms, lr: 2.3777904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:02,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43929 samples/s/p 4:08:33 } +2024-07-25 21:01:05,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1237/ 1625], loss: 1.076, per_step_time: 1470ms, lr: 2.3772787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:05,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.44052 samples/s/p 4:08:27 } +2024-07-25 21:01:08,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1239/ 1625], loss: 1.181, per_step_time: 1469ms, lr: 2.3767674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:08,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.44272 samples/s/p 4:08:18 } +2024-07-25 21:01:11,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1241/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.3762554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:11,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43726 samples/s/p 4:08:30 } +2024-07-25 21:01:14,182 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1243/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.3757435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:14,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43520 samples/s/p 4:08:33 } +2024-07-25 21:01:17,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1245/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.3752315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:17,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.43035 samples/s/p 4:08:43 } +2024-07-25 21:01:20,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1247/ 1625], loss: 1.100, per_step_time: 1473ms, lr: 2.374719e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:20,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.42768 samples/s/p 4:08:47 } +2024-07-25 21:01:23,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1249/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.3742066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:23,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.43280 samples/s/p 4:08:30 } +2024-07-25 21:01:25,991 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1251/ 1625], loss: 1.154, per_step_time: 1470ms, lr: 2.373694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:25,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.44134 samples/s/p 4:08:04 } +2024-07-25 21:01:28,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1253/ 1625], loss: 1.289, per_step_time: 1472ms, lr: 
2.3731813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:28,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.43474 samples/s/p 4:08:19 } +2024-07-25 21:01:31,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1255/ 1625], loss: 1.197, per_step_time: 1469ms, lr: 2.3726683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:31,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.44386 samples/s/p 4:07:51 } +2024-07-25 21:01:34,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1257/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 2.3721554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:34,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.43708 samples/s/p 4:08:07 } +2024-07-25 21:01:37,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1259/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.371642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:37,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.43555 samples/s/p 4:08:08 } +2024-07-25 21:01:40,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1261/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 2.3711285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:40,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.43925 samples/s/p 4:07:55 } +2024-07-25 21:01:43,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1263/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 2.3706152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:43,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
37.8% |██████████████████ | 5.43255 samples/s/p 4:08:10 } +2024-07-25 21:01:46,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1265/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 2.3701015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:46,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.43319 samples/s/p 4:08:06 } +2024-07-25 21:01:49,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1267/ 1625], loss: 1.050, per_step_time: 1474ms, lr: 2.3695877e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:49,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.42471 samples/s/p 4:08:26 } +2024-07-25 21:01:52,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1269/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.3690738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:52,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.43463 samples/s/p 4:07:56 } +2024-07-25 21:01:55,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1271/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.3685594e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:55,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.43365 samples/s/p 4:07:56 } +2024-07-25 21:01:58,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1273/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 2.3680452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:58,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.43222 samples/s/p 4:07:57 } +2024-07-25 21:02:01,402 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 4/ 10], step:[ 1275/ 1625], loss: 0.887, per_step_time: 1470ms, lr: 2.3675308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:01,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.44157 samples/s/p 4:07:28 } +2024-07-25 21:02:04,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1277/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 2.3670162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:04,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43021 samples/s/p 4:07:56 } +2024-07-25 21:02:07,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1279/ 1625], loss: 1.189, per_step_time: 1470ms, lr: 2.3665016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:07,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43894 samples/s/p 4:07:29 } +2024-07-25 21:02:10,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1281/ 1625], loss: 1.345, per_step_time: 1471ms, lr: 2.3659866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:10,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43739 samples/s/p 4:07:31 } +2024-07-25 21:02:13,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1283/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 2.3654715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:13,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43310 samples/s/p 4:07:40 } +2024-07-25 21:02:16,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1285/ 1625], loss: 1.160, per_step_time: 1470ms, lr: 2.3649563e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:02:16,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43938 samples/s/p 4:07:19 } +2024-07-25 21:02:19,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1287/ 1625], loss: 1.379, per_step_time: 1472ms, lr: 2.364441e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:19,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43329 samples/s/p 4:07:33 } +2024-07-25 21:02:22,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1289/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 2.3639259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:22,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43615 samples/s/p 4:07:22 } +2024-07-25 21:02:25,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1291/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 2.36341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:25,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43820 samples/s/p 4:07:14 } +2024-07-25 21:02:27,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1293/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 2.3628942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:27,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.43994 samples/s/p 4:07:06 } +2024-07-25 21:02:30,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1295/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.3623785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:30,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.43696 samples/s/p 4:07:11 
} +2024-07-25 21:02:33,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1297/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 2.3618622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:33,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.43428 samples/s/p 4:07:16 } +2024-07-25 21:02:36,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1299/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 2.3613458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:36,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.43410 samples/s/p 4:07:13 } +2024-07-25 21:02:39,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1301/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.3608296e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:39,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.43207 samples/s/p 4:07:16 } +2024-07-25 21:02:42,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1303/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 2.3603132e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:42,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.43339 samples/s/p 4:07:09 } +2024-07-25 21:02:45,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1305/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 2.3597966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:45,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.43235 samples/s/p 4:07:09 } +2024-07-25 21:02:48,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1307/ 1625], loss: 
1.249, per_step_time: 1473ms, lr: 2.3592798e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:48,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.42932 samples/s/p 4:07:15 } +2024-07-25 21:02:51,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1309/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 2.3587627e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:51,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43339 samples/s/p 4:07:00 } +2024-07-25 21:02:54,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1311/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 2.3582457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:54,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43261 samples/s/p 4:07:00 } +2024-07-25 21:02:57,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1313/ 1625], loss: 1.143, per_step_time: 1473ms, lr: 2.3577282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:57,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43069 samples/s/p 4:07:02 } +2024-07-25 21:03:00,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1315/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.3572107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:00,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43697 samples/s/p 4:06:42 } +2024-07-25 21:03:03,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1317/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.3566932e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:03,380 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43382 samples/s/p 4:06:48 } +2024-07-25 21:03:06,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1319/ 1625], loss: 1.265, per_step_time: 1473ms, lr: 2.3561757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:06,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.42951 samples/s/p 4:06:56 } +2024-07-25 21:03:09,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1321/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 2.3556577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:09,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43724 samples/s/p 4:06:32 } +2024-07-25 21:03:12,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1323/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 2.35514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:12,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43402 samples/s/p 4:06:38 } +2024-07-25 21:03:15,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1325/ 1625], loss: 0.985, per_step_time: 1471ms, lr: 2.3546214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:15,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43558 samples/s/p 4:06:31 } +2024-07-25 21:03:18,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1327/ 1625], loss: 1.278, per_step_time: 1474ms, lr: 2.3541032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:18,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.42451 samples/s/p 4:06:58 } +2024-07-25 
21:03:21,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1329/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.353585e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:21,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43345 samples/s/p 4:06:31 } +2024-07-25 21:03:24,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1331/ 1625], loss: 1.386, per_step_time: 1470ms, lr: 2.3530665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:24,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43855 samples/s/p 4:06:14 } +2024-07-25 21:03:26,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1333/ 1625], loss: 1.254, per_step_time: 1470ms, lr: 2.3525474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:26,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43944 samples/s/p 4:06:09 } +2024-07-25 21:03:29,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1335/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.3520286e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:29,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43351 samples/s/p 4:06:22 } +2024-07-25 21:03:32,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1337/ 1625], loss: 1.373, per_step_time: 1471ms, lr: 2.3515096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:32,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43573 samples/s/p 4:06:13 } +2024-07-25 21:03:35,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1339/ 1625], loss: 1.259, 
per_step_time: 1472ms, lr: 2.3509905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:35,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43378 samples/s/p 4:06:15 } +2024-07-25 21:03:38,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1341/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 2.350471e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:38,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43678 samples/s/p 4:06:04 } +2024-07-25 21:03:41,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1343/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 2.3499517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:41,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43623 samples/s/p 4:06:03 } +2024-07-25 21:03:44,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1345/ 1625], loss: 1.059, per_step_time: 1475ms, lr: 2.3494318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:44,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.42358 samples/s/p 4:06:34 } +2024-07-25 21:03:47,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1347/ 1625], loss: 1.173, per_step_time: 1470ms, lr: 2.3489121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:47,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.44021 samples/s/p 4:05:46 } +2024-07-25 21:03:50,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1349/ 1625], loss: 0.962, per_step_time: 1472ms, lr: 2.348392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:50,606 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43157 samples/s/p 4:06:07 } +2024-07-25 21:03:53,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1351/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 2.347872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:53,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43450 samples/s/p 4:05:56 } +2024-07-25 21:03:56,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1353/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 2.3473518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:56,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.44047 samples/s/p 4:05:36 } +2024-07-25 21:03:59,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1355/ 1625], loss: 1.011, per_step_time: 1472ms, lr: 2.3468312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:59,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43239 samples/s/p 4:05:55 } +2024-07-25 21:04:02,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1357/ 1625], loss: 1.483, per_step_time: 1471ms, lr: 2.346311e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:02,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43539 samples/s/p 4:05:44 } +2024-07-25 21:04:05,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1359/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.3457902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:05,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43313 samples/s/p 4:05:48 } +2024-07-25 
21:04:08,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1361/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.3452694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:08,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43638 samples/s/p 4:05:36 } +2024-07-25 21:04:11,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1363/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.3447485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:11,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43595 samples/s/p 4:05:34 } +2024-07-25 21:04:14,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1365/ 1625], loss: 1.111, per_step_time: 1471ms, lr: 2.3442273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:14,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43617 samples/s/p 4:05:30 } +2024-07-25 21:04:17,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1367/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 2.343706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:17,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43111 samples/s/p 4:05:41 } +2024-07-25 21:04:20,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1369/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 2.3431845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:20,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.42846 samples/s/p 4:05:45 } +2024-07-25 21:04:23,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1371/ 1625], loss: 1.124, 
per_step_time: 1472ms, lr: 2.342663e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:23,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43347 samples/s/p 4:05:29 } +2024-07-25 21:04:26,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1373/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.3421413e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:26,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43211 samples/s/p 4:05:30 } +2024-07-25 21:04:28,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1375/ 1625], loss: 1.104, per_step_time: 1474ms, lr: 2.3416194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:28,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.42660 samples/s/p 4:05:42 } +2024-07-25 21:04:31,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1377/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 2.3410974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:31,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.43992 samples/s/p 4:05:03 } +2024-07-25 21:04:34,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1379/ 1625], loss: 1.295, per_step_time: 1474ms, lr: 2.3405755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:34,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.42689 samples/s/p 4:05:35 } +2024-07-25 21:04:37,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1381/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 2.340053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:37,832 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.43912 samples/s/p 4:04:59 } +2024-07-25 21:04:40,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1383/ 1625], loss: 1.077, per_step_time: 1471ms, lr: 2.3395305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:40,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.43488 samples/s/p 4:05:07 } +2024-07-25 21:04:43,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1385/ 1625], loss: 1.235, per_step_time: 1470ms, lr: 2.3390083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:43,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.43931 samples/s/p 4:04:53 } +2024-07-25 21:04:46,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1387/ 1625], loss: 1.106, per_step_time: 1470ms, lr: 2.3384853e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:46,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.44018 samples/s/p 4:04:47 } +2024-07-25 21:04:49,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1389/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 2.3379625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:49,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.43067 samples/s/p 4:05:10 } +2024-07-25 21:04:52,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1391/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 2.3374394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:52,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43701 samples/s/p 4:04:50 } +2024-07-25 
21:04:55,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1393/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.3369164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:55,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43652 samples/s/p 4:04:48 } +2024-07-25 21:04:58,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1395/ 1625], loss: 1.203, per_step_time: 1473ms, lr: 2.336393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:58,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.42998 samples/s/p 4:05:03 } +2024-07-25 21:05:01,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1397/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 2.3358696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:01,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43459 samples/s/p 4:04:48 } +2024-07-25 21:05:04,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1399/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 2.3353461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:04,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43608 samples/s/p 4:04:41 } +2024-07-25 21:05:07,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1401/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.334822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:07,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43105 samples/s/p 4:04:51 } +2024-07-25 21:05:10,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1403/ 1625], loss: 1.254, 
per_step_time: 1474ms, lr: 2.3342984e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:10,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.42680 samples/s/p 4:05:00 } +2024-07-25 21:05:13,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1405/ 1625], loss: 1.307, per_step_time: 1472ms, lr: 2.3337743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:13,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43128 samples/s/p 4:04:45 } +2024-07-25 21:05:16,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1407/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.3332504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:16,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43248 samples/s/p 4:04:39 } +2024-07-25 21:05:19,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1409/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.3327257e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:19,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43162 samples/s/p 4:04:38 } +2024-07-25 21:05:22,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1411/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 2.3322013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:22,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43653 samples/s/p 4:04:22 } +2024-07-25 21:05:25,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1413/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 2.3316768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:25,060 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43246 samples/s/p 4:04:30 } +2024-07-25 21:05:28,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1415/ 1625], loss: 1.025, per_step_time: 1470ms, lr: 2.3311522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:28,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.44178 samples/s/p 4:04:02 } +2024-07-25 21:05:30,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1417/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.3306273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:30,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43251 samples/s/p 4:04:24 } +2024-07-25 21:05:33,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1419/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 2.3301021e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:33,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43980 samples/s/p 4:04:01 } +2024-07-25 21:05:36,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1421/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 2.329577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:36,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43151 samples/s/p 4:04:21 } +2024-07-25 21:05:39,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1423/ 1625], loss: 1.090, per_step_time: 1470ms, lr: 2.3290517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:39,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43902 samples/s/p 4:03:57 } +2024-07-25 
21:05:42,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1425/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 2.3285264e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:42,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43808 samples/s/p 4:03:57 } +2024-07-25 21:05:45,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1427/ 1625], loss: 1.306, per_step_time: 1472ms, lr: 2.3280007e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:45,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43121 samples/s/p 4:04:13 } +2024-07-25 21:05:48,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1429/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 2.3274748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:48,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43420 samples/s/p 4:04:02 } +2024-07-25 21:05:51,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1431/ 1625], loss: 1.180, per_step_time: 1474ms, lr: 2.326949e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:51,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.42479 samples/s/p 4:04:24 } +2024-07-25 21:05:54,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1433/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 2.3264229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:54,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43450 samples/s/p 4:03:55 } +2024-07-25 21:05:57,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1435/ 1625], loss: 1.253, 
per_step_time: 1471ms, lr: 2.3258966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:57,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43708 samples/s/p 4:03:45 } +2024-07-25 21:06:00,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1437/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.3253704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:00,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43190 samples/s/p 4:03:56 } +2024-07-25 21:06:03,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1439/ 1625], loss: 1.168, per_step_time: 1473ms, lr: 2.324844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:03,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43101 samples/s/p 4:03:55 } +2024-07-25 21:06:06,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1441/ 1625], loss: 1.043, per_step_time: 1471ms, lr: 2.324317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:06,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43546 samples/s/p 4:03:41 } +2024-07-25 21:06:09,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1443/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.3237904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:09,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43398 samples/s/p 4:03:42 } +2024-07-25 21:06:12,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1445/ 1625], loss: 1.178, per_step_time: 1474ms, lr: 2.3232637e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:12,287 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.42590 samples/s/p 4:04:00 } +2024-07-25 21:06:15,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1447/ 1625], loss: 1.206, per_step_time: 1472ms, lr: 2.3227365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:15,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43357 samples/s/p 4:03:37 } +2024-07-25 21:06:18,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1449/ 1625], loss: 1.026, per_step_time: 1472ms, lr: 2.3222094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:18,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43380 samples/s/p 4:03:33 } +2024-07-25 21:06:21,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1451/ 1625], loss: 1.352, per_step_time: 1472ms, lr: 2.321682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:21,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43228 samples/s/p 4:03:34 } +2024-07-25 21:06:24,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1453/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 2.3211544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:24,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43348 samples/s/p 4:03:28 } +2024-07-25 21:06:27,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1455/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.3206267e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:27,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43253 samples/s/p 4:03:28 } +2024-07-25 
21:06:29,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1457/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 2.3200992e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:29,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43468 samples/s/p 4:03:19 } +2024-07-25 21:06:32,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1459/ 1625], loss: 1.048, per_step_time: 1473ms, lr: 2.3195713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:32,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43096 samples/s/p 4:03:26 } +2024-07-25 21:06:35,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1461/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.319043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:35,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43648 samples/s/p 4:03:08 } +2024-07-25 21:06:38,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1463/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 2.3185148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:38,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43697 samples/s/p 4:03:04 } +2024-07-25 21:06:41,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1465/ 1625], loss: 1.114, per_step_time: 1469ms, lr: 2.3179866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:41,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.44233 samples/s/p 4:02:47 } +2024-07-25 21:06:44,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1467/ 1625], loss: 1.149, 
per_step_time: 1471ms, lr: 2.317458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:44,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43533 samples/s/p 4:03:03 } +2024-07-25 21:06:47,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1469/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 2.3169294e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:47,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43397 samples/s/p 4:03:03 } +2024-07-25 21:06:50,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1471/ 1625], loss: 1.056, per_step_time: 1471ms, lr: 2.3164008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:50,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43571 samples/s/p 4:02:56 } +2024-07-25 21:06:53,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1473/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.3158722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:53,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43801 samples/s/p 4:02:47 } +2024-07-25 21:06:56,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1475/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.3153427e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:56,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43197 samples/s/p 4:03:00 } +2024-07-25 21:06:59,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1477/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.3148137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:59,506 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43537 samples/s/p 4:02:48 } +2024-07-25 21:07:02,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1479/ 1625], loss: 1.247, per_step_time: 1473ms, lr: 2.3142846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:02,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.42856 samples/s/p 4:03:03 } +2024-07-25 21:07:05,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1481/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 2.313755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:05,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43680 samples/s/p 4:02:38 } +2024-07-25 21:07:08,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1483/ 1625], loss: 0.946, per_step_time: 1470ms, lr: 2.3132252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:08,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43966 samples/s/p 4:02:27 } +2024-07-25 21:07:11,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1485/ 1625], loss: 1.296, per_step_time: 1470ms, lr: 2.3126957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:11,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43851 samples/s/p 4:02:28 } +2024-07-25 21:07:14,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1487/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 2.3121658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:14,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.42945 samples/s/p 4:02:49 } +2024-07-25 
21:07:17,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1489/ 1625], loss: 0.995, per_step_time: 1472ms, lr: 2.3116358e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:17,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43240 samples/s/p 4:02:38 } +2024-07-25 21:07:20,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1491/ 1625], loss: 1.212, per_step_time: 1472ms, lr: 2.3111055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:20,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43329 samples/s/p 4:02:33 } +2024-07-25 21:07:23,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1493/ 1625], loss: 0.977, per_step_time: 1472ms, lr: 2.3105753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:23,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43174 samples/s/p 4:02:34 } +2024-07-25 21:07:26,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1495/ 1625], loss: 1.279, per_step_time: 1470ms, lr: 2.310045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:26,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43858 samples/s/p 4:02:13 } +2024-07-25 21:07:29,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1497/ 1625], loss: 0.863, per_step_time: 1473ms, lr: 2.3095143e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:29,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.42837 samples/s/p 4:02:37 } +2024-07-25 21:07:31,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1499/ 1625], loss: 1.197, 
per_step_time: 1471ms, lr: 2.3089835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:31,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43550 samples/s/p 4:02:15 } +2024-07-25 21:07:34,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1501/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.3084529e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:34,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43573 samples/s/p 4:02:11 } +2024-07-25 21:07:37,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1503/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.307922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:37,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43594 samples/s/p 4:02:08 } +2024-07-25 21:07:40,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1505/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 2.3073904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:40,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43430 samples/s/p 4:02:09 } +2024-07-25 21:07:43,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1507/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 2.3068595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:43,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43749 samples/s/p 4:01:58 } +2024-07-25 21:07:46,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1509/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 2.306328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:46,729 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43122 samples/s/p 4:02:12 } +2024-07-25 21:07:49,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1511/ 1625], loss: 1.307, per_step_time: 1471ms, lr: 2.3057966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:49,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43796 samples/s/p 4:01:51 } +2024-07-25 21:07:52,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1513/ 1625], loss: 1.062, per_step_time: 1473ms, lr: 2.3052648e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:52,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.42979 samples/s/p 4:02:10 } +2024-07-25 21:07:55,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1515/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 2.3047329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:55,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43232 samples/s/p 4:02:00 } +2024-07-25 21:07:58,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1517/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.3042008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:58,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43315 samples/s/p 4:01:55 } +2024-07-25 21:08:01,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1519/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.3036688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:01,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43180 samples/s/p 4:01:56 } +2024-07-25 
21:08:04,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1521/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.3031364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:04,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43793 samples/s/p 4:01:36 } +2024-07-25 21:08:07,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1523/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 2.302604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:07,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43852 samples/s/p 4:01:32 } +2024-07-25 21:08:10,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1525/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.3020715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:10,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43809 samples/s/p 4:01:30 } +2024-07-25 21:08:13,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1527/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 2.301539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:13,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43703 samples/s/p 4:01:30 } +2024-07-25 21:08:16,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1529/ 1625], loss: 1.072, per_step_time: 1473ms, lr: 2.301006e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:16,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.42993 samples/s/p 4:01:46 } +2024-07-25 21:08:19,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1531/ 1625], loss: 1.217, 
per_step_time: 1471ms, lr: 2.300473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:19,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43495 samples/s/p 4:01:29 } +2024-07-25 21:08:22,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1533/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 2.29994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:22,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43153 samples/s/p 4:01:36 } +2024-07-25 21:08:25,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1535/ 1625], loss: 1.288, per_step_time: 1472ms, lr: 2.2994067e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:25,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43478 samples/s/p 4:01:24 } +2024-07-25 21:08:28,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1537/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 2.2988734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:28,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43809 samples/s/p 4:01:12 } +2024-07-25 21:08:30,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1539/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 2.2983397e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:30,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43690 samples/s/p 4:01:12 } +2024-07-25 21:08:33,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1541/ 1625], loss: 1.210, per_step_time: 1474ms, lr: 2.2978062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:33,952 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.42695 samples/s/p 4:01:36 } +2024-07-25 21:08:36,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1543/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 2.2972723e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:36,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43129 samples/s/p 4:01:22 } +2024-07-25 21:08:39,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1545/ 1625], loss: 1.297, per_step_time: 1472ms, lr: 2.2967384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:39,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43379 samples/s/p 4:01:12 } +2024-07-25 21:08:42,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1547/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 2.2962042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:42,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43818 samples/s/p 4:00:57 } +2024-07-25 21:08:45,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1549/ 1625], loss: 1.301, per_step_time: 1471ms, lr: 2.2956701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:45,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43618 samples/s/p 4:01:00 } +2024-07-25 21:08:48,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1551/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 2.2951357e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:48,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43781 samples/s/p 4:00:52 } +2024-07-25 
21:08:51,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1553/ 1625], loss: 1.106, per_step_time: 1474ms, lr: 2.2946011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:51,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.42583 samples/s/p 4:01:21 } +2024-07-25 21:08:54,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1555/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 2.2940667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:54,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43554 samples/s/p 4:00:53 } +2024-07-25 21:08:57,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1557/ 1625], loss: 1.210, per_step_time: 1471ms, lr: 2.2935319e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:57,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43648 samples/s/p 4:00:47 } +2024-07-25 21:09:00,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1559/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 2.2929971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:00,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43480 samples/s/p 4:00:49 } +2024-07-25 21:09:03,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1561/ 1625], loss: 1.404, per_step_time: 1473ms, lr: 2.292462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:03,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.42917 samples/s/p 4:01:01 } +2024-07-25 21:09:06,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1563/ 1625], loss: 1.004, 
per_step_time: 1472ms, lr: 2.2919272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:06,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43384 samples/s/p 4:00:45 } +2024-07-25 21:09:09,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1565/ 1625], loss: 1.079, per_step_time: 1471ms, lr: 2.2913915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:09,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43520 samples/s/p 4:00:39 } +2024-07-25 21:09:12,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1567/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 2.2908564e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:12,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43484 samples/s/p 4:00:37 } +2024-07-25 21:09:15,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1569/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 2.2903208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:15,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43192 samples/s/p 4:00:42 } +2024-07-25 21:09:18,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1571/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 2.2897852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:18,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43215 samples/s/p 4:00:38 } +2024-07-25 21:09:21,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1573/ 1625], loss: 1.202, per_step_time: 1472ms, lr: 2.2892493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:21,179 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43238 samples/s/p 4:00:34 } +2024-07-25 21:09:24,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1575/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 2.288713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:24,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43767 samples/s/p 4:00:17 } +2024-07-25 21:09:27,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1577/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.2881772e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:27,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43615 samples/s/p 4:00:19 } +2024-07-25 21:09:30,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1579/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 2.2876407e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:30,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43215 samples/s/p 4:00:26 } +2024-07-25 21:09:32,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1581/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 2.2871045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:32,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43060 samples/s/p 4:00:27 } +2024-07-25 21:09:35,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1583/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 2.286568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:35,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43415 samples/s/p 4:00:15 } +2024-07-25 
21:09:38,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1585/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.2860315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:38,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43560 samples/s/p 4:00:08 } +2024-07-25 21:09:41,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1587/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 2.2854943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:41,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43650 samples/s/p 4:00:03 } +2024-07-25 21:09:44,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1589/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.2849577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:44,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43006 samples/s/p 4:00:17 } +2024-07-25 21:09:47,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1591/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.2844208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:47,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43722 samples/s/p 3:59:55 } +2024-07-25 21:09:50,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1593/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.2838836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:50,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43580 samples/s/p 3:59:56 } +2024-07-25 21:09:53,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1595/ 1625], loss: 1.215, 
per_step_time: 1470ms, lr: 2.283346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:53,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.44095 samples/s/p 3:59:39 } +2024-07-25 21:09:56,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1597/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.2828086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:56,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43559 samples/s/p 3:59:51 } +2024-07-25 21:09:59,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1599/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 2.282271e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:59,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.44056 samples/s/p 3:59:34 } +2024-07-25 21:10:02,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1601/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 2.2817332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:02,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43719 samples/s/p 3:59:40 } +2024-07-25 21:10:05,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1603/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.2811953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:05,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43695 samples/s/p 3:59:38 } +2024-07-25 21:10:08,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1605/ 1625], loss: 1.096, per_step_time: 1470ms, lr: 2.2806575e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:08,387 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43892 samples/s/p 3:59:30 } +2024-07-25 21:10:11,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1607/ 1625], loss: 1.006, per_step_time: 1472ms, lr: 2.2801192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:11,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43283 samples/s/p 3:59:43 } +2024-07-25 21:10:14,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1609/ 1625], loss: 1.211, per_step_time: 1470ms, lr: 2.279581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:14,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.44035 samples/s/p 3:59:20 } +2024-07-25 21:10:17,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1611/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 2.2790426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:17,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43366 samples/s/p 3:59:35 } +2024-07-25 21:10:20,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1613/ 1625], loss: 1.236, per_step_time: 1476ms, lr: 2.278504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:20,200 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.41872 samples/s/p 4:00:12 } +2024-07-25 21:10:23,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1615/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.2779652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:23,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43839 samples/s/p 3:59:17 } +2024-07-25 
21:10:26,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1617/ 1625], loss: 0.985, per_step_time: 1471ms, lr: 2.2774264e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:26,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.43500 samples/s/p 3:59:23 } +2024-07-25 21:10:29,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1619/ 1625], loss: 1.268, per_step_time: 1470ms, lr: 2.2768874e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:29,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.43962 samples/s/p 3:59:08 } +2024-07-25 21:10:32,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1621/ 1625], loss: 1.014, per_step_time: 1470ms, lr: 2.2763483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:32,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.44100 samples/s/p 3:59:01 } +2024-07-25 21:10:34,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1623/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 2.2758091e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:34,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.43558 samples/s/p 3:59:12 } +2024-07-25 21:10:37,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1625/ 1625], loss: 1.401, per_step_time: 1471ms, lr: 2.2752696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:37,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.43747 samples/s/p 3:59:04 } +2024-07-25 21:10:40,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 2/ 1625], loss: 1.101, 
per_step_time: 1471ms, lr: 2.2747303e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:40,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.43505 samples/s/p 3:59:08 } +2024-07-25 21:10:43,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 4/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 2.2741906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:43,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.43179 samples/s/p 3:59:14 } +2024-07-25 21:10:46,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 6/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.2736509e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:46,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.43234 samples/s/p 3:59:09 } +2024-07-25 21:10:49,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 8/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 2.2731108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:49,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.43649 samples/s/p 3:58:55 } +2024-07-25 21:10:52,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 10/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.2725708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:52,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.43822 samples/s/p 3:58:48 } +2024-07-25 21:10:55,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 12/ 1625], loss: 1.227, per_step_time: 1478ms, lr: 2.2720307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:55,621 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.41223 samples/s/p 3:59:54 } +2024-07-25 21:10:58,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 14/ 1625], loss: 1.080, per_step_time: 1472ms, lr: 2.2714903e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:58,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.43476 samples/s/p 3:58:51 } +2024-07-25 21:11:01,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 16/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 2.27095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:01,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.42944 samples/s/p 3:59:02 } +2024-07-25 21:11:04,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 18/ 1625], loss: 1.031, per_step_time: 1471ms, lr: 2.2704093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:04,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.43550 samples/s/p 3:58:43 } +2024-07-25 21:11:07,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 20/ 1625], loss: 1.209, per_step_time: 1473ms, lr: 2.2698687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:07,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.42883 samples/s/p 3:58:58 } +2024-07-25 21:11:10,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 22/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 2.2693279e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:10,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.43963 samples/s/p 3:58:26 } +2024-07-25 
21:11:13,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 24/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 2.268787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:13,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.43274 samples/s/p 3:58:42 } +2024-07-25 21:11:16,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 26/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 2.2682461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:16,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.44215 samples/s/p 3:58:14 } +2024-07-25 21:11:19,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 28/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 2.2677044e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:19,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43550 samples/s/p 3:58:28 } +2024-07-25 21:11:22,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 30/ 1625], loss: 1.344, per_step_time: 1474ms, lr: 2.2671631e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:22,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.42671 samples/s/p 3:58:49 } +2024-07-25 21:11:25,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 32/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.2666221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:25,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43343 samples/s/p 3:58:28 } +2024-07-25 21:11:28,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 34/ 1625], loss: 1.310, per_step_time: 
1472ms, lr: 2.2660804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:28,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43160 samples/s/p 3:58:30 } +2024-07-25 21:11:31,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 36/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.2655384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:31,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43597 samples/s/p 3:58:15 } +2024-07-25 21:11:33,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 38/ 1625], loss: 1.247, per_step_time: 1473ms, lr: 2.2649967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:33,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.42991 samples/s/p 3:58:28 } +2024-07-25 21:11:36,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 40/ 1625], loss: 1.410, per_step_time: 1471ms, lr: 2.2644546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:36,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43790 samples/s/p 3:58:04 } +2024-07-25 21:11:39,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 42/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.2639124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:39,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43665 samples/s/p 3:58:05 } +2024-07-25 21:11:42,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 44/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 2.2633702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:42,843 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43892 samples/s/p 3:57:56 } +2024-07-25 21:11:45,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 46/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 2.2628277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:45,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43957 samples/s/p 3:57:51 } +2024-07-25 21:11:48,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 48/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 2.2622855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:48,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43610 samples/s/p 3:57:57 } +2024-07-25 21:11:51,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 50/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.2617425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:51,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.42744 samples/s/p 3:58:17 } +2024-07-25 21:11:54,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 52/ 1625], loss: 1.160, per_step_time: 1474ms, lr: 2.2611997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:54,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.42716 samples/s/p 3:58:15 } +2024-07-25 21:11:57,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 54/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.2606571e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:57,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43717 samples/s/p 3:57:46 } +2024-07-25 
21:12:00,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 56/ 1625], loss: 1.319, per_step_time: 1472ms, lr: 2.260114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:00,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43471 samples/s/p 3:57:49 } +2024-07-25 21:12:03,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 58/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 2.2595706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:03,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43608 samples/s/p 3:57:43 } +2024-07-25 21:12:06,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 60/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.2590275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:06,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43367 samples/s/p 3:57:46 } +2024-07-25 21:12:09,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 62/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.258484e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:09,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43411 samples/s/p 3:57:42 } +2024-07-25 21:12:12,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 64/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 2.2579403e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:12,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43646 samples/s/p 3:57:33 } +2024-07-25 21:12:15,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 66/ 1625], loss: 1.032, per_step_time: 
1470ms, lr: 2.2573966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:15,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43895 samples/s/p 3:57:23 } +2024-07-25 21:12:18,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 68/ 1625], loss: 1.121, per_step_time: 1477ms, lr: 2.2568527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:18,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.41557 samples/s/p 3:58:22 } +2024-07-25 21:12:21,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 70/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.2563088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:21,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43510 samples/s/p 3:57:28 } +2024-07-25 21:12:24,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 72/ 1625], loss: 1.486, per_step_time: 1472ms, lr: 2.2557646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:24,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43389 samples/s/p 3:57:28 } +2024-07-25 21:12:27,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 74/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 2.2552204e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:27,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43152 samples/s/p 3:57:31 } +2024-07-25 21:12:30,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 76/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 2.254676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:30,074 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43577 samples/s/p 3:57:17 } +2024-07-25 21:12:33,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 78/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.2541315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:33,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43715 samples/s/p 3:57:10 } +2024-07-25 21:12:35,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 80/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.2535869e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:35,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43133 samples/s/p 3:57:23 } +2024-07-25 21:12:38,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 82/ 1625], loss: 1.286, per_step_time: 1471ms, lr: 2.2530421e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:38,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43533 samples/s/p 3:57:09 } +2024-07-25 21:12:41,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 84/ 1625], loss: 0.951, per_step_time: 1472ms, lr: 2.2524971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:41,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43363 samples/s/p 3:57:11 } +2024-07-25 21:12:44,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 86/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 2.2519522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:44,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43373 samples/s/p 3:57:08 } +2024-07-25 
21:12:47,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 88/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 2.251407e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:47,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.42805 samples/s/p 3:57:20 } +2024-07-25 21:12:50,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 90/ 1625], loss: 1.149, per_step_time: 1474ms, lr: 2.2508617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:50,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.42459 samples/s/p 3:57:26 } +2024-07-25 21:12:53,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 92/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 2.2503164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:53,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43944 samples/s/p 3:56:44 } +2024-07-25 21:12:56,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 94/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 2.2497707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:56,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43440 samples/s/p 3:56:54 } +2024-07-25 21:12:59,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 96/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.2492251e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:59,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43591 samples/s/p 3:56:47 } +2024-07-25 21:13:02,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 98/ 1625], loss: 1.096, per_step_time: 
1471ms, lr: 2.2486793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:02,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43634 samples/s/p 3:56:43 } +2024-07-25 21:13:05,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 100/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 2.2481334e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:05,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43545 samples/s/p 3:56:43 } +2024-07-25 21:13:08,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 102/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.2475871e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:08,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43586 samples/s/p 3:56:39 } +2024-07-25 21:13:11,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 104/ 1625], loss: 1.066, per_step_time: 1469ms, lr: 2.247041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:11,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.44234 samples/s/p 3:56:19 } +2024-07-25 21:13:14,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 106/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.2464947e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:14,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43842 samples/s/p 3:56:26 } +2024-07-25 21:13:17,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 108/ 1625], loss: 1.106, per_step_time: 1469ms, lr: 2.245948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:17,287 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.44236 samples/s/p 3:56:13 } +2024-07-25 21:13:20,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 110/ 1625], loss: 1.275, per_step_time: 1473ms, lr: 2.2454016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:20,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43017 samples/s/p 3:56:42 } +2024-07-25 21:13:23,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 112/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.2448548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:23,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43809 samples/s/p 3:56:18 } +2024-07-25 21:13:26,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 114/ 1625], loss: 0.954, per_step_time: 1470ms, lr: 2.244308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:26,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43887 samples/s/p 3:56:13 } +2024-07-25 21:13:29,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 116/ 1625], loss: 1.193, per_step_time: 1473ms, lr: 2.2437613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:29,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.42976 samples/s/p 3:56:34 } +2024-07-25 21:13:32,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 118/ 1625], loss: 1.276, per_step_time: 1472ms, lr: 2.243214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:32,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43203 samples/s/p 3:56:25 } +2024-07-25 
21:13:34,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 120/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 2.242667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:34,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43251 samples/s/p 3:56:21 } +2024-07-25 21:13:37,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 122/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 2.2421198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:37,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43337 samples/s/p 3:56:16 } +2024-07-25 21:13:40,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 124/ 1625], loss: 1.312, per_step_time: 1471ms, lr: 2.2415721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:40,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43803 samples/s/p 3:56:01 } +2024-07-25 21:13:43,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 126/ 1625], loss: 1.092, per_step_time: 1473ms, lr: 2.2410246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:43,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.42915 samples/s/p 3:56:21 } +2024-07-25 21:13:46,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 128/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.2404767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:46,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43350 samples/s/p 3:56:06 } +2024-07-25 21:13:49,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 130/ 1625], loss: 1.086, 
per_step_time: 1473ms, lr: 2.239929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:49,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.42793 samples/s/p 3:56:18 } +2024-07-25 21:13:52,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 132/ 1625], loss: 1.271, per_step_time: 1470ms, lr: 2.2393811e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:52,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.44047 samples/s/p 3:55:42 } +2024-07-25 21:13:55,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 134/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.2388327e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:55,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43650 samples/s/p 3:55:50 } +2024-07-25 21:13:58,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 136/ 1625], loss: 1.397, per_step_time: 1472ms, lr: 2.2382847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:58,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43240 samples/s/p 3:55:58 } +2024-07-25 21:14:01,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 138/ 1625], loss: 1.244, per_step_time: 1471ms, lr: 2.2377366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:01,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43762 samples/s/p 3:55:41 } +2024-07-25 21:14:04,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 140/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 2.2371878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:04,509 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.44057 samples/s/p 3:55:30 } +2024-07-25 21:14:07,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 142/ 1625], loss: 1.356, per_step_time: 1473ms, lr: 2.2366394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:07,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43088 samples/s/p 3:55:53 } +2024-07-25 21:14:10,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 144/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.2360906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:10,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43339 samples/s/p 3:55:43 } +2024-07-25 21:14:13,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 146/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 2.2355418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:13,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43576 samples/s/p 3:55:34 } +2024-07-25 21:14:16,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 148/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 2.2349928e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:16,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43536 samples/s/p 3:55:32 } +2024-07-25 21:14:19,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 150/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.2344437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:19,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43713 samples/s/p 3:55:25 } +2024-07-25 
21:14:22,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 152/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.2338943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:22,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43221 samples/s/p 3:55:34 } +2024-07-25 21:14:25,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 154/ 1625], loss: 1.081, per_step_time: 1470ms, lr: 2.233345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:25,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43861 samples/s/p 3:55:15 } +2024-07-25 21:14:28,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 156/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.2327955e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:28,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43338 samples/s/p 3:55:26 } +2024-07-25 21:14:31,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 158/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 2.232246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:31,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.42855 samples/s/p 3:55:35 } +2024-07-25 21:14:34,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 160/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 2.2316963e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:34,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43580 samples/s/p 3:55:13 } +2024-07-25 21:14:36,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 162/ 1625], loss: 1.231, 
per_step_time: 1472ms, lr: 2.2311464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:36,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43328 samples/s/p 3:55:17 } +2024-07-25 21:14:39,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 164/ 1625], loss: 1.055, per_step_time: 1469ms, lr: 2.2305963e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:39,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.44345 samples/s/p 3:54:48 } +2024-07-25 21:14:42,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 166/ 1625], loss: 1.024, per_step_time: 1472ms, lr: 2.230046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:42,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43296 samples/s/p 3:55:12 } +2024-07-25 21:14:45,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 168/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 2.229496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:45,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43045 samples/s/p 3:55:15 } +2024-07-25 21:14:48,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 170/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.2289454e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:48,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43687 samples/s/p 3:54:56 } +2024-07-25 21:14:51,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 172/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 2.2283948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:51,731 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.43018 samples/s/p 3:55:10 } +2024-07-25 21:14:54,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 174/ 1625], loss: 1.076, per_step_time: 1470ms, lr: 2.2278444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:54,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.44052 samples/s/p 3:54:41 } +2024-07-25 21:14:57,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 176/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 2.2272936e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:57,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.43394 samples/s/p 3:54:55 } +2024-07-25 21:15:00,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 178/ 1625], loss: 1.280, per_step_time: 1471ms, lr: 2.2267428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:00,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.43565 samples/s/p 3:54:47 } +2024-07-25 21:15:03,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 180/ 1625], loss: 1.200, per_step_time: 1469ms, lr: 2.2261916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:03,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.44267 samples/s/p 3:54:26 } +2024-07-25 21:15:06,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 182/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.2256405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:06,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.43729 samples/s/p 3:54:37 } +2024-07-25 
21:15:09,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 184/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 2.2250892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:09,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.43342 samples/s/p 3:54:44 } +2024-07-25 21:15:12,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 186/ 1625], loss: 1.024, per_step_time: 1469ms, lr: 2.2245378e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:12,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.44218 samples/s/p 3:54:19 } +2024-07-25 21:15:15,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 188/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 2.2239865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:15,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43726 samples/s/p 3:54:28 } +2024-07-25 21:15:18,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 190/ 1625], loss: 1.009, per_step_time: 1469ms, lr: 2.2234346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:18,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.44316 samples/s/p 3:54:10 } +2024-07-25 21:15:21,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 192/ 1625], loss: 1.009, per_step_time: 1471ms, lr: 2.2228829e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:21,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43588 samples/s/p 3:54:26 } +2024-07-25 21:15:24,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 194/ 1625], loss: 1.187, 
per_step_time: 1472ms, lr: 2.222331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:24,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43208 samples/s/p 3:54:33 } +2024-07-25 21:15:27,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 196/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.2217791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:27,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43314 samples/s/p 3:54:27 } +2024-07-25 21:15:30,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 198/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 2.2212269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:30,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43736 samples/s/p 3:54:13 } +2024-07-25 21:15:33,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 200/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 2.2206747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:33,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43468 samples/s/p 3:54:17 } +2024-07-25 21:15:35,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 202/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.2201222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:35,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43231 samples/s/p 3:54:21 } +2024-07-25 21:15:38,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 204/ 1625], loss: 1.290, per_step_time: 1473ms, lr: 2.21957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:38,936 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43037 samples/s/p 3:54:23 } +2024-07-25 21:15:41,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 206/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 2.2190172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:41,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.44202 samples/s/p 3:53:50 } +2024-07-25 21:15:44,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 208/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 2.2184644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:44,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43271 samples/s/p 3:54:11 } +2024-07-25 21:15:47,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 210/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 2.2179118e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:47,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43291 samples/s/p 3:54:07 } +2024-07-25 21:15:50,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 212/ 1625], loss: 1.039, per_step_time: 1471ms, lr: 2.2173588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:50,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43636 samples/s/p 3:53:55 } +2024-07-25 21:15:53,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 214/ 1625], loss: 1.273, per_step_time: 1473ms, lr: 2.2168053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:53,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.42951 samples/s/p 3:54:10 } +2024-07-25 
21:15:56,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 216/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.2162525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:56,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43498 samples/s/p 3:53:53 } +2024-07-25 21:15:59,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 218/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 2.2156992e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:59,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43616 samples/s/p 3:53:47 } +2024-07-25 21:16:02,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 220/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 2.2151457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:02,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43774 samples/s/p 3:53:40 } +2024-07-25 21:16:05,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 222/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.214592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:05,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43614 samples/s/p 3:53:41 } +2024-07-25 21:16:08,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 224/ 1625], loss: 0.893, per_step_time: 1471ms, lr: 2.2140382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:08,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43681 samples/s/p 3:53:37 } +2024-07-25 21:16:11,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 226/ 1625], loss: 1.085, 
per_step_time: 1470ms, lr: 2.2134847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:11,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43997 samples/s/p 3:53:25 } +2024-07-25 21:16:14,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 228/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.2129307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:14,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43423 samples/s/p 3:53:37 } +2024-07-25 21:16:17,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 230/ 1625], loss: 0.865, per_step_time: 1471ms, lr: 2.2123762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:17,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43534 samples/s/p 3:53:31 } +2024-07-25 21:16:20,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 232/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 2.2118224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:20,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43273 samples/s/p 3:53:35 } +2024-07-25 21:16:23,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 234/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 2.211268e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:23,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43299 samples/s/p 3:53:32 } +2024-07-25 21:16:26,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 236/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 2.2107135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:26,149 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43368 samples/s/p 3:53:27 } +2024-07-25 21:16:29,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 238/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.210159e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:29,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43680 samples/s/p 3:53:16 } +2024-07-25 21:16:32,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 240/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 2.2096043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:32,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43627 samples/s/p 3:53:14 } +2024-07-25 21:16:34,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 242/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 2.2090495e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:35,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43637 samples/s/p 3:53:11 } +2024-07-25 21:16:37,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 244/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.2084943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:37,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43774 samples/s/p 3:53:05 } +2024-07-25 21:16:40,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 246/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.2079394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:40,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43497 samples/s/p 3:53:09 } +2024-07-25 
21:16:43,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 248/ 1625], loss: 1.072, per_step_time: 1472ms, lr: 2.2073842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:43,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43300 samples/s/p 3:53:11 } +2024-07-25 21:16:46,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 250/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 2.2068289e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:46,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43568 samples/s/p 3:53:01 } +2024-07-25 21:16:49,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 252/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 2.2062733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:49,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43898 samples/s/p 3:52:50 } +2024-07-25 21:16:52,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 254/ 1625], loss: 1.130, per_step_time: 1473ms, lr: 2.2057178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:52,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.42994 samples/s/p 3:53:10 } +2024-07-25 21:16:55,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 256/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 2.2051621e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:55,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43252 samples/s/p 3:53:00 } +2024-07-25 21:16:58,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 258/ 1625], loss: 1.149, 
per_step_time: 1473ms, lr: 2.2046064e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:58,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.42902 samples/s/p 3:53:07 } +2024-07-25 21:17:01,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 260/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.2040504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:01,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43599 samples/s/p 3:52:46 } +2024-07-25 21:17:04,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 262/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 2.2034943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:04,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43407 samples/s/p 3:52:48 } +2024-07-25 21:17:07,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 264/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 2.2029382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:07,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43044 samples/s/p 3:52:54 } +2024-07-25 21:17:10,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 266/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 2.2023818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:10,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43257 samples/s/p 3:52:46 } +2024-07-25 21:17:13,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 268/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 2.2018256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:13,368 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.44108 samples/s/p 3:52:21 } +2024-07-25 21:17:16,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 270/ 1625], loss: 1.085, per_step_time: 1473ms, lr: 2.201269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:16,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.42992 samples/s/p 3:52:47 } +2024-07-25 21:17:19,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 272/ 1625], loss: 1.076, per_step_time: 1470ms, lr: 2.2007122e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:19,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43982 samples/s/p 3:52:18 } +2024-07-25 21:17:22,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 274/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 2.2001554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:22,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43816 samples/s/p 3:52:20 } +2024-07-25 21:17:25,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 276/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 2.1995987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:25,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.44145 samples/s/p 3:52:08 } +2024-07-25 21:17:28,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 278/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 2.1990416e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:28,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43683 samples/s/p 3:52:17 } +2024-07-25 
21:17:31,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 280/ 1625], loss: 1.223, per_step_time: 1470ms, lr: 2.1984844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:31,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.44182 samples/s/p 3:52:01 } +2024-07-25 21:17:34,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 282/ 1625], loss: 1.264, per_step_time: 1472ms, lr: 2.1979271e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:34,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43162 samples/s/p 3:52:25 } +2024-07-25 21:17:36,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 284/ 1625], loss: 1.397, per_step_time: 1470ms, lr: 2.19737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:36,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43897 samples/s/p 3:52:03 } +2024-07-25 21:17:39,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 286/ 1625], loss: 1.279, per_step_time: 1474ms, lr: 2.1968124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:39,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.42389 samples/s/p 3:52:38 } +2024-07-25 21:17:42,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 288/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 2.1962549e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:42,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43136 samples/s/p 3:52:16 } +2024-07-25 21:17:45,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 290/ 1625], loss: 1.272, 
per_step_time: 1471ms, lr: 2.195697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:45,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43786 samples/s/p 3:51:57 } +2024-07-25 21:17:48,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 292/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 2.1951395e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:48,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43825 samples/s/p 3:51:53 } +2024-07-25 21:17:51,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 294/ 1625], loss: 1.277, per_step_time: 1472ms, lr: 2.1945816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:51,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43280 samples/s/p 3:52:04 } +2024-07-25 21:17:54,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 296/ 1625], loss: 1.111, per_step_time: 1473ms, lr: 2.1940232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:54,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.42812 samples/s/p 3:52:13 } +2024-07-25 21:17:57,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 298/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 2.1934653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:57,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43662 samples/s/p 3:51:48 } +2024-07-25 21:18:00,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 300/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 2.192907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:00,583 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43689 samples/s/p 3:51:45 } +2024-07-25 21:18:03,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 302/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.1923484e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:03,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.43530 samples/s/p 3:51:46 } +2024-07-25 21:18:06,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 304/ 1625], loss: 1.182, per_step_time: 1473ms, lr: 2.1917898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:06,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.42859 samples/s/p 3:52:00 } +2024-07-25 21:18:09,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 306/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 2.1912314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:09,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.43224 samples/s/p 3:51:48 } +2024-07-25 21:18:12,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 308/ 1625], loss: 1.331, per_step_time: 1473ms, lr: 2.1906724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:12,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.42928 samples/s/p 3:51:52 } +2024-07-25 21:18:15,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 310/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 2.1901134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:15,347 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.43428 samples/s/p 3:51:36 } +2024-07-25 
21:18:18,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 312/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 2.1895545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:18,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.42772 samples/s/p 3:51:50 } +2024-07-25 21:18:21,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 314/ 1625], loss: 1.071, per_step_time: 1477ms, lr: 2.1889953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:21,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.41630 samples/s/p 3:52:17 } +2024-07-25 21:18:24,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 316/ 1625], loss: 1.104, per_step_time: 1470ms, lr: 2.1884363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:24,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.44078 samples/s/p 3:51:11 } +2024-07-25 21:18:27,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 318/ 1625], loss: 1.022, per_step_time: 1472ms, lr: 2.1878766e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:27,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.43453 samples/s/p 3:51:24 } +2024-07-25 21:18:30,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 320/ 1625], loss: 1.065, per_step_time: 1473ms, lr: 2.1873175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:30,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.43034 samples/s/p 3:51:32 } +2024-07-25 21:18:33,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 322/ 1625], loss: 1.218, 
per_step_time: 1472ms, lr: 2.186758e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:33,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.43120 samples/s/p 3:51:27 } +2024-07-25 21:18:36,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 324/ 1625], loss: 0.832, per_step_time: 1471ms, lr: 2.1861983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:36,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.43509 samples/s/p 3:51:14 } +2024-07-25 21:18:38,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 326/ 1625], loss: 1.284, per_step_time: 1470ms, lr: 2.1856382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:38,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.44062 samples/s/p 3:50:57 } +2024-07-25 21:18:41,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 328/ 1625], loss: 1.301, per_step_time: 1471ms, lr: 2.1850783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:41,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.43667 samples/s/p 3:51:04 } +2024-07-25 21:18:44,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 330/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.1845182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:44,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.43382 samples/s/p 3:51:08 } +2024-07-25 21:18:47,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 332/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 2.183958e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:47,821 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.43532 samples/s/p 3:51:01 } +2024-07-25 21:18:50,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 334/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.1833976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:50,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43604 samples/s/p 3:50:57 } +2024-07-25 21:18:53,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 336/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 2.1828373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:53,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43984 samples/s/p 3:50:44 } +2024-07-25 21:18:56,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 338/ 1625], loss: 1.217, per_step_time: 1470ms, lr: 2.1822767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:56,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43859 samples/s/p 3:50:44 } +2024-07-25 21:18:59,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 340/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 2.1817159e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:59,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43367 samples/s/p 3:50:54 } +2024-07-25 21:19:02,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 342/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 2.1811553e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:02,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43910 samples/s/p 3:50:37 } 
+2024-07-25 21:19:05,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 344/ 1625], loss: 1.367, per_step_time: 1471ms, lr: 2.1805943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:05,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43638 samples/s/p 3:50:41 } +2024-07-25 21:19:08,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 346/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 2.1800332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:08,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43598 samples/s/p 3:50:39 } +2024-07-25 21:19:11,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 348/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 2.1794722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:11,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43865 samples/s/p 3:50:29 } +2024-07-25 21:19:14,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 350/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 2.1789108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:14,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43929 samples/s/p 3:50:25 } +2024-07-25 21:19:17,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 352/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 2.1783495e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:17,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43500 samples/s/p 3:50:33 } +2024-07-25 21:19:20,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 354/ 1625], loss: 
1.221, per_step_time: 1471ms, lr: 2.177788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:20,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43672 samples/s/p 3:50:25 } +2024-07-25 21:19:23,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 356/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 2.1772265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:23,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.44088 samples/s/p 3:50:12 } +2024-07-25 21:19:26,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 358/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 2.1766646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:26,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43556 samples/s/p 3:50:23 } +2024-07-25 21:19:29,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 360/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 2.1761029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:29,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43510 samples/s/p 3:50:21 } +2024-07-25 21:19:32,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 362/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 2.1755408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:32,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43056 samples/s/p 3:50:29 } +2024-07-25 21:19:35,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 364/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 2.1749787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:35,020 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.44046 samples/s/p 3:50:01 } +2024-07-25 21:19:37,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 366/ 1625], loss: 1.285, per_step_time: 1471ms, lr: 2.1744167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:37,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43524 samples/s/p 3:50:12 } +2024-07-25 21:19:40,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 368/ 1625], loss: 1.078, per_step_time: 1470ms, lr: 2.1738544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:40,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.44171 samples/s/p 3:49:52 } +2024-07-25 21:19:43,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 370/ 1625], loss: 1.036, per_step_time: 1471ms, lr: 2.173292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:43,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43588 samples/s/p 3:50:04 } +2024-07-25 21:19:46,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 372/ 1625], loss: 0.984, per_step_time: 1469ms, lr: 2.1727295e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:46,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.44427 samples/s/p 3:49:40 } +2024-07-25 21:19:49,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 374/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.1721668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:49,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43675 samples/s/p 3:49:56 } 
+2024-07-25 21:19:52,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 376/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 2.1716038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:52,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43280 samples/s/p 3:50:03 } +2024-07-25 21:19:55,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 378/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.171041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:55,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43502 samples/s/p 3:49:54 } +2024-07-25 21:19:58,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 380/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.170478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:58,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43754 samples/s/p 3:49:45 } +2024-07-25 21:20:01,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 382/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 2.1699154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:01,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43285 samples/s/p 3:49:54 } +2024-07-25 21:20:04,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 384/ 1625], loss: 1.186, per_step_time: 1469ms, lr: 2.169352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:04,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.44414 samples/s/p 3:49:23 } +2024-07-25 21:20:07,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 386/ 1625], loss: 
1.215, per_step_time: 1474ms, lr: 2.1687883e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:07,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.42442 samples/s/p 3:50:10 } +2024-07-25 21:20:10,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 388/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.1682252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:10,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43663 samples/s/p 3:49:36 } +2024-07-25 21:20:13,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 390/ 1625], loss: 1.114, per_step_time: 1473ms, lr: 2.1676618e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:13,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43009 samples/s/p 3:49:49 } +2024-07-25 21:20:16,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 392/ 1625], loss: 1.020, per_step_time: 1473ms, lr: 2.1670981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:16,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.42989 samples/s/p 3:49:47 } +2024-07-25 21:20:19,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 394/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 2.1665343e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:19,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43111 samples/s/p 3:49:41 } +2024-07-25 21:20:22,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 396/ 1625], loss: 1.211, per_step_time: 1470ms, lr: 2.1659704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:22,235 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43866 samples/s/p 3:49:19 } +2024-07-25 21:20:25,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 398/ 1625], loss: 1.132, per_step_time: 1473ms, lr: 2.1654067e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:25,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43033 samples/s/p 3:49:37 } +2024-07-25 21:20:28,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 400/ 1625], loss: 1.293, per_step_time: 1472ms, lr: 2.1648422e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:28,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.43118 samples/s/p 3:49:32 } +2024-07-25 21:20:31,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 402/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 2.164278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:31,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.43460 samples/s/p 3:49:20 } +2024-07-25 21:20:34,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 404/ 1625], loss: 1.232, per_step_time: 1474ms, lr: 2.1637139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:34,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.42479 samples/s/p 3:49:42 } +2024-07-25 21:20:36,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 406/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 2.1631497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:36,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.44100 samples/s/p 3:48:58 } 
+2024-07-25 21:20:39,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 408/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 2.1625845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:39,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.43166 samples/s/p 3:49:19 } +2024-07-25 21:20:42,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 410/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.1620202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:42,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.43762 samples/s/p 3:49:01 } +2024-07-25 21:20:45,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 412/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 2.1614554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:45,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.44073 samples/s/p 3:48:50 } +2024-07-25 21:20:48,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 414/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.1608905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:48,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.42939 samples/s/p 3:49:16 } +2024-07-25 21:20:51,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 416/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 2.1603255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:51,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43969 samples/s/p 3:48:47 } +2024-07-25 21:20:54,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 418/ 1625], loss: 
1.063, per_step_time: 1471ms, lr: 2.1597603e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:54,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43789 samples/s/p 3:48:48 } +2024-07-25 21:20:57,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 420/ 1625], loss: 1.136, per_step_time: 1473ms, lr: 2.159195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:57,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.42887 samples/s/p 3:49:08 } +2024-07-25 21:21:00,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 422/ 1625], loss: 1.040, per_step_time: 1471ms, lr: 2.1586296e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:00,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43659 samples/s/p 3:48:46 } +2024-07-25 21:21:03,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 424/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.1580643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:03,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43813 samples/s/p 3:48:39 } +2024-07-25 21:21:06,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 426/ 1625], loss: 1.124, per_step_time: 1469ms, lr: 2.1574986e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:06,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.44250 samples/s/p 3:48:25 } +2024-07-25 21:21:09,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 428/ 1625], loss: 1.040, per_step_time: 1470ms, lr: 2.1569329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:09,451 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43883 samples/s/p 3:48:31 } +2024-07-25 21:21:12,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 430/ 1625], loss: 1.228, per_step_time: 1470ms, lr: 2.1563672e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:12,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.44101 samples/s/p 3:48:23 } +2024-07-25 21:21:15,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 432/ 1625], loss: 1.040, per_step_time: 1470ms, lr: 2.1558013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:15,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.44132 samples/s/p 3:48:19 } +2024-07-25 21:21:18,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 434/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 2.1552352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:18,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.43447 samples/s/p 3:48:33 } +2024-07-25 21:21:21,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 436/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 2.1546688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:21,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.43671 samples/s/p 3:48:25 } +2024-07-25 21:21:24,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 438/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 2.1541025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:24,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.42904 samples/s/p 3:48:41 } 
+2024-07-25 21:21:27,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 440/ 1625], loss: 1.314, per_step_time: 1471ms, lr: 2.1535363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:27,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.43586 samples/s/p 3:48:21 } +2024-07-25 21:21:30,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 442/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.1529699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:30,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.43471 samples/s/p 3:48:21 } +2024-07-25 21:21:33,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 444/ 1625], loss: 1.197, per_step_time: 1473ms, lr: 2.1524032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:33,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.42923 samples/s/p 3:48:32 } +2024-07-25 21:21:36,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 446/ 1625], loss: 1.057, per_step_time: 1469ms, lr: 2.1518365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:36,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.44264 samples/s/p 3:47:55 } +2024-07-25 21:21:38,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 448/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 2.1512697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:38,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43524 samples/s/p 3:48:11 } +2024-07-25 21:21:41,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 450/ 1625], loss: 
1.106, per_step_time: 1472ms, lr: 2.1507029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:41,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43182 samples/s/p 3:48:17 } +2024-07-25 21:21:44,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 452/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 2.1501357e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:44,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43284 samples/s/p 3:48:11 } +2024-07-25 21:21:47,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 454/ 1625], loss: 1.194, per_step_time: 1474ms, lr: 2.1495687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:47,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.42494 samples/s/p 3:48:28 } +2024-07-25 21:21:50,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 456/ 1625], loss: 1.305, per_step_time: 1471ms, lr: 2.1490014e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:50,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43566 samples/s/p 3:47:58 } +2024-07-25 21:21:53,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 458/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.148434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:53,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43245 samples/s/p 3:48:03 } +2024-07-25 21:21:56,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 460/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 2.1478665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:56,670 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43786 samples/s/p 3:47:47 } +2024-07-25 21:21:59,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 462/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.147299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:59,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43716 samples/s/p 3:47:45 } +2024-07-25 21:22:02,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 464/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 2.1467313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:02,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43505 samples/s/p 3:47:48 } +2024-07-25 21:22:05,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 466/ 1625], loss: 0.995, per_step_time: 1473ms, lr: 2.1461634e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:05,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.42981 samples/s/p 3:47:58 } +2024-07-25 21:22:08,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 468/ 1625], loss: 1.279, per_step_time: 1471ms, lr: 2.1455955e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:08,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43500 samples/s/p 3:47:42 } +2024-07-25 21:22:11,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 470/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 2.1450276e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:11,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43608 samples/s/p 3:47:36 } 
+2024-07-25 21:22:14,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 472/ 1625], loss: 0.970, per_step_time: 1471ms, lr: 2.1444595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:14,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43565 samples/s/p 3:47:35 } +2024-07-25 21:22:17,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 474/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 2.143891e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:17,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.44197 samples/s/p 3:47:16 } +2024-07-25 21:22:20,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 476/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 2.1433229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:20,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43542 samples/s/p 3:47:29 } +2024-07-25 21:22:23,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 478/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 2.1427542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:23,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43114 samples/s/p 3:47:37 } +2024-07-25 21:22:26,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 480/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.1421858e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:26,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43667 samples/s/p 3:47:20 } +2024-07-25 21:22:29,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 482/ 1625], loss: 
1.258, per_step_time: 1470ms, lr: 2.141617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:29,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43891 samples/s/p 3:47:12 } +2024-07-25 21:22:32,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 484/ 1625], loss: 1.018, per_step_time: 1469ms, lr: 2.1410482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:32,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.44349 samples/s/p 3:46:57 } +2024-07-25 21:22:35,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 486/ 1625], loss: 1.282, per_step_time: 1468ms, lr: 2.1404794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:35,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.44654 samples/s/p 3:46:47 } +2024-07-25 21:22:37,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 488/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 2.1399102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:37,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43697 samples/s/p 3:47:08 } +2024-07-25 21:22:40,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 490/ 1625], loss: 1.232, per_step_time: 1470ms, lr: 2.139341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:40,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.44138 samples/s/p 3:46:54 } +2024-07-25 21:22:43,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 492/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.1387721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:43,868 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43479 samples/s/p 3:47:07 } +2024-07-25 21:22:46,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 494/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 2.1382028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:46,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43313 samples/s/p 3:47:08 } +2024-07-25 21:22:49,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 496/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 2.137633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:49,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43772 samples/s/p 3:46:54 } +2024-07-25 21:22:52,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 498/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.1370637e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:52,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43440 samples/s/p 3:46:59 } +2024-07-25 21:22:55,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 500/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.136494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:55,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43703 samples/s/p 3:46:50 } +2024-07-25 21:22:55,671 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 21:23:31,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 502/ 1625], loss: 1.250, per_step_time: 1473ms, lr: 2.1359243e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:31,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.42826 samples/s/p 3:47:09 } +2024-07-25 21:23:34,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 504/ 1625], loss: 1.230, per_step_time: 1475ms, lr: 2.1353544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:34,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.42081 samples/s/p 3:47:25 } +2024-07-25 21:23:37,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 506/ 1625], loss: 1.050, per_step_time: 1472ms, lr: 2.1347843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:37,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43455 samples/s/p 3:46:47 } +2024-07-25 21:23:40,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 508/ 1625], loss: 1.331, per_step_time: 1473ms, lr: 2.1342143e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:40,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43032 samples/s/p 3:46:55 } +2024-07-25 21:23:43,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 510/ 1625], loss: 1.052, per_step_time: 1471ms, lr: 2.133644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:43,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43533 samples/s/p 3:46:39 } +2024-07-25 21:23:46,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 512/ 1625], loss: 
1.202, per_step_time: 1473ms, lr: 2.1330738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:46,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43067 samples/s/p 3:46:48 } +2024-07-25 21:23:49,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 514/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 2.1325033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:49,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43795 samples/s/p 3:46:27 } +2024-07-25 21:23:52,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 516/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 2.1319329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:52,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43174 samples/s/p 3:46:40 } +2024-07-25 21:23:54,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 518/ 1625], loss: 1.164, per_step_time: 1472ms, lr: 2.1313623e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:54,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43169 samples/s/p 3:46:37 } +2024-07-25 21:23:57,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 520/ 1625], loss: 1.310, per_step_time: 1473ms, lr: 2.1307915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:57,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43060 samples/s/p 3:46:37 } +2024-07-25 21:24:00,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 522/ 1625], loss: 1.320, per_step_time: 1470ms, lr: 2.1302207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:00,889 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43862 samples/s/p 3:46:14 } +2024-07-25 21:24:03,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 524/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 2.1296497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:03,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43655 samples/s/p 3:46:16 } +2024-07-25 21:24:06,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 526/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 2.1290785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:06,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43387 samples/s/p 3:46:19 } +2024-07-25 21:24:09,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 528/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.1285074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:09,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43748 samples/s/p 3:46:08 } +2024-07-25 21:24:12,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 530/ 1625], loss: 1.178, per_step_time: 1469ms, lr: 2.1279362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:12,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.44344 samples/s/p 3:45:50 } +2024-07-25 21:24:15,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 532/ 1625], loss: 1.005, per_step_time: 1470ms, lr: 2.1273649e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:15,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43974 samples/s/p 3:45:56 } 
+2024-07-25 21:24:18,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 534/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 2.1267933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:18,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43508 samples/s/p 3:46:05 } +2024-07-25 21:24:21,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 536/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 2.1262214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:21,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43474 samples/s/p 3:46:03 } +2024-07-25 21:24:24,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 538/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 2.1256501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:24,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43637 samples/s/p 3:45:56 } +2024-07-25 21:24:27,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 540/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 2.125078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:27,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43574 samples/s/p 3:45:54 } +2024-07-25 21:24:30,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 542/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 2.1245063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:30,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43632 samples/s/p 3:45:50 } +2024-07-25 21:24:33,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 544/ 1625], loss: 
1.255, per_step_time: 1472ms, lr: 2.1239342e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:33,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43283 samples/s/p 3:45:56 } +2024-07-25 21:24:36,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 546/ 1625], loss: 1.232, per_step_time: 1470ms, lr: 2.1233622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:36,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.44016 samples/s/p 3:45:34 } +2024-07-25 21:24:39,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 548/ 1625], loss: 1.336, per_step_time: 1472ms, lr: 2.12279e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:39,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43444 samples/s/p 3:45:46 } +2024-07-25 21:24:42,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 550/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 2.1222175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:42,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43891 samples/s/p 3:45:32 } +2024-07-25 21:24:45,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 552/ 1625], loss: 0.972, per_step_time: 1471ms, lr: 2.121645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:45,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43709 samples/s/p 3:45:33 } +2024-07-25 21:24:48,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 554/ 1625], loss: 0.905, per_step_time: 1470ms, lr: 2.1210728e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:48,085 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43939 samples/s/p 3:45:25 } +2024-07-25 21:24:51,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 556/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 2.1204998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:51,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43206 samples/s/p 3:45:40 } +2024-07-25 21:24:53,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 558/ 1625], loss: 1.230, per_step_time: 1470ms, lr: 2.119927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:53,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43991 samples/s/p 3:45:17 } +2024-07-25 21:24:56,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 560/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.1193544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:56,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43419 samples/s/p 3:45:29 } +2024-07-25 21:24:59,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 562/ 1625], loss: 1.079, per_step_time: 1471ms, lr: 2.1187814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:59,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43827 samples/s/p 3:45:16 } +2024-07-25 21:25:02,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 564/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 2.118208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:02,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43863 samples/s/p 3:45:12 } +2024-07-25 
21:25:05,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 566/ 1625], loss: 1.114, per_step_time: 1469ms, lr: 2.1176353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:05,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.44292 samples/s/p 3:44:58 } +2024-07-25 21:25:08,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 568/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 2.117062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:08,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43262 samples/s/p 3:45:21 } +2024-07-25 21:25:11,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 570/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 2.1164886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:11,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43069 samples/s/p 3:45:23 } +2024-07-25 21:25:14,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 572/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 2.1159149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:14,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43275 samples/s/p 3:45:15 } +2024-07-25 21:25:17,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 574/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.1153413e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:17,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43433 samples/s/p 3:45:08 } +2024-07-25 21:25:20,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 576/ 1625], loss: 1.275, 
per_step_time: 1472ms, lr: 2.1147678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:20,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43287 samples/s/p 3:45:08 } +2024-07-25 21:25:23,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 578/ 1625], loss: 0.930, per_step_time: 1469ms, lr: 2.1141937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:23,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.44452 samples/s/p 3:44:37 } +2024-07-25 21:25:26,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 580/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 2.1136198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:26,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.43355 samples/s/p 3:45:01 } +2024-07-25 21:25:29,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 582/ 1625], loss: 1.226, per_step_time: 1474ms, lr: 2.113046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:29,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.42389 samples/s/p 3:45:22 } +2024-07-25 21:25:32,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 584/ 1625], loss: 1.101, per_step_time: 1473ms, lr: 2.1124719e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:32,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.42794 samples/s/p 3:45:09 } +2024-07-25 21:25:35,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 586/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.1118974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:35,305 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.43430 samples/s/p 3:44:50 } +2024-07-25 21:25:38,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 588/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.1113232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:38,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.43822 samples/s/p 3:44:37 } +2024-07-25 21:25:41,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 590/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.110749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:41,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.43131 samples/s/p 3:44:52 } +2024-07-25 21:25:44,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 592/ 1625], loss: 1.174, per_step_time: 1473ms, lr: 2.1101741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:44,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.42879 samples/s/p 3:44:55 } +2024-07-25 21:25:47,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 594/ 1625], loss: 0.993, per_step_time: 1471ms, lr: 2.1095995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:47,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.43565 samples/s/p 3:44:35 } +2024-07-25 21:25:50,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 596/ 1625], loss: 1.296, per_step_time: 1471ms, lr: 2.1090249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:50,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.43575 samples/s/p 3:44:32 } 
+2024-07-25 21:25:53,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 598/ 1625], loss: 1.360, per_step_time: 1470ms, lr: 2.1084501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:53,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.44068 samples/s/p 3:44:17 } +2024-07-25 21:25:55,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 600/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 2.107875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:55,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.44056 samples/s/p 3:44:14 } +2024-07-25 21:25:58,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 602/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.1073e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:58,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.43714 samples/s/p 3:44:20 } +2024-07-25 21:26:01,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 604/ 1625], loss: 1.125, per_step_time: 1473ms, lr: 2.106725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:01,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.42799 samples/s/p 3:44:39 } +2024-07-25 21:26:04,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 606/ 1625], loss: 1.317, per_step_time: 1472ms, lr: 2.1061498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:04,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.43430 samples/s/p 3:44:21 } +2024-07-25 21:26:07,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 608/ 1625], loss: 
1.133, per_step_time: 1471ms, lr: 2.1055741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:07,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.43807 samples/s/p 3:44:08 } +2024-07-25 21:26:10,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 610/ 1625], loss: 1.201, per_step_time: 1470ms, lr: 2.104999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:10,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.44190 samples/s/p 3:43:56 } +2024-07-25 21:26:13,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 612/ 1625], loss: 1.081, per_step_time: 1469ms, lr: 2.1044234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:13,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.44382 samples/s/p 3:43:48 } +2024-07-25 21:26:16,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 614/ 1625], loss: 1.191, per_step_time: 1470ms, lr: 2.1038477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:16,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43978 samples/s/p 3:43:55 } +2024-07-25 21:26:19,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 616/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 2.1032718e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:19,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43616 samples/s/p 3:44:01 } +2024-07-25 21:26:22,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 618/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.1026959e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:22,517 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43234 samples/s/p 3:44:08 } +2024-07-25 21:26:25,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 620/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.1021202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:25,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43472 samples/s/p 3:43:59 } +2024-07-25 21:26:28,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 622/ 1625], loss: 1.302, per_step_time: 1471ms, lr: 2.101544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:28,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43590 samples/s/p 3:43:53 } +2024-07-25 21:26:31,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 624/ 1625], loss: 1.141, per_step_time: 1475ms, lr: 2.1009677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:31,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.42355 samples/s/p 3:44:21 } +2024-07-25 21:26:34,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 626/ 1625], loss: 1.191, per_step_time: 1474ms, lr: 2.1003914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:34,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.42411 samples/s/p 3:44:16 } +2024-07-25 21:26:37,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 628/ 1625], loss: 1.325, per_step_time: 1484ms, lr: 2.0998152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:37,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.38998 samples/s/p 3:45:39 } 
+2024-07-25 21:26:40,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 630/ 1625], loss: 0.967, per_step_time: 1469ms, lr: 2.0992386e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:40,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.44256 samples/s/p 3:43:25 } +2024-07-25 21:26:43,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 632/ 1625], loss: 1.023, per_step_time: 1470ms, lr: 2.0986621e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:43,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.44027 samples/s/p 3:43:28 } +2024-07-25 21:26:46,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 634/ 1625], loss: 1.285, per_step_time: 1477ms, lr: 2.0980855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:46,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.41428 samples/s/p 3:44:29 } +2024-07-25 21:26:49,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 636/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.0975087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:49,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.43711 samples/s/p 3:43:30 } +2024-07-25 21:26:52,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 638/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 2.0969317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:52,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.43596 samples/s/p 3:43:29 } +2024-07-25 21:26:55,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 640/ 1625], loss: 
1.043, per_step_time: 1471ms, lr: 2.0963547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:55,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.43691 samples/s/p 3:43:24 } +2024-07-25 21:26:57,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 642/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 2.0957777e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:57,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.43315 samples/s/p 3:43:30 } +2024-07-25 21:27:00,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 644/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.0952004e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:00,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.43128 samples/s/p 3:43:32 } +2024-07-25 21:27:03,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 646/ 1625], loss: 0.978, per_step_time: 1472ms, lr: 2.094623e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:03,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.43362 samples/s/p 3:43:23 } +2024-07-25 21:27:06,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 648/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.0940459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:06,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.43755 samples/s/p 3:43:11 } +2024-07-25 21:27:09,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 650/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 2.0934684e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:09,777 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.43025 samples/s/p 3:43:26 } +2024-07-25 21:27:12,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 652/ 1625], loss: 0.972, per_step_time: 1473ms, lr: 2.0928905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:12,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.43071 samples/s/p 3:43:22 } +2024-07-25 21:27:15,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 654/ 1625], loss: 1.386, per_step_time: 1470ms, lr: 2.0923131e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:15,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.43889 samples/s/p 3:42:59 } +2024-07-25 21:27:18,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 656/ 1625], loss: 0.980, per_step_time: 1473ms, lr: 2.0917352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:18,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.43076 samples/s/p 3:43:16 } +2024-07-25 21:27:21,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 658/ 1625], loss: 1.278, per_step_time: 1473ms, lr: 2.0911573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:21,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.42742 samples/s/p 3:43:21 } +2024-07-25 21:27:24,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 660/ 1625], loss: 1.027, per_step_time: 1482ms, lr: 2.0905793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:24,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.39514 samples/s/p 3:44:38 } 
+2024-07-25 21:27:27,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 662/ 1625], loss: 1.356, per_step_time: 1473ms, lr: 2.0900014e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:27,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.42928 samples/s/p 3:43:11 } +2024-07-25 21:27:30,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 664/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 2.0894231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:30,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43880 samples/s/p 3:42:44 } +2024-07-25 21:27:33,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 666/ 1625], loss: 1.173, per_step_time: 1470ms, lr: 2.0888447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:33,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43906 samples/s/p 3:42:41 } +2024-07-25 21:27:36,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 668/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.0882664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:36,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43417 samples/s/p 3:42:50 } +2024-07-25 21:27:39,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 670/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 2.087688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:39,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43380 samples/s/p 3:42:48 } +2024-07-25 21:27:42,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 672/ 1625], 
loss: 1.095, per_step_time: 1470ms, lr: 2.0871095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:42,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43890 samples/s/p 3:42:32 } +2024-07-25 21:27:45,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 674/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 2.0865305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:45,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43045 samples/s/p 3:42:50 } +2024-07-25 21:27:48,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 676/ 1625], loss: 0.871, per_step_time: 1470ms, lr: 2.085952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:48,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43891 samples/s/p 3:42:26 } +2024-07-25 21:27:51,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 678/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 2.085373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:51,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43751 samples/s/p 3:42:27 } +2024-07-25 21:27:54,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 680/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 2.0847941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:54,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43381 samples/s/p 3:42:33 } +2024-07-25 21:27:57,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 682/ 1625], loss: 1.056, per_step_time: 1473ms, lr: 2.084215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:57,024 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.42862 samples/s/p 3:42:43 } +2024-07-25 21:27:59,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 684/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 2.0836358e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:59,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43607 samples/s/p 3:42:21 } +2024-07-25 21:28:02,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 686/ 1625], loss: 1.146, per_step_time: 1470ms, lr: 2.0830565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:02,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.44169 samples/s/p 3:42:05 } +2024-07-25 21:28:05,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 688/ 1625], loss: 1.201, per_step_time: 1471ms, lr: 2.0824771e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:05,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43594 samples/s/p 3:42:16 } +2024-07-25 21:28:08,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 690/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 2.0818976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:08,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43731 samples/s/p 3:42:10 } +2024-07-25 21:28:11,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 692/ 1625], loss: 1.278, per_step_time: 1470ms, lr: 2.081318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:11,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43984 samples/s/p 3:42:00 } 
+2024-07-25 21:28:14,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 694/ 1625], loss: 1.112, per_step_time: 1470ms, lr: 2.0807383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:14,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.44105 samples/s/p 3:41:55 } +2024-07-25 21:28:17,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 696/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 2.0801584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:17,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43688 samples/s/p 3:42:02 } +2024-07-25 21:28:20,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 698/ 1625], loss: 1.093, per_step_time: 1474ms, lr: 2.0795787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:20,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.42700 samples/s/p 3:42:23 } +2024-07-25 21:28:23,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 700/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 2.0789988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:23,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43326 samples/s/p 3:42:05 } +2024-07-25 21:28:26,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 702/ 1625], loss: 0.915, per_step_time: 1472ms, lr: 2.0784188e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:26,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43371 samples/s/p 3:42:01 } +2024-07-25 21:28:29,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 704/ 1625], 
loss: 1.225, per_step_time: 1472ms, lr: 2.0778387e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:29,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43201 samples/s/p 3:42:02 } +2024-07-25 21:28:32,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 706/ 1625], loss: 1.000, per_step_time: 1470ms, lr: 2.0772584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:32,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43911 samples/s/p 3:41:42 } +2024-07-25 21:28:35,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 708/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 2.076678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:35,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43722 samples/s/p 3:41:43 } +2024-07-25 21:28:38,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 710/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.0760977e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:38,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43364 samples/s/p 3:41:49 } +2024-07-25 21:28:41,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 712/ 1625], loss: 1.262, per_step_time: 1473ms, lr: 2.075517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:41,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43002 samples/s/p 3:41:55 } +2024-07-25 21:28:44,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 714/ 1625], loss: 1.122, per_step_time: 1473ms, lr: 2.0749363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:44,237 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.42917 samples/s/p 3:41:54 } +2024-07-25 21:28:47,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 716/ 1625], loss: 1.010, per_step_time: 1472ms, lr: 2.0743557e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:47,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43187 samples/s/p 3:41:45 } +2024-07-25 21:28:50,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 718/ 1625], loss: 1.174, per_step_time: 1474ms, lr: 2.0737749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:50,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.42411 samples/s/p 3:42:01 } +2024-07-25 21:28:53,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 720/ 1625], loss: 1.335, per_step_time: 1472ms, lr: 2.0731939e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:53,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43436 samples/s/p 3:41:33 } +2024-07-25 21:28:56,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 722/ 1625], loss: 0.934, per_step_time: 1471ms, lr: 2.0726127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:56,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43663 samples/s/p 3:41:24 } +2024-07-25 21:28:58,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 724/ 1625], loss: 1.010, per_step_time: 1471ms, lr: 2.0720316e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:58,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43618 samples/s/p 3:41:22 } 
+2024-07-25 21:29:01,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 726/ 1625], loss: 1.059, per_step_time: 1471ms, lr: 2.0714504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:01,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43697 samples/s/p 3:41:17 } +2024-07-25 21:29:04,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 728/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 2.070869e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:04,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43334 samples/s/p 3:41:23 } +2024-07-25 21:29:07,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 730/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.0702877e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:07,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43181 samples/s/p 3:41:24 } +2024-07-25 21:29:10,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 732/ 1625], loss: 1.021, per_step_time: 1471ms, lr: 2.0697064e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:10,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43557 samples/s/p 3:41:12 } +2024-07-25 21:29:13,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 734/ 1625], loss: 1.251, per_step_time: 1470ms, lr: 2.0691246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:13,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.44062 samples/s/p 3:40:57 } +2024-07-25 21:29:16,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 736/ 1625], 
loss: 1.297, per_step_time: 1473ms, lr: 2.0685427e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:16,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.42870 samples/s/p 3:41:23 } +2024-07-25 21:29:19,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 738/ 1625], loss: 1.010, per_step_time: 1471ms, lr: 2.067961e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:19,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43768 samples/s/p 3:40:58 } +2024-07-25 21:29:22,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 740/ 1625], loss: 0.985, per_step_time: 1471ms, lr: 2.0673793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:22,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43653 samples/s/p 3:40:58 } +2024-07-25 21:29:25,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 742/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 2.066797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:25,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43285 samples/s/p 3:41:04 } +2024-07-25 21:29:28,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 744/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.0662152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:28,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43187 samples/s/p 3:41:03 } +2024-07-25 21:29:31,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 746/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.0656329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:31,462 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43761 samples/s/p 3:40:47 } +2024-07-25 21:29:34,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 748/ 1625], loss: 1.234, per_step_time: 1473ms, lr: 2.0650506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:34,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43065 samples/s/p 3:41:01 } +2024-07-25 21:29:37,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 750/ 1625], loss: 1.084, per_step_time: 1470ms, lr: 2.0644682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:37,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43977 samples/s/p 3:40:35 } +2024-07-25 21:29:40,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 752/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.0638858e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:40,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43239 samples/s/p 3:40:50 } +2024-07-25 21:29:43,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 754/ 1625], loss: 1.248, per_step_time: 1473ms, lr: 2.0633033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:43,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43076 samples/s/p 3:40:51 } +2024-07-25 21:29:46,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 756/ 1625], loss: 1.096, per_step_time: 1470ms, lr: 2.0627205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:46,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43866 samples/s/p 3:40:29 } 
+2024-07-25 21:29:49,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 758/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 2.0621379e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:49,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43649 samples/s/p 3:40:32 } +2024-07-25 21:29:52,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 760/ 1625], loss: 1.150, per_step_time: 1469ms, lr: 2.061555e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:52,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.44249 samples/s/p 3:40:14 } +2024-07-25 21:29:55,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 762/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 2.0609721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:55,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43770 samples/s/p 3:40:23 } +2024-07-25 21:29:58,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 764/ 1625], loss: 1.228, per_step_time: 1470ms, lr: 2.060389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:58,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43991 samples/s/p 3:40:14 } +2024-07-25 21:30:00,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 766/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 2.0598058e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:00,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43503 samples/s/p 3:40:23 } +2024-07-25 21:30:03,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 768/ 1625], 
loss: 1.248, per_step_time: 1470ms, lr: 2.0592226e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:03,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.44046 samples/s/p 3:40:07 } +2024-07-25 21:30:06,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 770/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 2.0586393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:06,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.44159 samples/s/p 3:40:02 } +2024-07-25 21:30:09,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 772/ 1625], loss: 1.294, per_step_time: 1473ms, lr: 2.0580559e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:09,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43026 samples/s/p 3:40:26 } +2024-07-25 21:30:12,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 774/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 2.0574724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:12,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43172 samples/s/p 3:40:20 } +2024-07-25 21:30:15,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 776/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 2.056889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:15,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43274 samples/s/p 3:40:14 } +2024-07-25 21:30:18,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 778/ 1625], loss: 1.016, per_step_time: 1471ms, lr: 2.0563051e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:18,669 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43595 samples/s/p 3:40:03 } +2024-07-25 21:30:21,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 780/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.0557212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:21,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43767 samples/s/p 3:39:56 } +2024-07-25 21:30:24,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 782/ 1625], loss: 1.120, per_step_time: 1470ms, lr: 2.0551375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:24,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.44176 samples/s/p 3:39:43 } +2024-07-25 21:30:27,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 784/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.0545536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:27,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43373 samples/s/p 3:40:00 } +2024-07-25 21:30:30,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 786/ 1625], loss: 0.979, per_step_time: 1470ms, lr: 2.0539694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:30,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.44009 samples/s/p 3:39:42 } +2024-07-25 21:30:33,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 788/ 1625], loss: 1.204, per_step_time: 1470ms, lr: 2.0533853e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:33,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.44039 samples/s/p 3:39:38 } 
+2024-07-25 21:30:36,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 790/ 1625], loss: 1.162, per_step_time: 1470ms, lr: 2.052801e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:36,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43870 samples/s/p 3:39:39 } +2024-07-25 21:30:39,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 792/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 2.0522168e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:39,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43720 samples/s/p 3:39:40 } +2024-07-25 21:30:42,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 794/ 1625], loss: 1.101, per_step_time: 1473ms, lr: 2.0516321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:42,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43079 samples/s/p 3:39:52 } +2024-07-25 21:30:45,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 796/ 1625], loss: 1.198, per_step_time: 1470ms, lr: 2.0510477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:45,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43925 samples/s/p 3:39:29 } +2024-07-25 21:30:48,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 798/ 1625], loss: 1.084, per_step_time: 1472ms, lr: 2.0504633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:48,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43406 samples/s/p 3:39:39 } +2024-07-25 21:30:51,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 800/ 1625], 
loss: 1.069, per_step_time: 1470ms, lr: 2.0498783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:51,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43909 samples/s/p 3:39:23 } +2024-07-25 21:30:54,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 802/ 1625], loss: 1.080, per_step_time: 1473ms, lr: 2.0492935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:54,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.42993 samples/s/p 3:39:43 } +2024-07-25 21:30:57,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 804/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 2.0487088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:57,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43322 samples/s/p 3:39:32 } +2024-07-25 21:30:59,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 806/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 2.0481237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:59,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43809 samples/s/p 3:39:17 } +2024-07-25 21:31:02,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 808/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 2.0475385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:02,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43451 samples/s/p 3:39:23 } +2024-07-25 21:31:05,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 810/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 2.0469535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:05,875 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43009 samples/s/p 3:39:31 } +2024-07-25 21:31:08,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 812/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.0463682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:08,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43157 samples/s/p 3:39:24 } +2024-07-25 21:31:11,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 814/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.0457828e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:11,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43614 samples/s/p 3:39:10 } +2024-07-25 21:31:14,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 816/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 2.0451973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:14,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43410 samples/s/p 3:39:12 } +2024-07-25 21:31:17,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 818/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 2.044612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:17,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43366 samples/s/p 3:39:10 } +2024-07-25 21:31:20,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 820/ 1625], loss: 1.078, per_step_time: 1470ms, lr: 2.0440262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:20,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43861 samples/s/p 3:38:55 } 
+2024-07-25 21:31:23,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 822/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.0434405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:23,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43275 samples/s/p 3:39:06 } +2024-07-25 21:31:26,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 824/ 1625], loss: 1.036, per_step_time: 1476ms, lr: 2.0428546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:26,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.41903 samples/s/p 3:39:37 } +2024-07-25 21:31:29,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 826/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.0422689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:29,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43294 samples/s/p 3:39:00 } +2024-07-25 21:31:32,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 828/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.0416826e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:32,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43312 samples/s/p 3:38:57 } +2024-07-25 21:31:35,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 830/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 2.0410966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:35,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43603 samples/s/p 3:38:47 } +2024-07-25 21:31:38,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 832/ 1625], 
loss: 1.395, per_step_time: 1473ms, lr: 2.0405107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:38,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43019 samples/s/p 3:38:58 } +2024-07-25 21:31:41,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 834/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 2.0399242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:41,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.44013 samples/s/p 3:38:31 } +2024-07-25 21:31:44,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 836/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 2.039338e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:44,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43652 samples/s/p 3:38:37 } +2024-07-25 21:31:47,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 838/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 2.0387515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:47,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.42821 samples/s/p 3:38:54 } +2024-07-25 21:31:50,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 840/ 1625], loss: 0.995, per_step_time: 1473ms, lr: 2.0381647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:50,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.43037 samples/s/p 3:38:46 } +2024-07-25 21:31:53,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 842/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 2.037578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:53,104 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.44123 samples/s/p 3:38:17 } +2024-07-25 21:31:56,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 844/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 2.0369915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:56,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.43384 samples/s/p 3:38:31 } +2024-07-25 21:31:59,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 846/ 1625], loss: 1.166, per_step_time: 1469ms, lr: 2.0364047e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:59,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.44277 samples/s/p 3:38:07 } +2024-07-25 21:32:01,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 848/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 2.035818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:01,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.43207 samples/s/p 3:38:30 } +2024-07-25 21:32:04,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 850/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.0352309e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:04,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.43521 samples/s/p 3:38:19 } +2024-07-25 21:32:07,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 852/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.0346435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:07,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.43380 samples/s/p 3:38:20 } 
+2024-07-25 21:32:10,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 854/ 1625], loss: 0.939, per_step_time: 1471ms, lr: 2.0340565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:10,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43629 samples/s/p 3:38:11 } +2024-07-25 21:32:13,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 856/ 1625], loss: 1.208, per_step_time: 1470ms, lr: 2.0334694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:13,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43923 samples/s/p 3:38:01 } +2024-07-25 21:32:16,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 858/ 1625], loss: 1.230, per_step_time: 1470ms, lr: 2.032882e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:16,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43872 samples/s/p 3:37:59 } +2024-07-25 21:32:19,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 860/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 2.0322945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:19,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43257 samples/s/p 3:38:11 } +2024-07-25 21:32:22,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 862/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 2.031707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:22,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43319 samples/s/p 3:38:06 } +2024-07-25 21:32:25,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 864/ 1625], 
loss: 1.254, per_step_time: 1470ms, lr: 2.0311192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:25,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43864 samples/s/p 3:37:50 } +2024-07-25 21:32:28,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 866/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 2.0305315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:28,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43272 samples/s/p 3:38:02 } +2024-07-25 21:32:31,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 868/ 1625], loss: 1.173, per_step_time: 1473ms, lr: 2.0299438e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:31,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43082 samples/s/p 3:38:03 } +2024-07-25 21:32:34,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 870/ 1625], loss: 1.496, per_step_time: 1473ms, lr: 2.0293563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:34,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43081 samples/s/p 3:38:00 } +2024-07-25 21:32:37,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 872/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 2.0287682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:37,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43845 samples/s/p 3:37:39 } +2024-07-25 21:32:40,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 874/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.0281801e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:40,323 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.42875 samples/s/p 3:37:59 } +2024-07-25 21:32:43,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 876/ 1625], loss: 1.132, per_step_time: 1469ms, lr: 2.0275918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:43,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.44543 samples/s/p 3:37:16 } +2024-07-25 21:32:46,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 878/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 2.0270036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:46,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43479 samples/s/p 3:37:39 } +2024-07-25 21:32:49,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 880/ 1625], loss: 1.156, per_step_time: 1470ms, lr: 2.0264153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:49,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43927 samples/s/p 3:37:25 } +2024-07-25 21:32:52,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 882/ 1625], loss: 1.227, per_step_time: 1470ms, lr: 2.0258269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:52,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.44151 samples/s/p 3:37:17 } +2024-07-25 21:32:55,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 884/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 2.0252384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:55,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43795 samples/s/p 3:37:23 } 
+2024-07-25 21:32:58,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 886/ 1625], loss: 1.130, per_step_time: 1474ms, lr: 2.0246498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:58,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.42685 samples/s/p 3:37:46 } +2024-07-25 21:33:00,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 888/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 2.0240614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:00,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43456 samples/s/p 3:37:25 } +2024-07-25 21:33:03,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 890/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.0234722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:03,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43131 samples/s/p 3:37:30 } +2024-07-25 21:33:06,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 892/ 1625], loss: 1.001, per_step_time: 1471ms, lr: 2.0228836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:06,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43565 samples/s/p 3:37:16 } +2024-07-25 21:33:09,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 894/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.0222948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:09,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43696 samples/s/p 3:37:10 } +2024-07-25 21:33:12,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 896/ 1625], 
loss: 1.188, per_step_time: 1471ms, lr: 2.0217056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:12,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43599 samples/s/p 3:37:10 } +2024-07-25 21:33:15,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 898/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 2.0211166e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:15,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43820 samples/s/p 3:37:01 } +2024-07-25 21:33:18,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 900/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 2.0205272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:18,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43666 samples/s/p 3:37:02 } +2024-07-25 21:33:21,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 902/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 2.019938e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:21,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43536 samples/s/p 3:37:02 } +2024-07-25 21:33:24,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 904/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 2.0193487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:24,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43497 samples/s/p 3:37:00 } +2024-07-25 21:33:27,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 906/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.0187592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:27,527 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43502 samples/s/p 3:36:57 } +2024-07-25 21:33:30,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 908/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 2.0181697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:30,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.42756 samples/s/p 3:37:12 } +2024-07-25 21:33:33,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 910/ 1625], loss: 1.297, per_step_time: 1470ms, lr: 2.0175801e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:33,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43849 samples/s/p 3:36:43 } +2024-07-25 21:33:36,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 912/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 2.0169902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:36,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43589 samples/s/p 3:36:46 } +2024-07-25 21:33:39,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 914/ 1625], loss: 1.225, per_step_time: 1470ms, lr: 2.0164005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:39,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43897 samples/s/p 3:36:36 } +2024-07-25 21:33:42,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 916/ 1625], loss: 1.342, per_step_time: 1472ms, lr: 2.0158106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:42,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43416 samples/s/p 3:36:45 } 
+2024-07-25 21:33:45,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 918/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.0152207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:45,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43345 samples/s/p 3:36:43 } +2024-07-25 21:33:48,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 920/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 2.0146306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:48,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43929 samples/s/p 3:36:26 } +2024-07-25 21:33:51,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 922/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.0140405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:51,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43485 samples/s/p 3:36:34 } +2024-07-25 21:33:54,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 924/ 1625], loss: 1.096, per_step_time: 1473ms, lr: 2.0134501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:54,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43026 samples/s/p 3:36:42 } +2024-07-25 21:33:57,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 926/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.0128598e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:57,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43184 samples/s/p 3:36:35 } +2024-07-25 21:33:59,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 928/ 1625], 
loss: 1.233, per_step_time: 1472ms, lr: 2.0122696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:59,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43322 samples/s/p 3:36:29 } +2024-07-25 21:34:02,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 930/ 1625], loss: 1.146, per_step_time: 1474ms, lr: 2.011679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:02,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.42534 samples/s/p 3:36:45 } +2024-07-25 21:34:05,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 932/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 2.0110887e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:05,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43755 samples/s/p 3:36:13 } +2024-07-25 21:34:08,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 934/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.0104979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:08,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43395 samples/s/p 3:36:19 } +2024-07-25 21:34:11,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 936/ 1625], loss: 1.020, per_step_time: 1472ms, lr: 2.009907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:11,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43465 samples/s/p 3:36:14 } +2024-07-25 21:34:14,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 938/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.0093163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:14,752 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43667 samples/s/p 3:36:06 } +2024-07-25 21:34:17,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 940/ 1625], loss: 1.311, per_step_time: 1471ms, lr: 2.0087255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:17,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43763 samples/s/p 3:36:01 } +2024-07-25 21:34:20,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 942/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 2.0081343e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:20,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43343 samples/s/p 3:36:08 } +2024-07-25 21:34:23,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 944/ 1625], loss: 1.009, per_step_time: 1471ms, lr: 2.0075433e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:23,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43583 samples/s/p 3:35:59 } +2024-07-25 21:34:26,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 946/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 2.0069521e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:26,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43572 samples/s/p 3:35:57 } +2024-07-25 21:34:29,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 948/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 2.0063608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:29,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43317 samples/s/p 3:36:00 } 
+2024-07-25 21:34:32,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 950/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 2.0057694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:32,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43534 samples/s/p 3:35:52 } +2024-07-25 21:34:35,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 952/ 1625], loss: 1.193, per_step_time: 1473ms, lr: 2.005178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:35,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43010 samples/s/p 3:36:01 } +2024-07-25 21:34:38,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 954/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 2.0045867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:38,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43549 samples/s/p 3:35:46 } +2024-07-25 21:34:41,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 956/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 2.003995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:41,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.42958 samples/s/p 3:35:57 } +2024-07-25 21:34:44,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 958/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 2.0034033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:44,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43598 samples/s/p 3:35:38 } +2024-07-25 21:34:47,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 960/ 1625], 
loss: 1.185, per_step_time: 1469ms, lr: 2.0028117e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:47,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.44320 samples/s/p 3:35:18 } +2024-07-25 21:34:50,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 962/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 2.0022198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:50,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43790 samples/s/p 3:35:28 } +2024-07-25 21:34:53,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 964/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 2.0016278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:53,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43546 samples/s/p 3:35:31 } +2024-07-25 21:34:56,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 966/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.0010359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:56,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43182 samples/s/p 3:35:37 } +2024-07-25 21:34:59,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 968/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.0004436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:59,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.43659 samples/s/p 3:35:22 } +2024-07-25 21:35:01,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 970/ 1625], loss: 1.516, per_step_time: 1472ms, lr: 1.9998517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:01,968 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.43144 samples/s/p 3:35:32 } +2024-07-25 21:35:04,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 972/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 1.9992593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:04,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.43147 samples/s/p 3:35:29 } +2024-07-25 21:35:07,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 974/ 1625], loss: 1.106, per_step_time: 1473ms, lr: 1.998667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:07,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.43101 samples/s/p 3:35:27 } +2024-07-25 21:35:10,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 976/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 1.9980747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:10,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.43812 samples/s/p 3:35:07 } +2024-07-25 21:35:13,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 978/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 1.997482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:13,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.43591 samples/s/p 3:35:09 } +2024-07-25 21:35:16,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 980/ 1625], loss: 1.328, per_step_time: 1473ms, lr: 1.9968895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:16,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.42962 samples/s/p 3:35:21 } 
+2024-07-25 21:35:19,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 982/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 1.9962969e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:19,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.43599 samples/s/p 3:35:03 } +2024-07-25 21:35:22,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 984/ 1625], loss: 1.296, per_step_time: 1472ms, lr: 1.9957042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:22,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43319 samples/s/p 3:35:07 } +2024-07-25 21:35:25,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 986/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 1.995111e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:25,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43056 samples/s/p 3:35:10 } +2024-07-25 21:35:28,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 988/ 1625], loss: 1.168, per_step_time: 1475ms, lr: 1.9945184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:28,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.42292 samples/s/p 3:35:25 } +2024-07-25 21:35:31,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 990/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 1.9939254e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:31,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.42768 samples/s/p 3:35:11 } +2024-07-25 21:35:34,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 992/ 
1625], loss: 1.309, per_step_time: 1472ms, lr: 1.9933323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:34,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43278 samples/s/p 3:34:56 } +2024-07-25 21:35:37,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 994/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.992739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:37,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43327 samples/s/p 3:34:52 } +2024-07-25 21:35:40,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 996/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 1.992146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:40,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43917 samples/s/p 3:34:35 } +2024-07-25 21:35:43,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 998/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.9915527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:43,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43724 samples/s/p 3:34:37 } +2024-07-25 21:35:46,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1000/ 1625], loss: 1.265, per_step_time: 1470ms, lr: 1.9909592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:46,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.44179 samples/s/p 3:34:23 } +2024-07-25 21:35:49,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1002/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 1.9903657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:49,196 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.44070 samples/s/p 3:34:23 } +2024-07-25 21:35:52,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1004/ 1625], loss: 1.021, per_step_time: 1471ms, lr: 1.9897721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:52,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43501 samples/s/p 3:34:33 } +2024-07-25 21:35:55,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1006/ 1625], loss: 1.312, per_step_time: 1470ms, lr: 1.9891784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:55,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.44037 samples/s/p 3:34:17 } +2024-07-25 21:35:58,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1008/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.9885845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:58,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43378 samples/s/p 3:34:30 } +2024-07-25 21:36:00,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1010/ 1625], loss: 1.281, per_step_time: 1470ms, lr: 1.987991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:00,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43858 samples/s/p 3:34:16 } +2024-07-25 21:36:03,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1012/ 1625], loss: 1.063, per_step_time: 1472ms, lr: 1.987397e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:03,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43327 samples/s/p 
3:34:25 } +2024-07-25 21:36:06,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1014/ 1625], loss: 1.076, per_step_time: 1472ms, lr: 1.9868032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:06,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43308 samples/s/p 3:34:23 } +2024-07-25 21:36:09,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1016/ 1625], loss: 1.047, per_step_time: 1474ms, lr: 1.986209e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:09,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.42667 samples/s/p 3:34:35 } +2024-07-25 21:36:12,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1018/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 1.9856148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:12,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43323 samples/s/p 3:34:17 } +2024-07-25 21:36:15,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1020/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 1.9850208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:15,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43249 samples/s/p 3:34:15 } +2024-07-25 21:36:18,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1022/ 1625], loss: 1.033, per_step_time: 1473ms, lr: 1.9844263e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:18,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.42985 samples/s/p 3:34:19 } +2024-07-25 21:36:21,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], 
step:[ 1024/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 1.9838319e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:21,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43276 samples/s/p 3:34:09 } +2024-07-25 21:36:24,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1026/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 1.9832376e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:24,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43622 samples/s/p 3:33:58 } +2024-07-25 21:36:27,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1028/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.982643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:27,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43414 samples/s/p 3:34:00 } +2024-07-25 21:36:30,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1030/ 1625], loss: 1.205, per_step_time: 1473ms, lr: 1.9820483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:30,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43079 samples/s/p 3:34:05 } +2024-07-25 21:36:33,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1032/ 1625], loss: 1.327, per_step_time: 1472ms, lr: 1.9814537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:33,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43316 samples/s/p 3:33:56 } +2024-07-25 21:36:36,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1034/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.980859e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:36:36,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43714 samples/s/p 3:33:44 } +2024-07-25 21:36:39,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1036/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 1.9802641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:39,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43370 samples/s/p 3:33:49 } +2024-07-25 21:36:42,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1038/ 1625], loss: 1.288, per_step_time: 1470ms, lr: 1.9796691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:42,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43948 samples/s/p 3:33:32 } +2024-07-25 21:36:45,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1040/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 1.9790741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:45,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43181 samples/s/p 3:33:48 } +2024-07-25 21:36:48,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1042/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 1.978479e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:48,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43807 samples/s/p 3:33:30 } +2024-07-25 21:36:51,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1044/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 1.977884e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:51,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ 
| 5.44109 samples/s/p 3:33:20 } +2024-07-25 21:36:54,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1046/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 1.9772886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:54,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43355 samples/s/p 3:33:35 } +2024-07-25 21:36:57,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1048/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 1.9766934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:57,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43900 samples/s/p 3:33:19 } +2024-07-25 21:37:00,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1050/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 1.9760979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:00,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43709 samples/s/p 3:33:20 } +2024-07-25 21:37:02,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1052/ 1625], loss: 1.098, per_step_time: 1473ms, lr: 1.9755025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:02,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43040 samples/s/p 3:33:33 } +2024-07-25 21:37:05,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1054/ 1625], loss: 1.008, per_step_time: 1471ms, lr: 1.974907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:05,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43669 samples/s/p 3:33:16 } +2024-07-25 21:37:08,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 5/ 10], step:[ 1056/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.9743113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:08,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43297 samples/s/p 3:33:21 } +2024-07-25 21:37:11,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1058/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.9737156e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:11,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43246 samples/s/p 3:33:20 } +2024-07-25 21:37:14,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1060/ 1625], loss: 1.250, per_step_time: 1480ms, lr: 1.9731197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:14,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.40183 samples/s/p 3:34:29 } +2024-07-25 21:37:17,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1062/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 1.972524e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:17,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43414 samples/s/p 3:33:10 } +2024-07-25 21:37:20,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1064/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 1.9719278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:20,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.42892 samples/s/p 3:33:19 } +2024-07-25 21:37:23,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1066/ 1625], loss: 1.407, per_step_time: 1471ms, lr: 1.971332e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:37:23,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43669 samples/s/p 3:32:58 } +2024-07-25 21:37:26,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1068/ 1625], loss: 0.973, per_step_time: 1472ms, lr: 1.9707357e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:26,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43321 samples/s/p 3:33:03 } +2024-07-25 21:37:29,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1070/ 1625], loss: 1.111, per_step_time: 1473ms, lr: 1.9701396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:29,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.42834 samples/s/p 3:33:12 } +2024-07-25 21:37:32,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1072/ 1625], loss: 1.250, per_step_time: 1470ms, lr: 1.9695433e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:32,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.44015 samples/s/p 3:32:41 } +2024-07-25 21:37:35,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1074/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 1.968947e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:35,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43719 samples/s/p 3:32:45 } +2024-07-25 21:37:38,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1076/ 1625], loss: 1.285, per_step_time: 1471ms, lr: 1.9683506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:38,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% 
|███████████████████████ | 5.43480 samples/s/p 3:32:48 } +2024-07-25 21:37:41,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1078/ 1625], loss: 1.221, per_step_time: 1473ms, lr: 1.967754e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:41,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43038 samples/s/p 3:32:55 } +2024-07-25 21:37:44,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1080/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 1.9671574e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:44,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43827 samples/s/p 3:32:34 } +2024-07-25 21:37:47,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1082/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.966561e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:47,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43820 samples/s/p 3:32:31 } +2024-07-25 21:37:50,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1084/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 1.9659641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:50,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43261 samples/s/p 3:32:41 } +2024-07-25 21:37:53,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1086/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 1.9653671e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:53,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43556 samples/s/p 3:32:31 } +2024-07-25 21:37:56,119 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1088/ 1625], loss: 0.941, per_step_time: 1471ms, lr: 1.9647705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:56,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43524 samples/s/p 3:32:29 } +2024-07-25 21:37:59,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1090/ 1625], loss: 1.373, per_step_time: 1472ms, lr: 1.9641735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:59,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43358 samples/s/p 3:32:30 } +2024-07-25 21:38:02,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1092/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 1.9635765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:02,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43905 samples/s/p 3:32:14 } +2024-07-25 21:38:04,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1094/ 1625], loss: 0.972, per_step_time: 1471ms, lr: 1.9629793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:04,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43833 samples/s/p 3:32:13 } +2024-07-25 21:38:07,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1096/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 1.9623822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:07,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43450 samples/s/p 3:32:19 } +2024-07-25 21:38:10,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1098/ 1625], loss: 1.292, 
per_step_time: 1472ms, lr: 1.961785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:10,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43408 samples/s/p 3:32:17 } +2024-07-25 21:38:13,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1100/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 1.9611876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:13,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43104 samples/s/p 3:32:21 } +2024-07-25 21:38:16,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1102/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 1.9605903e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:16,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43491 samples/s/p 3:32:09 } +2024-07-25 21:38:19,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1104/ 1625], loss: 0.958, per_step_time: 1470ms, lr: 1.9599927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:19,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43862 samples/s/p 3:31:57 } +2024-07-25 21:38:22,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1106/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 1.9593952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:22,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43293 samples/s/p 3:32:08 } +2024-07-25 21:38:25,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1108/ 1625], loss: 1.193, per_step_time: 1469ms, lr: 1.9587973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:25,624 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.44340 samples/s/p 3:31:40 } +2024-07-25 21:38:28,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1110/ 1625], loss: 0.976, per_step_time: 1471ms, lr: 1.9581998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:28,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43588 samples/s/p 3:31:55 } +2024-07-25 21:38:31,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1112/ 1625], loss: 1.302, per_step_time: 1473ms, lr: 1.9576019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:31,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.42991 samples/s/p 3:32:06 } +2024-07-25 21:38:34,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1114/ 1625], loss: 1.304, per_step_time: 1473ms, lr: 1.957004e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:34,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.42792 samples/s/p 3:32:08 } +2024-07-25 21:38:37,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1116/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.956406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:37,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43689 samples/s/p 3:31:44 } +2024-07-25 21:38:40,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1118/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 1.955808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:40,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43584 samples/s/p 
3:31:43 } +2024-07-25 21:38:43,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1120/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 1.95521e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:43,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43152 samples/s/p 3:31:50 } +2024-07-25 21:38:46,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1122/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 1.954612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:46,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43614 samples/s/p 3:31:37 } +2024-07-25 21:38:49,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1124/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 1.9540135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:49,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43182 samples/s/p 3:31:44 } +2024-07-25 21:38:52,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1126/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 1.9534153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:52,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43031 samples/s/p 3:31:44 } +2024-07-25 21:38:55,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1128/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 1.9528168e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:55,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43074 samples/s/p 3:31:41 } +2024-07-25 21:38:58,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], 
step:[ 1130/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 1.9522184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:58,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.44020 samples/s/p 3:31:16 } +2024-07-25 21:39:01,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1132/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 1.95162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:01,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43529 samples/s/p 3:31:24 } +2024-07-25 21:39:03,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1134/ 1625], loss: 1.303, per_step_time: 1470ms, lr: 1.9510213e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:03,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43862 samples/s/p 3:31:13 } +2024-07-25 21:39:06,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1136/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 1.9504225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:06,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43629 samples/s/p 3:31:16 } +2024-07-25 21:39:09,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1138/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.9498239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:09,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43553 samples/s/p 3:31:15 } +2024-07-25 21:39:12,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1140/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 1.949225e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:39:12,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43664 samples/s/p 3:31:09 } +2024-07-25 21:39:15,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1142/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 1.948626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:15,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43672 samples/s/p 3:31:06 } +2024-07-25 21:39:18,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1144/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 1.948027e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:18,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43237 samples/s/p 3:31:13 } +2024-07-25 21:39:21,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1146/ 1625], loss: 1.294, per_step_time: 1471ms, lr: 1.947428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:21,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43762 samples/s/p 3:30:58 } +2024-07-25 21:39:24,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1148/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 1.9468289e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:24,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.42992 samples/s/p 3:31:13 } +2024-07-25 21:39:27,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1150/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 1.9462297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:27,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ 
| 5.43384 samples/s/p 3:31:01 } +2024-07-25 21:39:30,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1152/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.9456304e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:30,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43750 samples/s/p 3:30:49 } +2024-07-25 21:39:33,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1154/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 1.9450312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:33,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43820 samples/s/p 3:30:45 } +2024-07-25 21:39:36,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1156/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 1.9444315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:36,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43607 samples/s/p 3:30:47 } +2024-07-25 21:39:39,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1158/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.9438321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:39,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43662 samples/s/p 3:30:43 } +2024-07-25 21:39:42,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1160/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 1.9432326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:42,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.44018 samples/s/p 3:30:31 } +2024-07-25 21:39:45,299 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 5/ 10], step:[ 1162/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 1.942633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:45,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.44119 samples/s/p 3:30:26 } +2024-07-25 21:39:48,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1164/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 1.942033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:48,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43130 samples/s/p 3:30:46 } +2024-07-25 21:39:51,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1166/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.9414336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:51,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43660 samples/s/p 3:30:31 } +2024-07-25 21:39:54,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1168/ 1625], loss: 1.320, per_step_time: 1470ms, lr: 1.9408335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:54,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43935 samples/s/p 3:30:22 } +2024-07-25 21:39:57,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1170/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.9402336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:57,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43629 samples/s/p 3:30:26 } +2024-07-25 21:40:00,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1172/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 1.9396337e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:40:00,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43010 samples/s/p 3:30:37 } +2024-07-25 21:40:03,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1174/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 1.9390336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:03,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43084 samples/s/p 3:30:33 } +2024-07-25 21:40:05,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1176/ 1625], loss: 1.285, per_step_time: 1471ms, lr: 1.9384335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:05,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43694 samples/s/p 3:30:15 } +2024-07-25 21:40:08,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1178/ 1625], loss: 1.039, per_step_time: 1474ms, lr: 1.9378333e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:08,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.42555 samples/s/p 3:30:39 } +2024-07-25 21:40:11,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1180/ 1625], loss: 1.450, per_step_time: 1472ms, lr: 1.9372328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:11,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43474 samples/s/p 3:30:15 } +2024-07-25 21:40:14,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1182/ 1625], loss: 1.337, per_step_time: 1470ms, lr: 1.9366327e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:14,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% 
|███████████████████████ | 5.43912 samples/s/p 3:30:02 } +2024-07-25 21:40:17,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1184/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 1.9360323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:17,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43526 samples/s/p 3:30:08 } +2024-07-25 21:40:20,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1186/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 1.9354316e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:20,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43814 samples/s/p 3:29:58 } +2024-07-25 21:40:23,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1188/ 1625], loss: 1.164, per_step_time: 1469ms, lr: 1.934831e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:23,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.44463 samples/s/p 3:29:40 } +2024-07-25 21:40:26,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1190/ 1625], loss: 1.341, per_step_time: 1472ms, lr: 1.9342304e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:26,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43438 samples/s/p 3:30:01 } +2024-07-25 21:40:29,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1192/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.9336298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:29,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43732 samples/s/p 3:29:51 } +2024-07-25 21:40:32,514 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1194/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 1.933029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:32,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43331 samples/s/p 3:29:57 } +2024-07-25 21:40:35,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1196/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.9324281e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:35,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43249 samples/s/p 3:29:56 } +2024-07-25 21:40:38,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1198/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 1.9318273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:38,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43355 samples/s/p 3:29:51 } +2024-07-25 21:40:41,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1200/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 1.9312261e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:41,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43237 samples/s/p 3:29:51 } +2024-07-25 21:40:44,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1202/ 1625], loss: 1.060, per_step_time: 1470ms, lr: 1.930625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:44,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43949 samples/s/p 3:29:31 } +2024-07-25 21:40:47,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1204/ 1625], loss: 1.120, 
per_step_time: 1473ms, lr: 1.930024e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:47,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.42944 samples/s/p 3:29:52 } +2024-07-25 21:40:50,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1206/ 1625], loss: 1.134, per_step_time: 1470ms, lr: 1.9294228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:50,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.44201 samples/s/p 3:29:20 } +2024-07-25 21:40:53,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1208/ 1625], loss: 0.975, per_step_time: 1469ms, lr: 1.9288214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:53,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.44252 samples/s/p 3:29:15 } +2024-07-25 21:40:56,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1210/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 1.92822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:56,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43531 samples/s/p 3:29:29 } +2024-07-25 21:40:59,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1212/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 1.9276187e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:59,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.44176 samples/s/p 3:29:11 } +2024-07-25 21:41:02,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1214/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 1.9270172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:02,018 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43374 samples/s/p 3:29:27 } +2024-07-25 21:41:04,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1216/ 1625], loss: 1.033, per_step_time: 1472ms, lr: 1.9264156e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:04,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43405 samples/s/p 3:29:23 } +2024-07-25 21:41:07,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1218/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 1.925814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:07,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43511 samples/s/p 3:29:18 } +2024-07-25 21:41:10,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1220/ 1625], loss: 1.007, per_step_time: 1473ms, lr: 1.9252126e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:10,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.42934 samples/s/p 3:29:28 } +2024-07-25 21:41:13,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1222/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.9246108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:13,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43628 samples/s/p 3:29:09 } +2024-07-25 21:41:16,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1224/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.9240086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:16,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43815 samples/s/p 
3:29:02 } +2024-07-25 21:41:19,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1226/ 1625], loss: 1.275, per_step_time: 1469ms, lr: 1.9234069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:19,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.44285 samples/s/p 3:28:48 } +2024-07-25 21:41:22,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1228/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 1.922805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:22,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43512 samples/s/p 3:29:03 } +2024-07-25 21:41:25,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1230/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 1.9222029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:25,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.44106 samples/s/p 3:28:46 } +2024-07-25 21:41:28,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1232/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.9216008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:28,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43784 samples/s/p 3:28:51 } +2024-07-25 21:41:31,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1234/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 1.9209985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:31,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43757 samples/s/p 3:28:49 } +2024-07-25 21:41:34,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], 
step:[ 1236/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 1.9203962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:34,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43609 samples/s/p 3:28:49 } +2024-07-25 21:41:37,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1238/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.919794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:37,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43836 samples/s/p 3:28:41 } +2024-07-25 21:41:40,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1240/ 1625], loss: 1.318, per_step_time: 1472ms, lr: 1.9191915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:40,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43436 samples/s/p 3:28:47 } +2024-07-25 21:41:43,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1242/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 1.918589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:43,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43419 samples/s/p 3:28:45 } +2024-07-25 21:41:46,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1244/ 1625], loss: 1.031, per_step_time: 1470ms, lr: 1.9179866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:46,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.44175 samples/s/p 3:28:24 } +2024-07-25 21:41:49,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1246/ 1625], loss: 1.304, per_step_time: 1472ms, lr: 1.917384e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:41:49,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43465 samples/s/p 3:28:38 } +2024-07-25 21:41:52,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1248/ 1625], loss: 1.049, per_step_time: 1472ms, lr: 1.9167815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:52,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43128 samples/s/p 3:28:43 } +2024-07-25 21:41:55,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1250/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 1.9161786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:55,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43929 samples/s/p 3:28:21 } +2024-07-25 21:41:58,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1252/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 1.915576e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:58,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43142 samples/s/p 3:28:36 } +2024-07-25 21:42:01,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1254/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 1.914973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:01,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43628 samples/s/p 3:28:22 } +2024-07-25 21:42:03,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1256/ 1625], loss: 1.296, per_step_time: 1472ms, lr: 1.9143701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:03,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ 
| 5.43180 samples/s/p 3:28:30 } +2024-07-25 21:42:06,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1258/ 1625], loss: 0.967, per_step_time: 1471ms, lr: 1.913767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:06,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43801 samples/s/p 3:28:12 } +2024-07-25 21:42:09,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1260/ 1625], loss: 1.028, per_step_time: 1469ms, lr: 1.9131641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:09,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.44239 samples/s/p 3:27:59 } +2024-07-25 21:42:12,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1262/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 1.9125608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:12,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43975 samples/s/p 3:28:02 } +2024-07-25 21:42:15,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1264/ 1625], loss: 1.270, per_step_time: 1473ms, lr: 1.9119578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:15,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.42884 samples/s/p 3:28:25 } +2024-07-25 21:42:18,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1266/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 1.9113546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:18,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43621 samples/s/p 3:28:05 } +2024-07-25 21:42:21,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 5/ 10], step:[ 1268/ 1625], loss: 0.899, per_step_time: 1470ms, lr: 1.910751e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:21,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.44054 samples/s/p 3:27:52 } +2024-07-25 21:42:24,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1270/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 1.9101477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:24,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43675 samples/s/p 3:27:58 } +2024-07-25 21:42:27,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1272/ 1625], loss: 1.277, per_step_time: 1471ms, lr: 1.9095443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:27,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43714 samples/s/p 3:27:54 } +2024-07-25 21:42:30,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1274/ 1625], loss: 1.303, per_step_time: 1472ms, lr: 1.9089408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:30,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43305 samples/s/p 3:28:00 } +2024-07-25 21:42:33,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1276/ 1625], loss: 1.111, per_step_time: 1471ms, lr: 1.908337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:33,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.43634 samples/s/p 3:27:50 } +2024-07-25 21:42:36,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1278/ 1625], loss: 1.248, per_step_time: 1473ms, lr: 1.9077335e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:42:36,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.42951 samples/s/p 3:28:02 } +2024-07-25 21:42:39,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1280/ 1625], loss: 0.998, per_step_time: 1473ms, lr: 1.9071298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:39,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.42990 samples/s/p 3:27:59 } +2024-07-25 21:42:42,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1282/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.9065259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:42,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.43726 samples/s/p 3:27:39 } +2024-07-25 21:42:45,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1284/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 1.9059222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:45,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.43611 samples/s/p 3:27:38 } +2024-07-25 21:42:48,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1286/ 1625], loss: 1.057, per_step_time: 1470ms, lr: 1.9053183e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:48,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.44112 samples/s/p 3:27:24 } +2024-07-25 21:42:51,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1288/ 1625], loss: 0.966, per_step_time: 1471ms, lr: 1.9047144e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:51,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% 
|███████████████████████ | 5.43708 samples/s/p 3:27:30 } +2024-07-25 21:42:54,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1290/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.9041101e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:54,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.43825 samples/s/p 3:27:25 } +2024-07-25 21:42:57,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1292/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.9035058e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:57,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.43546 samples/s/p 3:27:28 } +2024-07-25 21:43:00,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1294/ 1625], loss: 1.284, per_step_time: 1474ms, lr: 1.902902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:00,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.42728 samples/s/p 3:27:44 } +2024-07-25 21:43:02,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1296/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 1.9022977e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:02,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.43911 samples/s/p 3:27:14 } +2024-07-25 21:43:05,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1298/ 1625], loss: 0.944, per_step_time: 1471ms, lr: 1.9016934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:05,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.43764 samples/s/p 3:27:14 } +2024-07-25 21:43:08,887 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1300/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.901089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:08,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.43398 samples/s/p 3:27:20 } +2024-07-25 21:43:11,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1302/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 1.9004845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:11,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.42899 samples/s/p 3:27:28 } +2024-07-25 21:43:14,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1304/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 1.8998799e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:14,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.43312 samples/s/p 3:27:16 } +2024-07-25 21:43:17,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1306/ 1625], loss: 1.195, per_step_time: 1470ms, lr: 1.8992752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:17,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.44169 samples/s/p 3:26:53 } +2024-07-25 21:43:20,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1308/ 1625], loss: 1.009, per_step_time: 1472ms, lr: 1.8986706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:20,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.43173 samples/s/p 3:27:13 } +2024-07-25 21:43:23,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1310/ 1625], loss: 1.085, 
per_step_time: 1473ms, lr: 1.8980661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:23,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.42833 samples/s/p 3:27:18 } +2024-07-25 21:43:26,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1312/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 1.8974612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:26,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.43720 samples/s/p 3:26:55 } +2024-07-25 21:43:29,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1314/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 1.8968563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:29,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.43575 samples/s/p 3:26:55 } +2024-07-25 21:43:32,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1316/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 1.8962515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:32,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.42872 samples/s/p 3:27:08 } +2024-07-25 21:43:35,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1318/ 1625], loss: 1.258, per_step_time: 1471ms, lr: 1.8956465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:35,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.43641 samples/s/p 3:26:48 } +2024-07-25 21:43:38,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1320/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 1.8950414e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:38,407 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.43177 samples/s/p 3:26:55 } +2024-07-25 21:43:41,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1322/ 1625], loss: 1.007, per_step_time: 1472ms, lr: 1.8944364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:41,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.43350 samples/s/p 3:26:48 } +2024-07-25 21:43:44,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1324/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 1.8938314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:44,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.42945 samples/s/p 3:26:55 } +2024-07-25 21:43:47,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1326/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 1.8932262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:47,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.42961 samples/s/p 3:26:51 } +2024-07-25 21:43:50,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1328/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 1.8926208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:50,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.43218 samples/s/p 3:26:43 } +2024-07-25 21:43:53,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1330/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 1.8920155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:53,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.44135 
samples/s/p 3:26:19 } +2024-07-25 21:43:56,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1332/ 1625], loss: 1.164, per_step_time: 1474ms, lr: 1.8914103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:56,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.42673 samples/s/p 3:26:49 } +2024-07-25 21:43:59,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1334/ 1625], loss: 1.034, per_step_time: 1470ms, lr: 1.8908046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:59,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.44110 samples/s/p 3:26:13 } +2024-07-25 21:44:02,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1336/ 1625], loss: 0.987, per_step_time: 1470ms, lr: 1.890199e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:02,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.43936 samples/s/p 3:26:14 } +2024-07-25 21:44:04,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1338/ 1625], loss: 1.290, per_step_time: 1472ms, lr: 1.8895937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:04,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.43382 samples/s/p 3:26:24 } +2024-07-25 21:44:07,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1340/ 1625], loss: 1.136, per_step_time: 1473ms, lr: 1.888988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:07,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.43099 samples/s/p 3:26:28 } +2024-07-25 21:44:10,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 5/ 10], step:[ 1342/ 1625], loss: 1.301, per_step_time: 1470ms, lr: 1.888382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:10,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43900 samples/s/p 3:26:06 } +2024-07-25 21:44:13,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1344/ 1625], loss: 1.011, per_step_time: 1472ms, lr: 1.8877763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:13,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43345 samples/s/p 3:26:16 } +2024-07-25 21:44:16,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1346/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 1.8871706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:16,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43444 samples/s/p 3:26:11 } +2024-07-25 21:44:19,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1348/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.8865647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:19,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43150 samples/s/p 3:26:15 } +2024-07-25 21:44:22,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1350/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 1.8859586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:22,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43696 samples/s/p 3:25:59 } +2024-07-25 21:44:25,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1352/ 1625], loss: 1.028, per_step_time: 1474ms, lr: 1.8853527e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:44:25,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.42612 samples/s/p 3:26:21 } +2024-07-25 21:44:28,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1354/ 1625], loss: 0.906, per_step_time: 1471ms, lr: 1.8847466e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:28,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43505 samples/s/p 3:25:58 } +2024-07-25 21:44:31,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1356/ 1625], loss: 1.156, per_step_time: 1473ms, lr: 1.8841405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:31,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.42789 samples/s/p 3:26:11 } +2024-07-25 21:44:34,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1358/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 1.883534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:34,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.43321 samples/s/p 3:25:56 } +2024-07-25 21:44:37,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1360/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 1.882928e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:37,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.43433 samples/s/p 3:25:51 } +2024-07-25 21:44:40,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1362/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 1.8823217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:40,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% 
|████████████████████████ | 5.43565 samples/s/p 3:25:45 } +2024-07-25 21:44:43,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1364/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 1.8817153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:43,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.43549 samples/s/p 3:25:42 } +2024-07-25 21:44:46,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1366/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 1.8811088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:46,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.42847 samples/s/p 3:25:55 } +2024-07-25 21:44:49,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1368/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 1.8805022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:49,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.43418 samples/s/p 3:25:39 } +2024-07-25 21:44:52,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1370/ 1625], loss: 1.189, per_step_time: 1470ms, lr: 1.8798957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:52,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.43914 samples/s/p 3:25:25 } +2024-07-25 21:44:55,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1372/ 1625], loss: 1.286, per_step_time: 1469ms, lr: 1.8792889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:55,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.44255 samples/s/p 3:25:14 } +2024-07-25 21:44:58,096 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1374/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.8786823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:58,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43556 samples/s/p 3:25:27 } +2024-07-25 21:45:01,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1376/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.8780756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:01,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43347 samples/s/p 3:25:29 } +2024-07-25 21:45:03,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1378/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 1.8774688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:03,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43864 samples/s/p 3:25:14 } +2024-07-25 21:45:06,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1380/ 1625], loss: 1.317, per_step_time: 1471ms, lr: 1.8768616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:06,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43697 samples/s/p 3:25:15 } +2024-07-25 21:45:09,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1382/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 1.876255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:09,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43310 samples/s/p 3:25:21 } +2024-07-25 21:45:12,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1384/ 1625], loss: 1.066, 
per_step_time: 1471ms, lr: 1.875648e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:12,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43835 samples/s/p 3:25:06 } +2024-07-25 21:45:15,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1386/ 1625], loss: 1.354, per_step_time: 1472ms, lr: 1.8750408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:15,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43175 samples/s/p 3:25:18 } +2024-07-25 21:45:18,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1388/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 1.8744337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:18,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43313 samples/s/p 3:25:12 } +2024-07-25 21:45:21,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1390/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 1.8738265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:21,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43335 samples/s/p 3:25:09 } +2024-07-25 21:45:24,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1392/ 1625], loss: 1.255, per_step_time: 1472ms, lr: 1.8732191e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:24,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43244 samples/s/p 3:25:08 } +2024-07-25 21:45:27,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1394/ 1625], loss: 1.225, per_step_time: 1470ms, lr: 1.872612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:27,608 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.44018 samples/s/p 3:24:47 } +2024-07-25 21:45:30,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1396/ 1625], loss: 1.383, per_step_time: 1472ms, lr: 1.8720046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:30,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43138 samples/s/p 3:25:04 } +2024-07-25 21:45:33,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1398/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.8713974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:33,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43241 samples/s/p 3:24:59 } +2024-07-25 21:45:36,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1400/ 1625], loss: 1.313, per_step_time: 1472ms, lr: 1.8707897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:36,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43123 samples/s/p 3:24:59 } +2024-07-25 21:45:39,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1402/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.870182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:39,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43396 samples/s/p 3:24:50 } +2024-07-25 21:45:42,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1404/ 1625], loss: 0.955, per_step_time: 1470ms, lr: 1.8695746e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:42,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.44070 
samples/s/p 3:24:31 } +2024-07-25 21:45:45,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1406/ 1625], loss: 1.150, per_step_time: 1473ms, lr: 1.8689669e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:45,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.42980 samples/s/p 3:24:53 } +2024-07-25 21:45:48,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1408/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 1.8683593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:48,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43411 samples/s/p 3:24:40 } +2024-07-25 21:45:51,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1410/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 1.8677512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:51,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43885 samples/s/p 3:24:27 } +2024-07-25 21:45:54,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1412/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 1.8671435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:54,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43461 samples/s/p 3:24:33 } +2024-07-25 21:45:57,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1414/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 1.8665356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:57,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43172 samples/s/p 3:24:37 } +2024-07-25 21:46:00,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 5/ 10], step:[ 1416/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 1.8659277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:00,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43709 samples/s/p 3:24:22 } +2024-07-25 21:46:03,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1418/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 1.8653196e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:03,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43045 samples/s/p 3:24:34 } +2024-07-25 21:46:05,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1420/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.8647115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:05,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43744 samples/s/p 3:24:15 } +2024-07-25 21:46:08,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1422/ 1625], loss: 1.319, per_step_time: 1472ms, lr: 1.8641036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:08,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43208 samples/s/p 3:24:24 } +2024-07-25 21:46:11,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1424/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.8634952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:11,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43760 samples/s/p 3:24:09 } +2024-07-25 21:46:14,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1426/ 1625], loss: 0.986, per_step_time: 1473ms, lr: 1.862887e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:46:14,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.42879 samples/s/p 3:24:26 } +2024-07-25 21:46:17,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1428/ 1625], loss: 1.176, per_step_time: 1474ms, lr: 1.8622788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:17,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.42646 samples/s/p 3:24:28 } +2024-07-25 21:46:20,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1430/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 1.8616704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:20,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43206 samples/s/p 3:24:13 } +2024-07-25 21:46:23,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1432/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 1.861062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:23,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43508 samples/s/p 3:24:03 } +2024-07-25 21:46:26,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1434/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 1.8604534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:26,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43609 samples/s/p 3:23:58 } +2024-07-25 21:46:29,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1436/ 1625], loss: 0.952, per_step_time: 1473ms, lr: 1.859845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:29,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% 
|████████████████████████ | 5.43001 samples/s/p 3:24:08 } +2024-07-25 21:46:32,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1438/ 1625], loss: 1.084, per_step_time: 1472ms, lr: 1.8592364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:32,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43113 samples/s/p 3:24:03 } +2024-07-25 21:46:35,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1440/ 1625], loss: 1.313, per_step_time: 1472ms, lr: 1.8586277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:35,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43262 samples/s/p 3:23:57 } +2024-07-25 21:46:38,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1442/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 1.858019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:38,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43752 samples/s/p 3:23:43 } +2024-07-25 21:46:41,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1444/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.8574103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:41,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43364 samples/s/p 3:23:49 } +2024-07-25 21:46:44,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1446/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 1.8568015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:44,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.44091 samples/s/p 3:23:29 } +2024-07-25 21:46:47,299 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1448/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 1.8561926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:47,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.44017 samples/s/p 3:23:28 } +2024-07-25 21:46:50,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1450/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 1.8555837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:50,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43366 samples/s/p 3:23:40 } +2024-07-25 21:46:53,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1452/ 1625], loss: 1.312, per_step_time: 1472ms, lr: 1.8549747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:53,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43379 samples/s/p 3:23:36 } +2024-07-25 21:46:56,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1454/ 1625], loss: 1.153, per_step_time: 1470ms, lr: 1.8543657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:56,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43945 samples/s/p 3:23:21 } +2024-07-25 21:46:59,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1456/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.8537567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:59,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43310 samples/s/p 3:23:32 } +2024-07-25 21:47:02,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1458/ 1625], loss: 1.175, 
per_step_time: 1471ms, lr: 1.8531473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:02,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43594 samples/s/p 3:23:23 } +2024-07-25 21:47:05,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1460/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 1.8525381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:05,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43846 samples/s/p 3:23:14 } +2024-07-25 21:47:07,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1462/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.8519288e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:07,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43803 samples/s/p 3:23:12 } +2024-07-25 21:47:10,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1464/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 1.8513196e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:10,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43677 samples/s/p 3:23:12 } +2024-07-25 21:47:13,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1466/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 1.8507104e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:13,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43677 samples/s/p 3:23:09 } +2024-07-25 21:47:16,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1468/ 1625], loss: 1.024, per_step_time: 1469ms, lr: 1.8501007e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:16,799 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.44414 samples/s/p 3:22:50 } +2024-07-25 21:47:19,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1470/ 1625], loss: 1.117, per_step_time: 1470ms, lr: 1.8494913e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:19,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43916 samples/s/p 3:22:58 } +2024-07-25 21:47:22,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1472/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 1.8488818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:22,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.43131 samples/s/p 3:23:13 } +2024-07-25 21:47:25,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1474/ 1625], loss: 1.323, per_step_time: 1469ms, lr: 1.848272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:25,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.44336 samples/s/p 3:22:43 } +2024-07-25 21:47:28,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1476/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 1.8476625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:28,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.43262 samples/s/p 3:23:04 } +2024-07-25 21:47:31,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1478/ 1625], loss: 1.269, per_step_time: 1473ms, lr: 1.8470528e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:31,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.42981 
samples/s/p 3:23:07 } +2024-07-25 21:47:34,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1480/ 1625], loss: 1.130, per_step_time: 1473ms, lr: 1.846443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:34,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.43001 samples/s/p 3:23:04 } +2024-07-25 21:47:37,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1482/ 1625], loss: 1.064, per_step_time: 1470ms, lr: 1.8458331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:37,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.44211 samples/s/p 3:22:34 } +2024-07-25 21:47:40,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1484/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 1.8452232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:40,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.43615 samples/s/p 3:22:44 } +2024-07-25 21:47:43,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1486/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 1.8446133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:43,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.43304 samples/s/p 3:22:48 } +2024-07-25 21:47:46,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1488/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 1.8440034e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:46,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43559 samples/s/p 3:22:39 } +2024-07-25 21:47:49,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 5/ 10], step:[ 1490/ 1625], loss: 1.207, per_step_time: 1473ms, lr: 1.8433933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:49,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.42833 samples/s/p 3:22:53 } +2024-07-25 21:47:52,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1492/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 1.8427832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:52,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43843 samples/s/p 3:22:27 } +2024-07-25 21:47:55,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1494/ 1625], loss: 1.010, per_step_time: 1471ms, lr: 1.8421732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:55,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43636 samples/s/p 3:22:29 } +2024-07-25 21:47:58,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1496/ 1625], loss: 1.187, per_step_time: 1470ms, lr: 1.841563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:58,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43909 samples/s/p 3:22:20 } +2024-07-25 21:48:01,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1498/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.8409528e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:01,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43716 samples/s/p 3:22:21 } +2024-07-25 21:48:04,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1500/ 1625], loss: 1.052, per_step_time: 1471ms, lr: 1.8403425e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:48:04,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43512 samples/s/p 3:22:23 } +2024-07-25 21:48:06,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1502/ 1625], loss: 0.982, per_step_time: 1472ms, lr: 1.839732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:06,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43411 samples/s/p 3:22:22 } +2024-07-25 21:48:09,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1504/ 1625], loss: 1.385, per_step_time: 1473ms, lr: 1.8391216e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:09,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.43055 samples/s/p 3:22:27 } +2024-07-25 21:48:12,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1506/ 1625], loss: 1.153, per_step_time: 1470ms, lr: 1.8385112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:12,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.44109 samples/s/p 3:22:01 } +2024-07-25 21:48:15,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1508/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 1.8379005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:15,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.43660 samples/s/p 3:22:08 } +2024-07-25 21:48:18,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1510/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 1.8372903e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:18,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% 
|████████████████████████ | 5.43804 samples/s/p 3:22:02 } +2024-07-25 21:48:21,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1512/ 1625], loss: 1.319, per_step_time: 1472ms, lr: 1.8366794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:21,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.43414 samples/s/p 3:22:07 } +2024-07-25 21:48:24,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1514/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 1.8360686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:24,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.43191 samples/s/p 3:22:09 } +2024-07-25 21:48:27,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1516/ 1625], loss: 1.070, per_step_time: 1470ms, lr: 1.8354582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:27,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.44141 samples/s/p 3:21:45 } +2024-07-25 21:48:30,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1518/ 1625], loss: 1.164, per_step_time: 1472ms, lr: 1.8348474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:30,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.43334 samples/s/p 3:22:00 } +2024-07-25 21:48:33,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1520/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.8342364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:33,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43805 samples/s/p 3:21:47 } +2024-07-25 21:48:36,466 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1522/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 1.8336255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:36,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43618 samples/s/p 3:21:48 } +2024-07-25 21:48:39,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1524/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 1.8330145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:39,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43528 samples/s/p 3:21:47 } +2024-07-25 21:48:42,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1526/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.8324039e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:42,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43711 samples/s/p 3:21:40 } +2024-07-25 21:48:45,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1528/ 1625], loss: 1.280, per_step_time: 1471ms, lr: 1.8317924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:45,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43576 samples/s/p 3:21:40 } +2024-07-25 21:48:48,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1530/ 1625], loss: 1.245, per_step_time: 1471ms, lr: 1.8311814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:48,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43556 samples/s/p 3:21:38 } +2024-07-25 21:48:51,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1532/ 1625], loss: 1.274, 
per_step_time: 1471ms, lr: 1.8305704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:51,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43818 samples/s/p 3:21:29 } +2024-07-25 21:48:54,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1534/ 1625], loss: 0.995, per_step_time: 1470ms, lr: 1.8299592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:54,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.44215 samples/s/p 3:21:17 } +2024-07-25 21:48:57,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1536/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 1.8293478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:57,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43744 samples/s/p 3:21:25 } +2024-07-25 21:49:00,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1538/ 1625], loss: 1.015, per_step_time: 1471ms, lr: 1.8287366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:00,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43776 samples/s/p 3:21:21 } +2024-07-25 21:49:03,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1540/ 1625], loss: 1.409, per_step_time: 1473ms, lr: 1.8281251e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:03,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43083 samples/s/p 3:21:33 } +2024-07-25 21:49:05,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1542/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 1.8275137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:05,969 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43537 samples/s/p 3:21:20 } +2024-07-25 21:49:08,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1544/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.8269022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:08,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43363 samples/s/p 3:21:21 } +2024-07-25 21:49:11,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1546/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 1.8262908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:11,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43521 samples/s/p 3:21:15 } +2024-07-25 21:49:14,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1548/ 1625], loss: 1.337, per_step_time: 1472ms, lr: 1.8256795e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:14,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43278 samples/s/p 3:21:17 } +2024-07-25 21:49:17,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1550/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 1.8250676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:17,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43210 samples/s/p 3:21:16 } +2024-07-25 21:49:20,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1552/ 1625], loss: 0.950, per_step_time: 1470ms, lr: 1.824456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:20,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.44114 
samples/s/p 3:20:53 } +2024-07-25 21:49:23,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1554/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 1.8238445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:23,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43471 samples/s/p 3:21:04 } +2024-07-25 21:49:26,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1556/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 1.8232326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:26,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43441 samples/s/p 3:21:02 } +2024-07-25 21:49:29,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1558/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.8226207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:29,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43245 samples/s/p 3:21:03 } +2024-07-25 21:49:32,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1560/ 1625], loss: 1.035, per_step_time: 1471ms, lr: 1.822009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:32,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43795 samples/s/p 3:20:48 } +2024-07-25 21:49:35,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1562/ 1625], loss: 0.939, per_step_time: 1471ms, lr: 1.8213968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:35,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43641 samples/s/p 3:20:49 } +2024-07-25 21:49:38,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 5/ 10], step:[ 1564/ 1625], loss: 1.295, per_step_time: 1474ms, lr: 1.820785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:38,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.42632 samples/s/p 3:21:08 } +2024-07-25 21:49:41,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1566/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.8201728e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:41,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43490 samples/s/p 3:20:46 } +2024-07-25 21:49:44,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1568/ 1625], loss: 1.305, per_step_time: 1470ms, lr: 1.8195607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:44,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.44154 samples/s/p 3:20:28 } +2024-07-25 21:49:47,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1570/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 1.8189487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:47,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43729 samples/s/p 3:20:35 } +2024-07-25 21:49:50,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1572/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 1.8183366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:50,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43196 samples/s/p 3:20:44 } +2024-07-25 21:49:53,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1574/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.8177245e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:49:53,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43422 samples/s/p 3:20:36 } +2024-07-25 21:49:56,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1576/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 1.8171122e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:56,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43476 samples/s/p 3:20:32 } +2024-07-25 21:49:59,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1578/ 1625], loss: 0.957, per_step_time: 1471ms, lr: 1.8165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:59,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43683 samples/s/p 3:20:24 } +2024-07-25 21:50:02,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1580/ 1625], loss: 1.067, per_step_time: 1470ms, lr: 1.8158873e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:02,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43853 samples/s/p 3:20:17 } +2024-07-25 21:50:04,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1582/ 1625], loss: 1.251, per_step_time: 1470ms, lr: 1.815275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:04,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43985 samples/s/p 3:20:12 } +2024-07-25 21:50:07,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1584/ 1625], loss: 1.024, per_step_time: 1471ms, lr: 1.8146626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:07,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% 
|████████████████████████ | 5.43690 samples/s/p 3:20:15 } +2024-07-25 21:50:10,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1586/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 1.8140501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:10,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43988 samples/s/p 3:20:06 } +2024-07-25 21:50:13,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1588/ 1625], loss: 1.242, per_step_time: 1473ms, lr: 1.8134375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:13,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43020 samples/s/p 3:20:24 } +2024-07-25 21:50:16,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1590/ 1625], loss: 1.226, per_step_time: 1469ms, lr: 1.8128248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:16,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.44296 samples/s/p 3:19:53 } +2024-07-25 21:50:19,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1592/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 1.8122122e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:19,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43811 samples/s/p 3:20:01 } +2024-07-25 21:50:22,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1594/ 1625], loss: 1.348, per_step_time: 1472ms, lr: 1.8115996e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:22,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43305 samples/s/p 3:20:09 } +2024-07-25 21:50:25,636 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1596/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 1.8109868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:25,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43638 samples/s/p 3:19:59 } +2024-07-25 21:50:28,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1598/ 1625], loss: 1.319, per_step_time: 1472ms, lr: 1.8103741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:28,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43469 samples/s/p 3:19:59 } +2024-07-25 21:50:31,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1600/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 1.8097613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:31,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43148 samples/s/p 3:20:04 } +2024-07-25 21:50:34,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1602/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 1.8091481e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:34,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43646 samples/s/p 3:19:50 } +2024-07-25 21:50:37,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1604/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 1.8085353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:37,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43420 samples/s/p 3:19:52 } +2024-07-25 21:50:40,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1606/ 1625], loss: 1.076, 
per_step_time: 1471ms, lr: 1.8079225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:40,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43646 samples/s/p 3:19:44 } +2024-07-25 21:50:43,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1608/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.8073093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:43,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43549 samples/s/p 3:19:43 } +2024-07-25 21:50:46,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1610/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 1.8066961e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:46,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43811 samples/s/p 3:19:34 } +2024-07-25 21:50:49,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1612/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 1.8060831e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:49,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43643 samples/s/p 3:19:35 } +2024-07-25 21:50:52,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1614/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 1.8054698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:52,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43713 samples/s/p 3:19:31 } +2024-07-25 21:50:55,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1616/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.8048568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:55,145 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43382 samples/s/p 3:19:35 } +2024-07-25 21:50:58,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1618/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 1.8042434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:58,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.43447 samples/s/p 3:19:30 } +2024-07-25 21:51:01,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1620/ 1625], loss: 1.042, per_step_time: 1470ms, lr: 1.8036299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:01,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.44198 samples/s/p 3:19:11 } +2024-07-25 21:51:03,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1622/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 1.8030169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:03,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.43391 samples/s/p 3:19:26 } +2024-07-25 21:51:06,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1624/ 1625], loss: 0.980, per_step_time: 1469ms, lr: 1.8024031e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:06,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.44225 samples/s/p 3:19:05 } +2024-07-25 21:51:09,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 1.80179e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:09,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.43670 samples/s/p 
3:19:14 } +2024-07-25 21:51:12,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 3/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.8011764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:12,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.43629 samples/s/p 3:19:12 } +2024-07-25 21:51:15,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 5/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 1.8005629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:15,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.43323 samples/s/p 3:19:16 } +2024-07-25 21:51:18,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 7/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.7999491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:18,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.43760 samples/s/p 3:19:03 } +2024-07-25 21:51:21,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 9/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 1.7993356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:21,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43376 samples/s/p 3:19:09 } +2024-07-25 21:51:24,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 11/ 1625], loss: 1.096, per_step_time: 1469ms, lr: 1.7987217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:24,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.44277 samples/s/p 3:18:46 } +2024-07-25 21:51:27,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], 
step:[ 13/ 1625], loss: 1.056, per_step_time: 1475ms, lr: 1.798108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:27,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.42025 samples/s/p 3:19:32 } +2024-07-25 21:51:30,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 15/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 1.7974944e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:30,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43360 samples/s/p 3:19:00 } +2024-07-25 21:51:33,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 17/ 1625], loss: 0.984, per_step_time: 1471ms, lr: 1.7968803e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:33,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43845 samples/s/p 3:18:46 } +2024-07-25 21:51:36,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 19/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 1.7962668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:36,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.42990 samples/s/p 3:19:02 } +2024-07-25 21:51:39,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 21/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 1.7956525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:39,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43803 samples/s/p 3:18:41 } +2024-07-25 21:51:42,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 23/ 1625], loss: 1.355, per_step_time: 1471ms, lr: 1.7950388e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:51:42,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43518 samples/s/p 3:18:45 } +2024-07-25 21:51:45,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 25/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 1.7944249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:45,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43914 samples/s/p 3:18:33 } +2024-07-25 21:51:48,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 27/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 1.7938106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:48,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43944 samples/s/p 3:18:30 } +2024-07-25 21:51:51,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 29/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 1.7931965e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:51,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43454 samples/s/p 3:18:37 } +2024-07-25 21:51:54,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 31/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 1.7925824e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:54,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43351 samples/s/p 3:18:37 } +2024-07-25 21:51:57,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 33/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.7919681e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:57,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% 
|█████████████████████████ | 5.43239 samples/s/p 3:18:36 } +2024-07-25 21:52:00,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 35/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 1.7913539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:00,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43087 samples/s/p 3:18:37 } +2024-07-25 21:52:03,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 37/ 1625], loss: 1.025, per_step_time: 1473ms, lr: 1.7907396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:03,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43033 samples/s/p 3:18:35 } +2024-07-25 21:52:05,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 39/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 1.7901253e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:05,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43583 samples/s/p 3:18:20 } +2024-07-25 21:52:08,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 41/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 1.789511e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:08,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.43462 samples/s/p 3:18:19 } +2024-07-25 21:52:11,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 43/ 1625], loss: 1.354, per_step_time: 1470ms, lr: 1.7888964e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:11,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.44199 samples/s/p 3:18:00 } +2024-07-25 21:52:14,812 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 45/ 1625], loss: 1.080, per_step_time: 1470ms, lr: 1.788282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:14,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.43992 samples/s/p 3:18:02 } +2024-07-25 21:52:17,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 47/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 1.7876677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:17,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.43320 samples/s/p 3:18:14 } +2024-07-25 21:52:20,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 49/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.787053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:20,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.43543 samples/s/p 3:18:06 } +2024-07-25 21:52:23,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 51/ 1625], loss: 1.256, per_step_time: 1474ms, lr: 1.7864384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:23,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.42431 samples/s/p 3:18:27 } +2024-07-25 21:52:26,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 53/ 1625], loss: 1.194, per_step_time: 1469ms, lr: 1.7858238e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:26,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.44564 samples/s/p 3:17:38 } +2024-07-25 21:52:29,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 55/ 1625], loss: 1.111, 
per_step_time: 1471ms, lr: 1.7852091e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:29,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.43510 samples/s/p 3:17:58 } +2024-07-25 21:52:32,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 57/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.7845947e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:32,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43630 samples/s/p 3:17:52 } +2024-07-25 21:52:35,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 59/ 1625], loss: 1.319, per_step_time: 1472ms, lr: 1.7839797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:35,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43150 samples/s/p 3:18:00 } +2024-07-25 21:52:38,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 61/ 1625], loss: 1.065, per_step_time: 1473ms, lr: 1.7833649e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:38,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.42981 samples/s/p 3:18:01 } +2024-07-25 21:52:41,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 63/ 1625], loss: 1.351, per_step_time: 1473ms, lr: 1.78275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:41,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43100 samples/s/p 3:17:55 } +2024-07-25 21:52:44,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 65/ 1625], loss: 1.109, per_step_time: 1470ms, lr: 1.7821352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:44,328 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43866 samples/s/p 3:17:35 } +2024-07-25 21:52:47,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 67/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 1.78152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:47,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43797 samples/s/p 3:17:34 } +2024-07-25 21:52:50,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 69/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 1.7809052e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:50,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43687 samples/s/p 3:17:33 } +2024-07-25 21:52:53,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 71/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 1.7802902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:53,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43843 samples/s/p 3:17:27 } +2024-07-25 21:52:56,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 73/ 1625], loss: 1.242, per_step_time: 1482ms, lr: 1.7796752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:56,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.39700 samples/s/p 3:18:55 } +2024-07-25 21:52:59,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 75/ 1625], loss: 0.993, per_step_time: 1470ms, lr: 1.77906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:59,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43976 samples/s/p 
3:17:18 } +2024-07-25 21:53:02,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 77/ 1625], loss: 0.873, per_step_time: 1470ms, lr: 1.7784449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:02,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.44155 samples/s/p 3:17:11 } +2024-07-25 21:53:04,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 79/ 1625], loss: 1.275, per_step_time: 1470ms, lr: 1.7778299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:04,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43882 samples/s/p 3:17:14 } +2024-07-25 21:53:07,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 81/ 1625], loss: 1.112, per_step_time: 1469ms, lr: 1.7772145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:07,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.44353 samples/s/p 3:17:01 } +2024-07-25 21:53:10,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 83/ 1625], loss: 1.101, per_step_time: 1470ms, lr: 1.7765991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:10,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43891 samples/s/p 3:17:08 } +2024-07-25 21:53:13,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 85/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 1.775984e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:13,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43412 samples/s/p 3:17:16 } +2024-07-25 21:53:16,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], 
step:[ 87/ 1625], loss: 1.158, per_step_time: 1469ms, lr: 1.7753686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:16,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.44327 samples/s/p 3:16:53 } +2024-07-25 21:53:19,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 89/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 1.774753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:19,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43388 samples/s/p 3:17:10 } +2024-07-25 21:53:22,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 91/ 1625], loss: 1.184, per_step_time: 1469ms, lr: 1.7741377e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:22,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.44286 samples/s/p 3:16:48 } +2024-07-25 21:53:25,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 93/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 1.7735223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:25,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43398 samples/s/p 3:17:04 } +2024-07-25 21:53:28,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 95/ 1625], loss: 1.079, per_step_time: 1472ms, lr: 1.7729066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:28,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43288 samples/s/p 3:17:04 } +2024-07-25 21:53:31,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 97/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.772291e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:53:31,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43293 samples/s/p 3:17:01 } +2024-07-25 21:53:34,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 99/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 1.7716755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:34,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43109 samples/s/p 3:17:02 } +2024-07-25 21:53:37,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 101/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.77106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:37,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43780 samples/s/p 3:16:44 } +2024-07-25 21:53:40,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 103/ 1625], loss: 1.210, per_step_time: 1471ms, lr: 1.7704442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:40,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43765 samples/s/p 3:16:42 } +2024-07-25 21:53:43,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 105/ 1625], loss: 1.068, per_step_time: 1472ms, lr: 1.7698285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:43,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43452 samples/s/p 3:16:46 } +2024-07-25 21:53:46,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 107/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 1.7692128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:46,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% 
|█████████████████████████ | 5.44023 samples/s/p 3:16:30 } +2024-07-25 21:53:49,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 109/ 1625], loss: 1.241, per_step_time: 1470ms, lr: 1.768597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:49,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43870 samples/s/p 3:16:31 } +2024-07-25 21:53:52,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 111/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 1.767981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:52,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43472 samples/s/p 3:16:36 } +2024-07-25 21:53:55,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 113/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 1.7673652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:55,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43569 samples/s/p 3:16:31 } +2024-07-25 21:53:58,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 115/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 1.7667493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:58,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43133 samples/s/p 3:16:38 } +2024-07-25 21:54:01,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 117/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 1.7661332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:01,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43141 samples/s/p 3:16:35 } +2024-07-25 21:54:03,999 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 119/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.7655173e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:04,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43408 samples/s/p 3:16:26 } +2024-07-25 21:54:06,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 121/ 1625], loss: 1.184, per_step_time: 1473ms, lr: 1.764901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:06,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43039 samples/s/p 3:16:31 } +2024-07-25 21:54:09,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 123/ 1625], loss: 1.144, per_step_time: 1472ms, lr: 1.7642853e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:09,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43256 samples/s/p 3:16:23 } +2024-07-25 21:54:12,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 125/ 1625], loss: 1.249, per_step_time: 1473ms, lr: 1.763669e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:12,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43063 samples/s/p 3:16:24 } +2024-07-25 21:54:15,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 127/ 1625], loss: 1.226, per_step_time: 1470ms, lr: 1.7630528e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:15,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43855 samples/s/p 3:16:04 } +2024-07-25 21:54:18,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 129/ 1625], loss: 1.178, 
per_step_time: 1473ms, lr: 1.7624367e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:18,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43102 samples/s/p 3:16:18 } +2024-07-25 21:54:21,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 131/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.7618206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:21,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43285 samples/s/p 3:16:11 } +2024-07-25 21:54:24,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 133/ 1625], loss: 1.187, per_step_time: 1473ms, lr: 1.761204e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:24,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.42907 samples/s/p 3:16:16 } +2024-07-25 21:54:27,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 135/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 1.7605877e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:27,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43345 samples/s/p 3:16:04 } +2024-07-25 21:54:30,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 137/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 1.7599716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:30,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43143 samples/s/p 3:16:05 } +2024-07-25 21:54:33,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 139/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.759355e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:33,522 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43790 samples/s/p 3:15:48 } +2024-07-25 21:54:36,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 141/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 1.7587385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:36,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43777 samples/s/p 3:15:45 } +2024-07-25 21:54:39,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 143/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.7581222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:39,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43632 samples/s/p 3:15:46 } +2024-07-25 21:54:42,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 145/ 1625], loss: 1.158, per_step_time: 1470ms, lr: 1.7575056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:42,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43851 samples/s/p 3:15:38 } +2024-07-25 21:54:45,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 147/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 1.756889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:45,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43431 samples/s/p 3:15:44 } +2024-07-25 21:54:48,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 149/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 1.7562725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:48,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43547 
samples/s/p 3:15:39 } +2024-07-25 21:54:51,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 151/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 1.7556558e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:51,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43600 samples/s/p 3:15:35 } +2024-07-25 21:54:54,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 153/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 1.7550392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:54,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43727 samples/s/p 3:15:29 } +2024-07-25 21:54:57,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 155/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 1.7544224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:57,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43301 samples/s/p 3:15:35 } +2024-07-25 21:55:00,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 157/ 1625], loss: 1.088, per_step_time: 1476ms, lr: 1.7538056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:00,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.41719 samples/s/p 3:16:06 } +2024-07-25 21:55:03,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 159/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 1.753189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:03,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43754 samples/s/p 3:15:20 } +2024-07-25 21:55:05,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 6/ 10], step:[ 161/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.7525721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:05,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43235 samples/s/p 3:15:28 } +2024-07-25 21:55:08,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 163/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 1.7519553e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:08,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43516 samples/s/p 3:15:19 } +2024-07-25 21:55:11,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 165/ 1625], loss: 0.986, per_step_time: 1471ms, lr: 1.7513383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:11,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43773 samples/s/p 3:15:10 } +2024-07-25 21:55:14,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 167/ 1625], loss: 1.230, per_step_time: 1473ms, lr: 1.7507215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:14,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43042 samples/s/p 3:15:23 } +2024-07-25 21:55:17,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 169/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 1.7501043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:17,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43516 samples/s/p 3:15:10 } +2024-07-25 21:55:20,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 171/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.7494875e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:55:20,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.43407 samples/s/p 3:15:09 } +2024-07-25 21:55:23,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 173/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 1.7488705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:23,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.43657 samples/s/p 3:15:01 } +2024-07-25 21:55:26,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 175/ 1625], loss: 1.275, per_step_time: 1469ms, lr: 1.7482535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:26,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.44301 samples/s/p 3:14:44 } +2024-07-25 21:55:29,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 177/ 1625], loss: 1.212, per_step_time: 1472ms, lr: 1.7476359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:29,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.43378 samples/s/p 3:15:01 } +2024-07-25 21:55:32,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 179/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 1.747019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:32,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.42793 samples/s/p 3:15:11 } +2024-07-25 21:55:35,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 181/ 1625], loss: 1.304, per_step_time: 1472ms, lr: 1.7464017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:35,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% 
|█████████████████████████ | 5.43223 samples/s/p 3:14:59 } +2024-07-25 21:55:38,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 183/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 1.7457845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:38,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.43603 samples/s/p 3:14:47 } +2024-07-25 21:55:41,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 185/ 1625], loss: 1.223, per_step_time: 1474ms, lr: 1.7451674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:41,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.42599 samples/s/p 3:15:06 } +2024-07-25 21:55:44,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 187/ 1625], loss: 1.056, per_step_time: 1472ms, lr: 1.74455e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:44,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43328 samples/s/p 3:14:47 } +2024-07-25 21:55:47,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 189/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 1.7439326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:47,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43711 samples/s/p 3:14:36 } +2024-07-25 21:55:50,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 191/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 1.7433153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:50,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43950 samples/s/p 3:14:28 } +2024-07-25 21:55:53,208 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 193/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 1.7426979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:53,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43309 samples/s/p 3:14:39 } +2024-07-25 21:55:56,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 195/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.7420805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:56,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43682 samples/s/p 3:14:28 } +2024-07-25 21:55:59,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 197/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 1.741463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:59,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.44040 samples/s/p 3:14:17 } +2024-07-25 21:56:02,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 199/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 1.7408454e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:02,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43552 samples/s/p 3:14:25 } +2024-07-25 21:56:05,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 201/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 1.740228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:05,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43253 samples/s/p 3:14:28 } +2024-07-25 21:56:07,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 203/ 1625], loss: 1.177, 
per_step_time: 1470ms, lr: 1.7396103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:07,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.44072 samples/s/p 3:14:08 } +2024-07-25 21:56:10,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 205/ 1625], loss: 1.142, per_step_time: 1473ms, lr: 1.7389928e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:10,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43045 samples/s/p 3:14:27 } +2024-07-25 21:56:13,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 207/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.7383752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:13,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43590 samples/s/p 3:14:12 } +2024-07-25 21:56:16,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 209/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 1.7377573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:16,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43688 samples/s/p 3:14:07 } +2024-07-25 21:56:19,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 211/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 1.7371396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:19,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43315 samples/s/p 3:14:12 } +2024-07-25 21:56:22,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 213/ 1625], loss: 1.324, per_step_time: 1472ms, lr: 1.7365219e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:22,717 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43135 samples/s/p 3:14:13 } +2024-07-25 21:56:25,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 215/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 1.735904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:25,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43330 samples/s/p 3:14:06 } +2024-07-25 21:56:28,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 217/ 1625], loss: 1.055, per_step_time: 1473ms, lr: 1.7352862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:28,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43056 samples/s/p 3:14:09 } +2024-07-25 21:56:31,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 219/ 1625], loss: 1.014, per_step_time: 1471ms, lr: 1.7346685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:31,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43500 samples/s/p 3:13:57 } +2024-07-25 21:56:34,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 221/ 1625], loss: 1.076, per_step_time: 1473ms, lr: 1.7340506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:34,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.42941 samples/s/p 3:14:06 } +2024-07-25 21:56:37,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 223/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 1.7334327e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:37,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43403 
samples/s/p 3:13:53 } +2024-07-25 21:56:40,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 225/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 1.7328146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:40,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43854 samples/s/p 3:13:40 } +2024-07-25 21:56:43,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 227/ 1625], loss: 1.229, per_step_time: 1474ms, lr: 1.7321967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:43,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.42455 samples/s/p 3:14:07 } +2024-07-25 21:56:46,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 229/ 1625], loss: 0.899, per_step_time: 1471ms, lr: 1.7315788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:46,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43510 samples/s/p 3:13:42 } +2024-07-25 21:56:49,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 231/ 1625], loss: 0.989, per_step_time: 1469ms, lr: 1.7309607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:49,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.44379 samples/s/p 3:13:20 } +2024-07-25 21:56:52,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 233/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.7303424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:52,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43743 samples/s/p 3:13:31 } +2024-07-25 21:56:55,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 6/ 10], step:[ 235/ 1625], loss: 1.290, per_step_time: 1470ms, lr: 1.7297245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:55,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43923 samples/s/p 3:13:24 } +2024-07-25 21:56:58,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 237/ 1625], loss: 1.151, per_step_time: 1470ms, lr: 1.729106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:58,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.44008 samples/s/p 3:13:19 } +2024-07-25 21:57:01,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 239/ 1625], loss: 1.328, per_step_time: 1472ms, lr: 1.728488e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:01,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43172 samples/s/p 3:13:34 } +2024-07-25 21:57:04,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 241/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 1.7278699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:04,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43276 samples/s/p 3:13:29 } +2024-07-25 21:57:06,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 243/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 1.7272516e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:06,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43264 samples/s/p 3:13:26 } +2024-07-25 21:57:09,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 245/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 1.7266331e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:57:09,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43908 samples/s/p 3:13:10 } +2024-07-25 21:57:12,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 247/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 1.7260149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:12,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.44149 samples/s/p 3:13:02 } +2024-07-25 21:57:15,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 249/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 1.7253966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:15,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43735 samples/s/p 3:13:07 } +2024-07-25 21:57:18,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 251/ 1625], loss: 1.072, per_step_time: 1469ms, lr: 1.7247781e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:18,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.44222 samples/s/p 3:12:54 } +2024-07-25 21:57:21,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 253/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 1.7241597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:21,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43191 samples/s/p 3:13:13 } +2024-07-25 21:57:24,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 255/ 1625], loss: 1.000, per_step_time: 1470ms, lr: 1.7235412e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:24,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% 
|█████████████████████████ | 5.44042 samples/s/p 3:12:52 } +2024-07-25 21:57:27,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 257/ 1625], loss: 1.069, per_step_time: 1474ms, lr: 1.722923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:27,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.42514 samples/s/p 3:13:22 } +2024-07-25 21:57:30,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 259/ 1625], loss: 1.322, per_step_time: 1470ms, lr: 1.7223043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:30,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.44017 samples/s/p 3:12:47 } +2024-07-25 21:57:33,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 261/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 1.7216857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:33,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43156 samples/s/p 3:13:02 } +2024-07-25 21:57:36,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 263/ 1625], loss: 1.325, per_step_time: 1470ms, lr: 1.7210672e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:36,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.44022 samples/s/p 3:12:41 } +2024-07-25 21:57:39,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 265/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 1.7204486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:39,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43840 samples/s/p 3:12:42 } +2024-07-25 21:57:42,385 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 267/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.7198297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:42,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43373 samples/s/p 3:12:49 } +2024-07-25 21:57:45,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 269/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 1.7192113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:45,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43680 samples/s/p 3:12:39 } +2024-07-25 21:57:48,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 271/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 1.7185926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:48,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43456 samples/s/p 3:12:41 } +2024-07-25 21:57:51,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 273/ 1625], loss: 1.273, per_step_time: 1471ms, lr: 1.7179738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:51,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43792 samples/s/p 3:12:31 } +2024-07-25 21:57:54,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 275/ 1625], loss: 1.379, per_step_time: 1470ms, lr: 1.717355e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:54,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43922 samples/s/p 3:12:25 } +2024-07-25 21:57:54,186 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 21:58:30,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 277/ 1625], loss: 1.121, per_step_time: 1544ms, lr: 1.7167362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:30,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.18035 samples/s/p 3:21:59 } +2024-07-25 21:58:32,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 279/ 1625], loss: 1.205, per_step_time: 1473ms, lr: 1.7161175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:32,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43063 samples/s/p 3:12:38 } +2024-07-25 21:58:35,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 281/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 1.7154985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:36,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43708 samples/s/p 3:12:21 } +2024-07-25 21:58:39,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 283/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 1.7148795e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:39,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43755 samples/s/p 3:12:17 } +2024-07-25 21:58:42,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 285/ 1625], loss: 0.981, per_step_time: 1470ms, lr: 1.7142607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:42,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.44142 samples/s/p 3:12:06 } +2024-07-25 21:58:45,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], 
step:[ 287/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.7136417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:45,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43284 samples/s/p 3:12:21 } +2024-07-25 21:58:47,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 289/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 1.7130225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:47,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43851 samples/s/p 3:12:06 } +2024-07-25 21:58:50,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 291/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 1.7124037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:50,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43393 samples/s/p 3:12:13 } +2024-07-25 21:58:53,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 293/ 1625], loss: 1.123, per_step_time: 1470ms, lr: 1.7117847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:53,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.44031 samples/s/p 3:11:56 } +2024-07-25 21:58:56,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 295/ 1625], loss: 0.973, per_step_time: 1470ms, lr: 1.7111655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:56,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43919 samples/s/p 3:11:56 } +2024-07-25 21:58:59,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 297/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 1.7105465e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:58:59,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43761 samples/s/p 3:11:56 } +2024-07-25 21:59:02,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 299/ 1625], loss: 0.974, per_step_time: 1471ms, lr: 1.7099273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:02,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43480 samples/s/p 3:11:59 } +2024-07-25 21:59:05,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 301/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 1.7093083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:05,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.44098 samples/s/p 3:11:43 } +2024-07-25 21:59:08,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 303/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 1.708689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:08,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43583 samples/s/p 3:11:51 } +2024-07-25 21:59:11,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 305/ 1625], loss: 1.362, per_step_time: 1469ms, lr: 1.7080698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:11,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.44530 samples/s/p 3:11:28 } +2024-07-25 21:59:14,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 307/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 1.7074506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:14,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% 
|█████████████████████████ | 5.43698 samples/s/p 3:11:43 } +2024-07-25 21:59:17,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 309/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.7068312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:17,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43520 samples/s/p 3:11:44 } +2024-07-25 21:59:20,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 311/ 1625], loss: 1.137, per_step_time: 1470ms, lr: 1.7062119e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:20,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43902 samples/s/p 3:11:33 } +2024-07-25 21:59:23,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 313/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 1.7055927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:23,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43726 samples/s/p 3:11:34 } +2024-07-25 21:59:26,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 315/ 1625], loss: 1.022, per_step_time: 1472ms, lr: 1.7049733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:26,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43267 samples/s/p 3:11:40 } +2024-07-25 21:59:29,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 317/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.704354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:29,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.43237 samples/s/p 3:11:38 } +2024-07-25 21:59:32,239 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 319/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 1.7037344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:32,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.43812 samples/s/p 3:11:23 } +2024-07-25 21:59:35,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 321/ 1625], loss: 1.310, per_step_time: 1474ms, lr: 1.703115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:35,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.42571 samples/s/p 3:11:46 } +2024-07-25 21:59:38,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 323/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 1.7024955e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:38,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.43377 samples/s/p 3:11:26 } +2024-07-25 21:59:41,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 325/ 1625], loss: 1.131, per_step_time: 1470ms, lr: 1.701876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:41,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.43850 samples/s/p 3:11:13 } +2024-07-25 21:59:44,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 327/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.7012564e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:44,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.43630 samples/s/p 3:11:15 } +2024-07-25 21:59:46,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 329/ 1625], loss: 1.033, 
per_step_time: 1470ms, lr: 1.7006369e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:46,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.43970 samples/s/p 3:11:05 } +2024-07-25 21:59:49,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 331/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 1.7000175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:49,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.43475 samples/s/p 3:11:12 } +2024-07-25 21:59:52,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 333/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.6993976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:52,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.43713 samples/s/p 3:11:04 } +2024-07-25 21:59:55,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 335/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 1.698778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:55,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43805 samples/s/p 3:10:59 } +2024-07-25 21:59:58,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 337/ 1625], loss: 1.244, per_step_time: 1470ms, lr: 1.6981583e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:58,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43997 samples/s/p 3:10:53 } +2024-07-25 22:00:01,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 339/ 1625], loss: 1.302, per_step_time: 1471ms, lr: 1.6975388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:01,743 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43700 samples/s/p 3:10:56 } +2024-07-25 22:00:04,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 341/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 1.6969188e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:04,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43768 samples/s/p 3:10:51 } +2024-07-25 22:00:07,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 343/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 1.6962991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:07,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43770 samples/s/p 3:10:48 } +2024-07-25 22:00:10,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 345/ 1625], loss: 1.281, per_step_time: 1470ms, lr: 1.6956794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:10,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43953 samples/s/p 3:10:42 } +2024-07-25 22:00:13,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 347/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.6950595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:13,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43229 samples/s/p 3:10:54 } +2024-07-25 22:00:16,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 349/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.6944396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:16,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43631 
samples/s/p 3:10:43 } +2024-07-25 22:00:19,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 351/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 1.69382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:19,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43826 samples/s/p 3:10:36 } +2024-07-25 22:00:22,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 353/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 1.6932001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:22,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43474 samples/s/p 3:10:40 } +2024-07-25 22:00:25,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 355/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 1.69258e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:25,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43823 samples/s/p 3:10:30 } +2024-07-25 22:00:28,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 357/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 1.6919603e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:28,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43537 samples/s/p 3:10:33 } +2024-07-25 22:00:31,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 359/ 1625], loss: 1.077, per_step_time: 1471ms, lr: 1.6913402e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:31,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43759 samples/s/p 3:10:25 } +2024-07-25 22:00:34,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 6/ 10], step:[ 361/ 1625], loss: 1.336, per_step_time: 1471ms, lr: 1.6907201e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:34,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43579 samples/s/p 3:10:26 } +2024-07-25 22:00:37,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 363/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 1.6901002e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:37,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.44010 samples/s/p 3:10:14 } +2024-07-25 22:00:40,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 365/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.68948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:40,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43529 samples/s/p 3:10:21 } +2024-07-25 22:00:43,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 367/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 1.68886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:43,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43397 samples/s/p 3:10:21 } +2024-07-25 22:00:45,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 369/ 1625], loss: 1.036, per_step_time: 1471ms, lr: 1.6882399e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:45,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43620 samples/s/p 3:10:13 } +2024-07-25 22:00:48,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 371/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.6876196e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:00:48,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43591 samples/s/p 3:10:11 } +2024-07-25 22:00:51,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 373/ 1625], loss: 1.123, per_step_time: 1474ms, lr: 1.6869997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:51,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.42474 samples/s/p 3:10:32 } +2024-07-25 22:00:54,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 375/ 1625], loss: 1.107, per_step_time: 1473ms, lr: 1.6863796e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:54,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.42835 samples/s/p 3:10:21 } +2024-07-25 22:00:57,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 377/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 1.6857595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:57,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43710 samples/s/p 3:10:00 } +2024-07-25 22:01:00,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 379/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 1.685139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:00,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43136 samples/s/p 3:10:09 } +2024-07-25 22:01:03,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 381/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.6845188e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:03,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
52.3% |██████████████████████████ | 5.43582 samples/s/p 3:09:56 } +2024-07-25 22:01:06,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 383/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 1.6838985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:06,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43085 samples/s/p 3:10:04 } +2024-07-25 22:01:09,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 385/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 1.6832782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:09,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.42943 samples/s/p 3:10:04 } +2024-07-25 22:01:12,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 387/ 1625], loss: 1.080, per_step_time: 1473ms, lr: 1.682658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:12,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.42844 samples/s/p 3:10:03 } +2024-07-25 22:01:15,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 389/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 1.6820375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:15,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43572 samples/s/p 3:09:45 } +2024-07-25 22:01:18,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 391/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 1.6814174e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:18,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43273 samples/s/p 3:09:48 } +2024-07-25 22:01:21,425 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 393/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 1.6807968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:21,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43875 samples/s/p 3:09:33 } +2024-07-25 22:01:24,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 395/ 1625], loss: 1.084, per_step_time: 1479ms, lr: 1.6801763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:24,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.40686 samples/s/p 3:10:37 } +2024-07-25 22:01:27,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 397/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 1.679556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:27,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43725 samples/s/p 3:09:30 } +2024-07-25 22:01:30,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 399/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.6789356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:30,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43450 samples/s/p 3:09:33 } +2024-07-25 22:01:33,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 401/ 1625], loss: 1.224, per_step_time: 1475ms, lr: 1.678315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:33,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.42165 samples/s/p 3:09:57 } +2024-07-25 22:01:36,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 403/ 1625], loss: 
1.256, per_step_time: 1470ms, lr: 1.6776945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:36,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.44021 samples/s/p 3:09:15 } +2024-07-25 22:01:39,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 405/ 1625], loss: 1.144, per_step_time: 1470ms, lr: 1.6770739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:39,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.44091 samples/s/p 3:09:11 } +2024-07-25 22:01:42,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 407/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 1.6764534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:42,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43415 samples/s/p 3:09:22 } +2024-07-25 22:01:45,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 409/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.6758328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:45,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43575 samples/s/p 3:09:15 } +2024-07-25 22:01:48,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 411/ 1625], loss: 1.214, per_step_time: 1483ms, lr: 1.6752121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:48,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.39196 samples/s/p 3:10:45 } +2024-07-25 22:01:50,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 413/ 1625], loss: 0.987, per_step_time: 1471ms, lr: 1.6745917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:01:50,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43727 samples/s/p 3:09:06 } +2024-07-25 22:01:53,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 415/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 1.6739708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:53,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43489 samples/s/p 3:09:08 } +2024-07-25 22:01:56,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 417/ 1625], loss: 1.017, per_step_time: 1470ms, lr: 1.6733502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:56,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.44021 samples/s/p 3:08:54 } +2024-07-25 22:01:59,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 419/ 1625], loss: 1.198, per_step_time: 1473ms, lr: 1.6727296e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:59,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.42964 samples/s/p 3:09:13 } +2024-07-25 22:02:02,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 421/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 1.672109e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:02,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43609 samples/s/p 3:08:57 } +2024-07-25 22:02:05,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 423/ 1625], loss: 1.291, per_step_time: 1474ms, lr: 1.671488e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:05,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% 
|██████████████████████████ | 5.42632 samples/s/p 3:09:15 } +2024-07-25 22:02:08,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 425/ 1625], loss: 0.963, per_step_time: 1471ms, lr: 1.6708673e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:08,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43819 samples/s/p 3:08:47 } +2024-07-25 22:02:11,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 427/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 1.6702465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:11,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43790 samples/s/p 3:08:44 } +2024-07-25 22:02:14,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 429/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 1.6696256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:14,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43119 samples/s/p 3:08:55 } +2024-07-25 22:02:17,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 431/ 1625], loss: 1.230, per_step_time: 1474ms, lr: 1.6690048e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:17,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.42586 samples/s/p 3:09:04 } +2024-07-25 22:02:20,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 433/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.6683838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:20,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43128 samples/s/p 3:08:49 } +2024-07-25 22:02:23,445 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 435/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 1.6677632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:23,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43583 samples/s/p 3:08:37 } +2024-07-25 22:02:26,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 437/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.6671422e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:26,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43316 samples/s/p 3:08:40 } +2024-07-25 22:02:29,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 439/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.6665212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:29,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43210 samples/s/p 3:08:39 } +2024-07-25 22:02:32,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 441/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 1.6659005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:32,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43541 samples/s/p 3:08:29 } +2024-07-25 22:02:35,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 443/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 1.6652793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:35,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43246 samples/s/p 3:08:32 } +2024-07-25 22:02:38,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 445/ 1625], loss: 
1.198, per_step_time: 1471ms, lr: 1.6646582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:38,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43691 samples/s/p 3:08:20 } +2024-07-25 22:02:41,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 447/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 1.6640375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:41,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43095 samples/s/p 3:08:29 } +2024-07-25 22:02:44,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 449/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.6634163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:44,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43197 samples/s/p 3:08:24 } +2024-07-25 22:02:47,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 451/ 1625], loss: 1.101, per_step_time: 1470ms, lr: 1.6627953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:47,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43980 samples/s/p 3:08:05 } +2024-07-25 22:02:50,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 453/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.6621743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:50,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43168 samples/s/p 3:08:19 } +2024-07-25 22:02:52,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 455/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 1.661553e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:02:52,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43526 samples/s/p 3:08:09 } +2024-07-25 22:02:55,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 457/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 1.6609321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:55,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43638 samples/s/p 3:08:03 } +2024-07-25 22:02:58,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 459/ 1625], loss: 1.000, per_step_time: 1472ms, lr: 1.6603108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:58,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43352 samples/s/p 3:08:06 } +2024-07-25 22:03:01,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 461/ 1625], loss: 1.101, per_step_time: 1469ms, lr: 1.6596896e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:01,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.44350 samples/s/p 3:07:43 } +2024-07-25 22:03:04,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 463/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.6590686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:04,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43503 samples/s/p 3:07:57 } +2024-07-25 22:03:07,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 465/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.6584474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:07,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% 
|██████████████████████████ | 5.43118 samples/s/p 3:08:03 } +2024-07-25 22:03:10,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 467/ 1625], loss: 0.951, per_step_time: 1471ms, lr: 1.657826e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:10,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43493 samples/s/p 3:07:52 } +2024-07-25 22:03:13,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 469/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 1.6572048e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:13,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43863 samples/s/p 3:07:41 } +2024-07-25 22:03:16,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 471/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 1.6565837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:16,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43138 samples/s/p 3:07:53 } +2024-07-25 22:03:19,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 473/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 1.6559625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:19,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43178 samples/s/p 3:07:49 } +2024-07-25 22:03:22,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 475/ 1625], loss: 1.308, per_step_time: 1472ms, lr: 1.6553411e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:22,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43460 samples/s/p 3:07:41 } +2024-07-25 22:03:25,422 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 477/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.6547197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:25,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43495 samples/s/p 3:07:37 } +2024-07-25 22:03:28,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 479/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 1.6540986e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:28,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43687 samples/s/p 3:07:30 } +2024-07-25 22:03:31,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 481/ 1625], loss: 1.252, per_step_time: 1477ms, lr: 1.653477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:31,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.41536 samples/s/p 3:08:12 } +2024-07-25 22:03:34,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 483/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 1.6528556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:34,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43183 samples/s/p 3:07:35 } +2024-07-25 22:03:37,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 485/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 1.6522345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:37,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43483 samples/s/p 3:07:25 } +2024-07-25 22:03:40,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 487/ 1625], loss: 
1.072, per_step_time: 1472ms, lr: 1.651613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:40,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43174 samples/s/p 3:07:29 } +2024-07-25 22:03:43,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 489/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 1.6509914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:43,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43220 samples/s/p 3:07:25 } +2024-07-25 22:03:46,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 491/ 1625], loss: 1.251, per_step_time: 1470ms, lr: 1.6503702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:46,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43892 samples/s/p 3:07:08 } +2024-07-25 22:03:49,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 493/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 1.6497484e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:49,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43911 samples/s/p 3:07:05 } +2024-07-25 22:03:52,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 495/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 1.649127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:52,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43824 samples/s/p 3:07:04 } +2024-07-25 22:03:54,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 497/ 1625], loss: 1.268, per_step_time: 1471ms, lr: 1.6485055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:54,964 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43674 samples/s/p 3:07:04 } +2024-07-25 22:03:57,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 499/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 1.6478842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:57,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43863 samples/s/p 3:06:57 } +2024-07-25 22:04:00,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 501/ 1625], loss: 1.102, per_step_time: 1474ms, lr: 1.6472628e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:00,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.42428 samples/s/p 3:07:24 } +2024-07-25 22:04:03,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 503/ 1625], loss: 1.243, per_step_time: 1470ms, lr: 1.6466409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:03,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.44014 samples/s/p 3:06:48 } +2024-07-25 22:04:06,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 505/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 1.6460193e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:06,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43229 samples/s/p 3:07:01 } +2024-07-25 22:04:09,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 507/ 1625], loss: 1.141, per_step_time: 1470ms, lr: 1.645398e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:09,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.44076 
samples/s/p 3:06:41 } +2024-07-25 22:04:12,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 509/ 1625], loss: 1.268, per_step_time: 1472ms, lr: 1.6447762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:12,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43358 samples/s/p 3:06:53 } +2024-07-25 22:04:15,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 511/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 1.6441545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:15,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43338 samples/s/p 3:06:50 } +2024-07-25 22:04:18,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 513/ 1625], loss: 1.055, per_step_time: 1471ms, lr: 1.6435331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:18,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43668 samples/s/p 3:06:40 } +2024-07-25 22:04:21,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 515/ 1625], loss: 1.060, per_step_time: 1471ms, lr: 1.6429112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:21,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43576 samples/s/p 3:06:39 } +2024-07-25 22:04:24,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 517/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 1.6422895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:24,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43135 samples/s/p 3:06:46 } +2024-07-25 22:04:27,428 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 6/ 10], step:[ 519/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 1.641668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:27,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43225 samples/s/p 3:06:41 } +2024-07-25 22:04:30,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 521/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 1.6410462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:30,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43424 samples/s/p 3:06:34 } +2024-07-25 22:04:33,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 523/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 1.6404245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:33,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43390 samples/s/p 3:06:31 } +2024-07-25 22:04:36,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 525/ 1625], loss: 1.376, per_step_time: 1473ms, lr: 1.6398028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:36,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.42759 samples/s/p 3:06:42 } +2024-07-25 22:04:39,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 527/ 1625], loss: 1.008, per_step_time: 1473ms, lr: 1.639181e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:39,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43095 samples/s/p 3:06:32 } +2024-07-25 22:04:42,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 529/ 1625], loss: 1.129, per_step_time: 1470ms, lr: 1.6385593e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 22:04:42,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.44128 samples/s/p 3:06:07 } +2024-07-25 22:04:45,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 531/ 1625], loss: 1.436, per_step_time: 1472ms, lr: 1.6379374e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:45,140 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.43133 samples/s/p 3:06:25 } +2024-07-25 22:04:48,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 533/ 1625], loss: 1.165, per_step_time: 1470ms, lr: 1.6373155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:48,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.43856 samples/s/p 3:06:07 } +2024-07-25 22:04:51,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 535/ 1625], loss: 1.201, per_step_time: 1470ms, lr: 1.6366937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:51,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.43892 samples/s/p 3:06:03 } +2024-07-25 22:04:53,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 537/ 1625], loss: 1.072, per_step_time: 1470ms, lr: 1.636072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:53,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.44155 samples/s/p 3:05:55 } +2024-07-25 22:04:56,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 539/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 1.6354501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:56,934 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 53.3% |██████████████████████████ | 5.43831 samples/s/p 3:05:59 } +2024-07-25 22:04:59,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 541/ 1625], loss: 1.300, per_step_time: 1472ms, lr: 1.6348282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:59,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.43381 samples/s/p 3:06:05 } +2024-07-25 22:05:02,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 543/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.6342063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:02,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.43397 samples/s/p 3:06:02 } +2024-07-25 22:05:05,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 545/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 1.6335844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:05,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.44013 samples/s/p 3:05:46 } +2024-07-25 22:05:08,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 547/ 1625], loss: 1.291, per_step_time: 1472ms, lr: 1.6329626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:08,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43281 samples/s/p 3:05:58 } +2024-07-25 22:05:11,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 549/ 1625], loss: 1.330, per_step_time: 1471ms, lr: 1.6323405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:11,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43584 samples/s/p 3:05:49 } +2024-07-25 22:05:14,638 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 551/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 1.6317186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:14,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43656 samples/s/p 3:05:45 } +2024-07-25 22:05:17,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 553/ 1625], loss: 1.262, per_step_time: 1474ms, lr: 1.6310967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:17,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.42378 samples/s/p 3:06:08 } +2024-07-25 22:05:20,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 555/ 1625], loss: 1.357, per_step_time: 1471ms, lr: 1.6304746e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:20,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43827 samples/s/p 3:05:35 } +2024-07-25 22:05:23,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 557/ 1625], loss: 1.058, per_step_time: 1475ms, lr: 1.6298527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:23,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.42326 samples/s/p 3:06:03 } +2024-07-25 22:05:26,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 559/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 1.6292306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:26,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43588 samples/s/p 3:05:34 } +2024-07-25 22:05:29,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 561/ 1625], loss: 
1.229, per_step_time: 1473ms, lr: 1.6286087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:29,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.42811 samples/s/p 3:05:47 } +2024-07-25 22:05:32,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 563/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 1.6279866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:32,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.43552 samples/s/p 3:05:29 } +2024-07-25 22:05:35,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 565/ 1625], loss: 0.905, per_step_time: 1471ms, lr: 1.6273645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:35,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.43604 samples/s/p 3:05:25 } +2024-07-25 22:05:38,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 567/ 1625], loss: 1.168, per_step_time: 1473ms, lr: 1.6267424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:38,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.42904 samples/s/p 3:05:37 } +2024-07-25 22:05:41,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 569/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 1.6261205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:41,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.43245 samples/s/p 3:05:27 } +2024-07-25 22:05:44,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 571/ 1625], loss: 1.005, per_step_time: 1470ms, lr: 1.6254982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:05:44,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.44043 samples/s/p 3:05:07 } +2024-07-25 22:05:47,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 573/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 1.6248761e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:47,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.44002 samples/s/p 3:05:05 } +2024-07-25 22:05:50,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 575/ 1625], loss: 1.241, per_step_time: 1474ms, lr: 1.6242542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:50,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.42645 samples/s/p 3:05:30 } +2024-07-25 22:05:53,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 577/ 1625], loss: 1.043, per_step_time: 1472ms, lr: 1.623632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:53,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43262 samples/s/p 3:05:15 } +2024-07-25 22:05:55,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 579/ 1625], loss: 1.273, per_step_time: 1472ms, lr: 1.6230098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:55,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43351 samples/s/p 3:05:10 } +2024-07-25 22:05:58,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 581/ 1625], loss: 1.178, per_step_time: 1474ms, lr: 1.6223876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:58,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% 
|██████████████████████████ | 5.42703 samples/s/p 3:05:20 } +2024-07-25 22:06:01,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 583/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 1.6217655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:01,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43647 samples/s/p 3:04:58 } +2024-07-25 22:06:04,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 585/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 1.6211432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:04,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43301 samples/s/p 3:05:02 } +2024-07-25 22:06:07,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 587/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.6205211e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:07,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43771 samples/s/p 3:04:49 } +2024-07-25 22:06:10,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 589/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 1.6198988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:10,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43886 samples/s/p 3:04:44 } +2024-07-25 22:06:13,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 591/ 1625], loss: 0.934, per_step_time: 1470ms, lr: 1.6192767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:13,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.44099 samples/s/p 3:04:37 } +2024-07-25 22:06:16,624 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 593/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 1.6186543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:16,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43802 samples/s/p 3:04:40 } +2024-07-25 22:06:19,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 595/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 1.618032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:19,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43197 samples/s/p 3:04:49 } +2024-07-25 22:06:22,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 597/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 1.6174099e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:22,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43870 samples/s/p 3:04:33 } +2024-07-25 22:06:25,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 599/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 1.6167876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:25,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.44206 samples/s/p 3:04:23 } +2024-07-25 22:06:28,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 601/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 1.6161654e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:28,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43551 samples/s/p 3:04:33 } +2024-07-25 22:06:31,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 603/ 1625], loss: 
1.143, per_step_time: 1471ms, lr: 1.6155429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:31,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43480 samples/s/p 3:04:32 } +2024-07-25 22:06:34,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 605/ 1625], loss: 1.263, per_step_time: 1470ms, lr: 1.6149206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:34,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43881 samples/s/p 3:04:21 } +2024-07-25 22:06:37,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 607/ 1625], loss: 1.029, per_step_time: 1472ms, lr: 1.6142983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:37,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43395 samples/s/p 3:04:28 } +2024-07-25 22:06:40,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 609/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 1.6136759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:40,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43347 samples/s/p 3:04:26 } +2024-07-25 22:06:43,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 611/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.6130536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:43,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.44041 samples/s/p 3:04:09 } +2024-07-25 22:06:46,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 613/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 1.6124313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:06:46,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.43129 samples/s/p 3:04:24 } +2024-07-25 22:06:49,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 615/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 1.6118087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:49,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.44110 samples/s/p 3:04:01 } +2024-07-25 22:06:52,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 617/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.6111862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:52,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.44076 samples/s/p 3:03:59 } +2024-07-25 22:06:54,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 619/ 1625], loss: 1.076, per_step_time: 1475ms, lr: 1.6105641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:54,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.42151 samples/s/p 3:04:35 } +2024-07-25 22:06:57,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 621/ 1625], loss: 1.093, per_step_time: 1473ms, lr: 1.6099417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:57,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.43089 samples/s/p 3:04:13 } +2024-07-25 22:07:00,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 623/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 1.609319e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:00,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% 
|██████████████████████████ | 5.43532 samples/s/p 3:04:01 } +2024-07-25 22:07:03,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 625/ 1625], loss: 1.006, per_step_time: 1472ms, lr: 1.6086968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:03,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.43368 samples/s/p 3:04:02 } +2024-07-25 22:07:06,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 627/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 1.6080743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:06,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43626 samples/s/p 3:03:54 } +2024-07-25 22:07:09,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 629/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.6074518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:09,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43319 samples/s/p 3:03:57 } +2024-07-25 22:07:12,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 631/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 1.6068294e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:12,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43384 samples/s/p 3:03:53 } +2024-07-25 22:07:15,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 633/ 1625], loss: 1.459, per_step_time: 1472ms, lr: 1.606207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:15,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43359 samples/s/p 3:03:50 } +2024-07-25 22:07:18,597 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 635/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 1.6055847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:18,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43151 samples/s/p 3:03:51 } +2024-07-25 22:07:21,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 637/ 1625], loss: 1.307, per_step_time: 1474ms, lr: 1.6049618e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:21,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.42418 samples/s/p 3:04:03 } +2024-07-25 22:07:24,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 639/ 1625], loss: 0.981, per_step_time: 1473ms, lr: 1.6043394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:24,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43013 samples/s/p 3:03:48 } +2024-07-25 22:07:27,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 641/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 1.603717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:27,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43582 samples/s/p 3:03:34 } +2024-07-25 22:07:30,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 643/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.6030945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:30,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.43546 samples/s/p 3:03:32 } +2024-07-25 22:07:33,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 645/ 1625], loss: 
1.152, per_step_time: 1473ms, lr: 1.6024716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:33,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.43076 samples/s/p 3:03:38 } +2024-07-25 22:07:36,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 647/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 1.6018494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:36,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.43480 samples/s/p 3:03:27 } +2024-07-25 22:07:39,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 649/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.6012267e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:39,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.43169 samples/s/p 3:03:30 } +2024-07-25 22:07:42,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 651/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 1.600604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:42,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.43367 samples/s/p 3:03:23 } +2024-07-25 22:07:45,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 653/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 1.5999816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:45,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.43139 samples/s/p 3:03:25 } +2024-07-25 22:07:48,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 655/ 1625], loss: 1.053, per_step_time: 1470ms, lr: 1.599359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:07:48,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.44211 samples/s/p 3:03:01 } +2024-07-25 22:07:51,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 657/ 1625], loss: 1.057, per_step_time: 1470ms, lr: 1.5987367e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:51,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.43964 samples/s/p 3:03:03 } +2024-07-25 22:07:54,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 659/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.5981137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:54,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43349 samples/s/p 3:03:12 } +2024-07-25 22:07:56,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 661/ 1625], loss: 1.127, per_step_time: 1469ms, lr: 1.597491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:56,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.44259 samples/s/p 3:02:51 } +2024-07-25 22:07:59,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 663/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 1.5968686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:59,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43898 samples/s/p 3:02:55 } +2024-07-25 22:08:02,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 665/ 1625], loss: 1.366, per_step_time: 1472ms, lr: 1.596246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:02,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% 
|███████████████████████████ | 5.43355 samples/s/p 3:03:03 } +2024-07-25 22:08:05,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 667/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 1.5956231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:05,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43586 samples/s/p 3:02:56 } +2024-07-25 22:08:08,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 669/ 1625], loss: 0.984, per_step_time: 1471ms, lr: 1.5950009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:08,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43633 samples/s/p 3:02:52 } +2024-07-25 22:08:11,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 671/ 1625], loss: 1.056, per_step_time: 1470ms, lr: 1.5943782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:11,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43858 samples/s/p 3:02:44 } +2024-07-25 22:08:14,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 673/ 1625], loss: 1.216, per_step_time: 1474ms, lr: 1.5937554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:14,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.42710 samples/s/p 3:03:04 } +2024-07-25 22:08:17,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 675/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.5931328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:17,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43817 samples/s/p 3:02:39 } +2024-07-25 22:08:20,572 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 677/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 1.59251e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:20,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43420 samples/s/p 3:02:44 } +2024-07-25 22:08:23,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 679/ 1625], loss: 1.321, per_step_time: 1471ms, lr: 1.5918875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:23,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43559 samples/s/p 3:02:38 } +2024-07-25 22:08:26,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 681/ 1625], loss: 1.239, per_step_time: 1470ms, lr: 1.5912645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:26,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43859 samples/s/p 3:02:29 } +2024-07-25 22:08:29,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 683/ 1625], loss: 1.316, per_step_time: 1471ms, lr: 1.5906418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:29,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43616 samples/s/p 3:02:31 } +2024-07-25 22:08:32,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 685/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 1.5900194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:32,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43042 samples/s/p 3:02:40 } +2024-07-25 22:08:35,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 687/ 1625], loss: 
1.299, per_step_time: 1471ms, lr: 1.5893967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:35,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43783 samples/s/p 3:02:22 } +2024-07-25 22:08:38,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 689/ 1625], loss: 1.229, per_step_time: 1470ms, lr: 1.5887737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:38,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43938 samples/s/p 3:02:16 } +2024-07-25 22:08:41,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 691/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 1.5881511e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:41,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43126 samples/s/p 3:02:29 } +2024-07-25 22:08:44,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 693/ 1625], loss: 0.993, per_step_time: 1471ms, lr: 1.5875283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:44,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43752 samples/s/p 3:02:14 } +2024-07-25 22:08:47,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 695/ 1625], loss: 1.366, per_step_time: 1472ms, lr: 1.5869056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:47,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43116 samples/s/p 3:02:24 } +2024-07-25 22:08:50,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 697/ 1625], loss: 1.421, per_step_time: 1473ms, lr: 1.586283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:08:50,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43103 samples/s/p 3:02:21 } +2024-07-25 22:08:53,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 699/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.5856602e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:53,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43195 samples/s/p 3:02:16 } +2024-07-25 22:08:55,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 701/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 1.5850375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:55,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43395 samples/s/p 3:02:09 } +2024-07-25 22:08:58,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 703/ 1625], loss: 1.276, per_step_time: 1472ms, lr: 1.5844147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:58,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43392 samples/s/p 3:02:06 } +2024-07-25 22:09:01,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 705/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 1.5837917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:01,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43709 samples/s/p 3:01:57 } +2024-07-25 22:09:04,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 707/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 1.583169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:04,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% 
|███████████████████████████ | 5.42839 samples/s/p 3:02:12 } +2024-07-25 22:09:07,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 709/ 1625], loss: 1.204, per_step_time: 1474ms, lr: 1.5825464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:07,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.42533 samples/s/p 3:02:15 } +2024-07-25 22:09:10,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 711/ 1625], loss: 1.307, per_step_time: 1472ms, lr: 1.5819236e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:10,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43258 samples/s/p 3:01:57 } +2024-07-25 22:09:13,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 713/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 1.5813008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:13,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43165 samples/s/p 3:01:56 } +2024-07-25 22:09:16,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 715/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 1.5806778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:16,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43707 samples/s/p 3:01:42 } +2024-07-25 22:09:19,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 717/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.580055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:19,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43518 samples/s/p 3:01:43 } +2024-07-25 22:09:22,556 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 719/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.5794321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:22,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43376 samples/s/p 3:01:43 } +2024-07-25 22:09:25,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 721/ 1625], loss: 1.109, per_step_time: 1470ms, lr: 1.5788095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:25,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.44033 samples/s/p 3:01:27 } +2024-07-25 22:09:28,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 723/ 1625], loss: 1.309, per_step_time: 1473ms, lr: 1.5781865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:28,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43011 samples/s/p 3:01:45 } +2024-07-25 22:09:31,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 725/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 1.5775639e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:31,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43465 samples/s/p 3:01:33 } +2024-07-25 22:09:34,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 727/ 1625], loss: 1.053, per_step_time: 1472ms, lr: 1.5769408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:34,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43428 samples/s/p 3:01:30 } +2024-07-25 22:09:37,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 729/ 1625], 
loss: 1.188, per_step_time: 1471ms, lr: 1.576318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:37,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43598 samples/s/p 3:01:24 } +2024-07-25 22:09:40,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 731/ 1625], loss: 1.017, per_step_time: 1470ms, lr: 1.5756952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:40,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43888 samples/s/p 3:01:15 } +2024-07-25 22:09:43,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 733/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 1.5750724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:43,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43564 samples/s/p 3:01:19 } +2024-07-25 22:09:46,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 735/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 1.5744496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:46,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43389 samples/s/p 3:01:19 } +2024-07-25 22:09:49,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 737/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 1.5738266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:49,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43211 samples/s/p 3:01:20 } +2024-07-25 22:09:52,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 739/ 1625], loss: 1.012, per_step_time: 1470ms, lr: 1.5732037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:09:52,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.44065 samples/s/p 3:01:00 } +2024-07-25 22:09:55,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 741/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 1.5725807e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:55,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.44048 samples/s/p 3:00:57 } +2024-07-25 22:09:57,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 743/ 1625], loss: 1.132, per_step_time: 1473ms, lr: 1.5719581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:57,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.43068 samples/s/p 3:01:14 } +2024-07-25 22:10:00,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 745/ 1625], loss: 1.328, per_step_time: 1472ms, lr: 1.571335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:00,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.43230 samples/s/p 3:01:08 } +2024-07-25 22:10:03,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 747/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 1.5707124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:03,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.42937 samples/s/p 3:01:11 } +2024-07-25 22:10:06,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 749/ 1625], loss: 1.139, per_step_time: 1470ms, lr: 1.5700893e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:06,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% 
|███████████████████████████ | 5.43873 samples/s/p 3:00:49 } +2024-07-25 22:10:09,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 751/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 1.5694664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:09,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.43592 samples/s/p 3:00:52 } +2024-07-25 22:10:12,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 753/ 1625], loss: 1.100, per_step_time: 1473ms, lr: 1.5688438e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:12,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.42779 samples/s/p 3:01:05 } +2024-07-25 22:10:15,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 755/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 1.5682208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:15,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.43404 samples/s/p 3:00:50 } +2024-07-25 22:10:18,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 757/ 1625], loss: 1.340, per_step_time: 1472ms, lr: 1.5675978e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:18,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43120 samples/s/p 3:00:52 } +2024-07-25 22:10:21,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 759/ 1625], loss: 1.211, per_step_time: 1474ms, lr: 1.5669748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:21,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.42521 samples/s/p 3:01:01 } +2024-07-25 22:10:24,537 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 761/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 1.566352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:24,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43624 samples/s/p 3:00:36 } +2024-07-25 22:10:27,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 763/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 1.5657291e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:27,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43763 samples/s/p 3:00:31 } +2024-07-25 22:10:30,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 765/ 1625], loss: 1.094, per_step_time: 1473ms, lr: 1.5651061e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:30,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43029 samples/s/p 3:00:42 } +2024-07-25 22:10:33,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 767/ 1625], loss: 1.163, per_step_time: 1473ms, lr: 1.5644831e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:33,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.42793 samples/s/p 3:00:44 } +2024-07-25 22:10:36,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 769/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.5638603e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:36,347 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43322 samples/s/p 3:00:31 } +2024-07-25 22:10:39,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 771/ 1625], 
loss: 1.200, per_step_time: 1471ms, lr: 1.5632373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:39,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43631 samples/s/p 3:00:22 } +2024-07-25 22:10:42,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 773/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.5626145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:42,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43501 samples/s/p 3:00:21 } +2024-07-25 22:10:45,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 775/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.5619917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:45,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43658 samples/s/p 3:00:15 } +2024-07-25 22:10:48,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 777/ 1625], loss: 1.204, per_step_time: 1470ms, lr: 1.5613687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:48,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.44092 samples/s/p 3:00:04 } +2024-07-25 22:10:51,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 779/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 1.5607457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:51,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43714 samples/s/p 3:00:08 } +2024-07-25 22:10:54,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 781/ 1625], loss: 0.989, per_step_time: 1470ms, lr: 1.5601228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:10:54,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43972 samples/s/p 3:00:00 } +2024-07-25 22:10:56,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 783/ 1625], loss: 1.234, per_step_time: 1473ms, lr: 1.5594998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:56,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43027 samples/s/p 3:00:16 } +2024-07-25 22:10:59,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 785/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 1.5588768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:59,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43357 samples/s/p 3:00:06 } +2024-07-25 22:11:02,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 787/ 1625], loss: 1.202, per_step_time: 1472ms, lr: 1.5582538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:02,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43243 samples/s/p 3:00:06 } +2024-07-25 22:11:05,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 789/ 1625], loss: 1.096, per_step_time: 1470ms, lr: 1.5576308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:05,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.44103 samples/s/p 2:59:46 } +2024-07-25 22:11:08,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 791/ 1625], loss: 1.030, per_step_time: 1470ms, lr: 1.5570082e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:08,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% 
|███████████████████████████ | 5.43862 samples/s/p 2:59:48 } +2024-07-25 22:11:11,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 793/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 1.5563852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:11,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.44094 samples/s/p 2:59:40 } +2024-07-25 22:11:14,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 795/ 1625], loss: 1.086, per_step_time: 1468ms, lr: 1.5557622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:14,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.44603 samples/s/p 2:59:27 } +2024-07-25 22:11:17,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 797/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 1.5551394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:17,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.43822 samples/s/p 2:59:40 } +2024-07-25 22:11:20,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 799/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 1.5545163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:20,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.43279 samples/s/p 2:59:47 } +2024-07-25 22:11:23,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 801/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.5538935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:23,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.43691 samples/s/p 2:59:36 } +2024-07-25 22:11:26,496 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 803/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 1.5532705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:26,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.43163 samples/s/p 2:59:44 } +2024-07-25 22:11:29,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 805/ 1625], loss: 1.086, per_step_time: 1473ms, lr: 1.5526475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:29,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.42963 samples/s/p 2:59:45 } +2024-07-25 22:11:32,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 807/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 1.5520245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:32,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43670 samples/s/p 2:59:28 } +2024-07-25 22:11:35,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 809/ 1625], loss: 0.976, per_step_time: 1472ms, lr: 1.5514017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:35,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43266 samples/s/p 2:59:33 } +2024-07-25 22:11:38,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 811/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 1.5507787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:38,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43178 samples/s/p 2:59:32 } +2024-07-25 22:11:41,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 813/ 1625], 
loss: 1.128, per_step_time: 1471ms, lr: 1.5501559e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:41,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43503 samples/s/p 2:59:22 } +2024-07-25 22:11:44,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 815/ 1625], loss: 1.127, per_step_time: 1469ms, lr: 1.5495329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:44,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.44229 samples/s/p 2:59:05 } +2024-07-25 22:11:47,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 817/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 1.5489097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:47,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43277 samples/s/p 2:59:21 } +2024-07-25 22:11:50,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 819/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 1.5482869e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:50,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.44073 samples/s/p 2:59:02 } +2024-07-25 22:11:53,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 821/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 1.5476639e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:53,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.42974 samples/s/p 2:59:21 } +2024-07-25 22:11:56,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 823/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 1.5470408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:11:56,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.43647 samples/s/p 2:59:05 } +2024-07-25 22:11:58,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 825/ 1625], loss: 1.386, per_step_time: 1471ms, lr: 1.546418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:58,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.43794 samples/s/p 2:58:59 } +2024-07-25 22:12:01,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 827/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 1.5457952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:01,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.43525 samples/s/p 2:59:01 } +2024-07-25 22:12:04,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 829/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 1.545172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:04,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.44198 samples/s/p 2:58:45 } +2024-07-25 22:12:07,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 831/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 1.544549e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:07,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.43998 samples/s/p 2:58:46 } +2024-07-25 22:12:10,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 833/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.5439264e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:10,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% 
|███████████████████████████ | 5.43699 samples/s/p 2:58:49 } +2024-07-25 22:12:13,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 835/ 1625], loss: 1.101, per_step_time: 1472ms, lr: 1.5433032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:13,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.43231 samples/s/p 2:58:55 } +2024-07-25 22:12:16,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 837/ 1625], loss: 1.278, per_step_time: 1473ms, lr: 1.5426804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:16,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43052 samples/s/p 2:58:56 } +2024-07-25 22:12:19,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 839/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 1.5420575e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:19,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43662 samples/s/p 2:58:41 } +2024-07-25 22:12:22,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 841/ 1625], loss: 1.056, per_step_time: 1472ms, lr: 1.5414344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:22,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43324 samples/s/p 2:58:45 } +2024-07-25 22:12:25,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 843/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 1.5408115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:25,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43604 samples/s/p 2:58:36 } +2024-07-25 22:12:28,464 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 845/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.5401885e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:28,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43144 samples/s/p 2:58:42 } +2024-07-25 22:12:31,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 847/ 1625], loss: 1.219, per_step_time: 1473ms, lr: 1.5395655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:31,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43023 samples/s/p 2:58:42 } +2024-07-25 22:12:34,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 849/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 1.5389427e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:34,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43407 samples/s/p 2:58:31 } +2024-07-25 22:12:37,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 851/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 1.5383197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:37,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43748 samples/s/p 2:58:22 } +2024-07-25 22:12:40,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 853/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 1.5376969e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:40,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43482 samples/s/p 2:58:24 } +2024-07-25 22:12:43,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 855/ 1625], 
loss: 1.178, per_step_time: 1468ms, lr: 1.5370739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:43,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.44732 samples/s/p 2:57:56 } +2024-07-25 22:12:46,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 857/ 1625], loss: 1.029, per_step_time: 1470ms, lr: 1.5364512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:46,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43975 samples/s/p 2:58:08 } +2024-07-25 22:12:49,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 859/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 1.535828e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:49,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43679 samples/s/p 2:58:11 } +2024-07-25 22:12:52,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 861/ 1625], loss: 1.289, per_step_time: 1472ms, lr: 1.535205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:52,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43220 samples/s/p 2:58:17 } +2024-07-25 22:12:55,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 863/ 1625], loss: 1.023, per_step_time: 1471ms, lr: 1.5345824e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:55,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43485 samples/s/p 2:58:09 } +2024-07-25 22:12:57,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 865/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 1.5339594e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:12:57,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43144 samples/s/p 2:58:13 } +2024-07-25 22:13:00,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 867/ 1625], loss: 1.138, per_step_time: 1473ms, lr: 1.5333366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:00,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.42931 samples/s/p 2:58:14 } +2024-07-25 22:13:03,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 869/ 1625], loss: 1.033, per_step_time: 1470ms, lr: 1.5327136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:03,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43882 samples/s/p 2:57:52 } +2024-07-25 22:13:06,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 871/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 1.5320908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:06,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.43740 samples/s/p 2:57:52 } +2024-07-25 22:13:09,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 873/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 1.5314678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:09,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.43562 samples/s/p 2:57:53 } +2024-07-25 22:13:12,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 875/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 1.5308447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:12,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% 
|███████████████████████████ | 5.43322 samples/s/p 2:57:55 } +2024-07-25 22:13:15,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 877/ 1625], loss: 1.084, per_step_time: 1469ms, lr: 1.5302221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:15,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.44261 samples/s/p 2:57:33 } +2024-07-25 22:13:18,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 879/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 1.529599e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:18,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.44112 samples/s/p 2:57:33 } +2024-07-25 22:13:21,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 881/ 1625], loss: 1.128, per_step_time: 1470ms, lr: 1.5289763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:21,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.44043 samples/s/p 2:57:32 } +2024-07-25 22:13:24,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 883/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 1.5283535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:24,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.43879 samples/s/p 2:57:32 } +2024-07-25 22:13:27,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 885/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 1.5277303e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:27,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.43262 samples/s/p 2:57:41 } +2024-07-25 22:13:30,418 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 887/ 1625], loss: 1.350, per_step_time: 1471ms, lr: 1.5271076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:30,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43491 samples/s/p 2:57:34 } +2024-07-25 22:13:33,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 889/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 1.5264846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:33,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43286 samples/s/p 2:57:35 } +2024-07-25 22:13:36,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 891/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 1.5258617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:36,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43681 samples/s/p 2:57:24 } +2024-07-25 22:13:39,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 893/ 1625], loss: 1.068, per_step_time: 1473ms, lr: 1.525239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:39,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.42991 samples/s/p 2:57:35 } +2024-07-25 22:13:42,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 895/ 1625], loss: 1.454, per_step_time: 1473ms, lr: 1.5246163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:42,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.42957 samples/s/p 2:57:32 } +2024-07-25 22:13:45,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 897/ 1625], 
loss: 1.099, per_step_time: 1469ms, lr: 1.52399325e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:45,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.44279 samples/s/p 2:57:03 } +2024-07-25 22:13:48,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 899/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 1.5233704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:48,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43167 samples/s/p 2:57:22 } +2024-07-25 22:13:51,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 901/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 1.5227477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:51,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43344 samples/s/p 2:57:16 } +2024-07-25 22:13:54,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 903/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 1.5221247e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:54,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.44063 samples/s/p 2:56:59 } +2024-07-25 22:13:56,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 905/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 1.5215018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:56,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43215 samples/s/p 2:57:12 } +2024-07-25 22:13:59,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 907/ 1625], loss: 1.248, per_step_time: 1473ms, lr: 1.5208791e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 22:13:59,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43093 samples/s/p 2:57:12 } +2024-07-25 22:14:02,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 909/ 1625], loss: 1.398, per_step_time: 1471ms, lr: 1.5202561e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:02,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43727 samples/s/p 2:56:57 } +2024-07-25 22:14:05,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 911/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 1.5196335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:05,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43662 samples/s/p 2:56:55 } +2024-07-25 22:14:08,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 913/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 1.5190108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:08,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43614 samples/s/p 2:56:53 } +2024-07-25 22:14:11,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 915/ 1625], loss: 1.169, per_step_time: 1472ms, lr: 1.518388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:11,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43372 samples/s/p 2:56:55 } +2024-07-25 22:14:14,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 917/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.517765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:14,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% 
|███████████████████████████ | 5.43574 samples/s/p 2:56:48 } +2024-07-25 22:14:17,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 919/ 1625], loss: 1.329, per_step_time: 1471ms, lr: 1.5171423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:17,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43760 samples/s/p 2:56:41 } +2024-07-25 22:14:20,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 921/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.5165197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:20,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43441 samples/s/p 2:56:45 } +2024-07-25 22:14:23,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 923/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 1.5158967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:23,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43267 samples/s/p 2:56:45 } +2024-07-25 22:14:26,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 925/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.5152741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:26,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43675 samples/s/p 2:56:34 } +2024-07-25 22:14:29,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 927/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 1.5146513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:29,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43295 samples/s/p 2:56:39 } +2024-07-25 22:14:32,390 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 929/ 1625], loss: 1.015, per_step_time: 1470ms, lr: 1.5140283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:32,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43940 samples/s/p 2:56:23 } +2024-07-25 22:14:35,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 931/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 1.5134057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:35,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43136 samples/s/p 2:56:36 } +2024-07-25 22:14:38,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 933/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 1.512783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:38,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43427 samples/s/p 2:56:27 } +2024-07-25 22:14:41,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 935/ 1625], loss: 0.977, per_step_time: 1469ms, lr: 1.51216e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:41,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.44277 samples/s/p 2:56:08 } +2024-07-25 22:14:44,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 937/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 1.51153745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:44,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.42848 samples/s/p 2:56:33 } +2024-07-25 22:14:47,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 939/ 1625], loss: 
1.120, per_step_time: 1471ms, lr: 1.5109149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:47,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43817 samples/s/p 2:56:11 } +2024-07-25 22:14:50,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 941/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.510292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:50,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43749 samples/s/p 2:56:09 } +2024-07-25 22:14:53,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 943/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 1.5096692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:53,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43074 samples/s/p 2:56:19 } +2024-07-25 22:14:56,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 945/ 1625], loss: 1.348, per_step_time: 1473ms, lr: 1.5090467e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:56,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43049 samples/s/p 2:56:17 } +2024-07-25 22:14:58,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 947/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 1.5084238e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:58,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43484 samples/s/p 2:56:05 } +2024-07-25 22:15:01,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 949/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 1.5078011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:15:01,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43771 samples/s/p 2:55:57 } +2024-07-25 22:15:04,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 951/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 1.5071786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:04,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43607 samples/s/p 2:55:57 } +2024-07-25 22:15:07,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 953/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 1.5065557e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:07,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43557 samples/s/p 2:55:55 } +2024-07-25 22:15:10,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 955/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.5059332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:10,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43405 samples/s/p 2:55:55 } +2024-07-25 22:15:13,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 957/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 1.5053105e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:13,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43476 samples/s/p 2:55:51 } +2024-07-25 22:15:16,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 959/ 1625], loss: 0.950, per_step_time: 1471ms, lr: 1.5046878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:16,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% 
|███████████████████████████ | 5.43741 samples/s/p 2:55:43 } +2024-07-25 22:15:19,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 961/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.5040652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:19,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43390 samples/s/p 2:55:47 } +2024-07-25 22:15:22,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 963/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 1.5034426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:22,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.42907 samples/s/p 2:55:53 } +2024-07-25 22:15:25,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 965/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 1.5028201e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:25,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43583 samples/s/p 2:55:37 } +2024-07-25 22:15:28,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 967/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.5021974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:28,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.43697 samples/s/p 2:55:32 } +2024-07-25 22:15:31,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 969/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 1.5015748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:31,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.43619 samples/s/p 2:55:30 } +2024-07-25 22:15:34,362 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 971/ 1625], loss: 1.105, per_step_time: 1470ms, lr: 1.5009523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:34,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.43852 samples/s/p 2:55:23 } +2024-07-25 22:15:37,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 973/ 1625], loss: 1.243, per_step_time: 1470ms, lr: 1.5003295e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:37,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.44164 samples/s/p 2:55:14 } +2024-07-25 22:15:40,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 975/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 1.499707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:40,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.43308 samples/s/p 2:55:28 } +2024-07-25 22:15:43,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 977/ 1625], loss: 0.963, per_step_time: 1472ms, lr: 1.4990845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:43,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.43394 samples/s/p 2:55:23 } +2024-07-25 22:15:46,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 979/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 1.4984617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:46,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.43413 samples/s/p 2:55:20 } +2024-07-25 22:15:49,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 981/ 1625], 
loss: 1.077, per_step_time: 1471ms, lr: 1.4978394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:49,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.43725 samples/s/p 2:55:11 } +2024-07-25 22:15:52,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 983/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 1.4972169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:52,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.43036 samples/s/p 2:55:21 } +2024-07-25 22:15:55,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 985/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 1.4965942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:55,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43639 samples/s/p 2:55:06 } +2024-07-25 22:15:57,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 987/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 1.4959717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:57,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43508 samples/s/p 2:55:06 } +2024-07-25 22:16:00,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 989/ 1625], loss: 1.030, per_step_time: 1472ms, lr: 1.49534935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:00,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43293 samples/s/p 2:55:07 } +2024-07-25 22:16:03,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 991/ 1625], loss: 1.453, per_step_time: 1470ms, lr: 1.4947266e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 22:16:03,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.44080 samples/s/p 2:54:49 } +2024-07-25 22:16:06,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 993/ 1625], loss: 0.994, per_step_time: 1472ms, lr: 1.4941042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:06,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43284 samples/s/p 2:55:02 } +2024-07-25 22:16:09,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 995/ 1625], loss: 1.162, per_step_time: 1474ms, lr: 1.4934818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:09,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.42439 samples/s/p 2:55:15 } +2024-07-25 22:16:12,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 997/ 1625], loss: 1.350, per_step_time: 1471ms, lr: 1.4928592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:12,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43734 samples/s/p 2:54:47 } +2024-07-25 22:16:15,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 999/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 1.4922369e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:15,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43042 samples/s/p 2:54:57 } +2024-07-25 22:16:18,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1001/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 1.4916144e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:18,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% 
|████████████████████████████ | 5.43342 samples/s/p 2:54:49 } +2024-07-25 22:16:21,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1003/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 1.4909918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:21,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43725 samples/s/p 2:54:38 } +2024-07-25 22:16:24,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1005/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.4903695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:24,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43964 samples/s/p 2:54:31 } +2024-07-25 22:16:27,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1007/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 1.48974705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:27,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43253 samples/s/p 2:54:42 } +2024-07-25 22:16:30,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1009/ 1625], loss: 1.273, per_step_time: 1472ms, lr: 1.4891244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:30,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43174 samples/s/p 2:54:40 } +2024-07-25 22:16:33,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1011/ 1625], loss: 1.242, per_step_time: 1473ms, lr: 1.4885022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:33,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.42893 samples/s/p 2:54:43 } +2024-07-25 22:16:36,343 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1013/ 1625], loss: 1.160, per_step_time: 1473ms, lr: 1.4878799e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:36,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43035 samples/s/p 2:54:37 } +2024-07-25 22:16:39,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1015/ 1625], loss: 1.013, per_step_time: 1472ms, lr: 1.4872577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:39,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43282 samples/s/p 2:54:29 } +2024-07-25 22:16:42,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1017/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 1.4866351e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:42,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43535 samples/s/p 2:54:21 } +2024-07-25 22:16:45,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1019/ 1625], loss: 1.061, per_step_time: 1470ms, lr: 1.4860129e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:45,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43975 samples/s/p 2:54:10 } +2024-07-25 22:16:48,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1021/ 1625], loss: 0.952, per_step_time: 1471ms, lr: 1.4853906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:48,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43640 samples/s/p 2:54:13 } +2024-07-25 22:16:51,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1023/ 
1625], loss: 1.159, per_step_time: 1472ms, lr: 1.4847682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:51,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43155 samples/s/p 2:54:20 } +2024-07-25 22:16:54,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1025/ 1625], loss: 1.158, per_step_time: 1470ms, lr: 1.4841458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:54,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.44105 samples/s/p 2:53:59 } +2024-07-25 22:16:56,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1027/ 1625], loss: 1.285, per_step_time: 1472ms, lr: 1.4835237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:56,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43138 samples/s/p 2:54:14 } +2024-07-25 22:16:59,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1029/ 1625], loss: 1.255, per_step_time: 1473ms, lr: 1.4829013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:59,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.42933 samples/s/p 2:54:15 } +2024-07-25 22:17:02,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1031/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.4822789e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:02,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43647 samples/s/p 2:53:59 } +2024-07-25 22:17:05,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1033/ 1625], loss: 1.072, per_step_time: 1470ms, lr: 1.4816568e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:17:05,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43933 samples/s/p 2:53:50 } +2024-07-25 22:17:08,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1035/ 1625], loss: 1.042, per_step_time: 1470ms, lr: 1.4810344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:08,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.44139 samples/s/p 2:53:43 } +2024-07-25 22:17:11,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1037/ 1625], loss: 0.982, per_step_time: 1470ms, lr: 1.4804124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:11,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43953 samples/s/p 2:53:44 } +2024-07-25 22:17:14,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1039/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 1.4797901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:14,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43515 samples/s/p 2:53:49 } +2024-07-25 22:17:17,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1041/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 1.4791677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:17,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43112 samples/s/p 2:53:54 } +2024-07-25 22:17:20,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1043/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 1.4785456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:20,604 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43347 samples/s/p 2:53:47 } +2024-07-25 22:17:23,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1045/ 1625], loss: 1.061, per_step_time: 1470ms, lr: 1.4779234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:23,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43849 samples/s/p 2:53:34 } +2024-07-25 22:17:26,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1047/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.4773011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:26,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43242 samples/s/p 2:53:43 } +2024-07-25 22:17:29,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1049/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 1.4766791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:29,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.44000 samples/s/p 2:53:25 } +2024-07-25 22:17:32,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1051/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 1.4760571e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:32,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.44072 samples/s/p 2:53:21 } +2024-07-25 22:17:35,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1053/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 1.4754348e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:35,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% 
|████████████████████████████ | 5.43230 samples/s/p 2:53:34 } +2024-07-25 22:17:38,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1055/ 1625], loss: 1.296, per_step_time: 1469ms, lr: 1.4748127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:38,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.44254 samples/s/p 2:53:12 } +2024-07-25 22:17:41,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1057/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.4741907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:41,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.43495 samples/s/p 2:53:23 } +2024-07-25 22:17:44,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1059/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.4735684e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:44,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.43519 samples/s/p 2:53:20 } +2024-07-25 22:17:47,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1061/ 1625], loss: 1.281, per_step_time: 1473ms, lr: 1.4729463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:47,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.42758 samples/s/p 2:53:32 } +2024-07-25 22:17:50,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1063/ 1625], loss: 1.011, per_step_time: 1472ms, lr: 1.4723245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:50,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.43387 samples/s/p 2:53:17 } +2024-07-25 22:17:53,058 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1065/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 1.4717026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:53,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.43894 samples/s/p 2:53:04 } +2024-07-25 22:17:56,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1067/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 1.4710804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:56,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.43072 samples/s/p 2:53:17 } +2024-07-25 22:17:58,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1069/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 1.4704584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:58,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.44042 samples/s/p 2:52:55 } +2024-07-25 22:18:01,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1071/ 1625], loss: 1.319, per_step_time: 1473ms, lr: 1.4698364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:01,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.42885 samples/s/p 2:53:14 } +2024-07-25 22:18:04,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1073/ 1625], loss: 1.048, per_step_time: 1474ms, lr: 1.4692143e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:04,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.42676 samples/s/p 2:53:15 } +2024-07-25 22:18:07,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1075/ 
1625], loss: 1.139, per_step_time: 1472ms, lr: 1.4685923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:07,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.43204 samples/s/p 2:53:02 } +2024-07-25 22:18:10,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1077/ 1625], loss: 1.056, per_step_time: 1471ms, lr: 1.4679705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:10,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.43550 samples/s/p 2:52:53 } +2024-07-25 22:18:13,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1079/ 1625], loss: 1.306, per_step_time: 1473ms, lr: 1.4673484e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:13,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.42919 samples/s/p 2:53:02 } +2024-07-25 22:18:16,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1081/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 1.4667266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:16,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.42920 samples/s/p 2:52:59 } +2024-07-25 22:18:19,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1083/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 1.4661047e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:19,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43503 samples/s/p 2:52:45 } +2024-07-25 22:18:22,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1085/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.46548255e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:18:22,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43114 samples/s/p 2:52:49 } +2024-07-25 22:18:25,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1087/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 1.4648608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:25,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43143 samples/s/p 2:52:46 } +2024-07-25 22:18:28,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1089/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 1.464239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:28,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43707 samples/s/p 2:52:32 } +2024-07-25 22:18:31,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1091/ 1625], loss: 1.007, per_step_time: 1472ms, lr: 1.4636169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:31,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43419 samples/s/p 2:52:35 } +2024-07-25 22:18:34,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1093/ 1625], loss: 1.229, per_step_time: 1474ms, lr: 1.4629953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:34,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.42694 samples/s/p 2:52:46 } +2024-07-25 22:18:37,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1095/ 1625], loss: 1.141, per_step_time: 1470ms, lr: 1.4623735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:37,344 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43913 samples/s/p 2:52:19 } +2024-07-25 22:18:40,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1097/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.4617516e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:40,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43451 samples/s/p 2:52:25 } +2024-07-25 22:18:43,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1099/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 1.4611298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:43,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43966 samples/s/p 2:52:12 } +2024-07-25 22:18:46,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1101/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 1.46050825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:46,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43883 samples/s/p 2:52:11 } +2024-07-25 22:18:49,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1103/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 1.4598862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:49,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43208 samples/s/p 2:52:21 } +2024-07-25 22:18:52,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1105/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.4592645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:52,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% 
|████████████████████████████ | 5.43444 samples/s/p 2:52:14 } +2024-07-25 22:18:55,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1107/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 1.458643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:55,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43756 samples/s/p 2:52:05 } +2024-07-25 22:18:57,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1109/ 1625], loss: 0.965, per_step_time: 1471ms, lr: 1.45802105e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:57,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43577 samples/s/p 2:52:05 } +2024-07-25 22:19:00,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1111/ 1625], loss: 1.025, per_step_time: 1470ms, lr: 1.4573995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:00,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.44022 samples/s/p 2:51:54 } +2024-07-25 22:19:03,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1113/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.4567779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:03,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43621 samples/s/p 2:51:58 } +2024-07-25 22:19:06,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1115/ 1625], loss: 0.994, per_step_time: 1469ms, lr: 1.456156e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:06,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.44363 samples/s/p 2:51:41 } +2024-07-25 22:19:09,790 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1117/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.4555345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:09,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43814 samples/s/p 2:51:49 } +2024-07-25 22:19:12,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1119/ 1625], loss: 1.343, per_step_time: 1471ms, lr: 1.45491285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:12,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43723 samples/s/p 2:51:48 } +2024-07-25 22:19:15,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1121/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 1.4542915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:15,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43621 samples/s/p 2:51:47 } +2024-07-25 22:19:18,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1123/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 1.4536697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:18,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43169 samples/s/p 2:51:52 } +2024-07-25 22:19:21,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1125/ 1625], loss: 1.374, per_step_time: 1473ms, lr: 1.4530483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:21,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43028 samples/s/p 2:51:52 } +2024-07-25 22:19:24,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1127/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 1.45242675e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:24,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43502 samples/s/p 2:51:40 } +2024-07-25 22:19:27,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1129/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.451805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:27,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43468 samples/s/p 2:51:38 } +2024-07-25 22:19:30,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1131/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 1.45118365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:30,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43757 samples/s/p 2:51:29 } +2024-07-25 22:19:33,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1133/ 1625], loss: 1.132, per_step_time: 1473ms, lr: 1.4505621e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:33,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.42774 samples/s/p 2:51:45 } +2024-07-25 22:19:36,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1135/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.4499405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:36,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43363 samples/s/p 2:51:31 } +2024-07-25 22:19:39,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1137/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 1.4493192e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:19:39,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43533 samples/s/p 2:51:25 } +2024-07-25 22:19:42,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1139/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 1.4486979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:42,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43553 samples/s/p 2:51:21 } +2024-07-25 22:19:45,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1141/ 1625], loss: 1.429, per_step_time: 1471ms, lr: 1.4480763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:45,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43518 samples/s/p 2:51:19 } +2024-07-25 22:19:48,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1143/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.4474548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:48,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43775 samples/s/p 2:51:11 } +2024-07-25 22:19:51,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1145/ 1625], loss: 0.981, per_step_time: 1470ms, lr: 1.4468337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:51,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.44011 samples/s/p 2:51:04 } +2024-07-25 22:19:54,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1147/ 1625], loss: 1.031, per_step_time: 1472ms, lr: 1.4462121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:54,058 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43368 samples/s/p 2:51:13 } +2024-07-25 22:19:57,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1149/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 1.4455908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:57,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43571 samples/s/p 2:51:06 } +2024-07-25 22:19:59,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1151/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 1.4449695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:59,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43578 samples/s/p 2:51:03 } +2024-07-25 22:20:02,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1153/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 1.4443482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:02,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43404 samples/s/p 2:51:04 } +2024-07-25 22:20:05,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1155/ 1625], loss: 1.054, per_step_time: 1473ms, lr: 1.443727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:05,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.42821 samples/s/p 2:51:12 } +2024-07-25 22:20:08,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1157/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 1.4431057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:08,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% 
|████████████████████████████ | 5.43736 samples/s/p 2:50:52 } +2024-07-25 22:20:11,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1159/ 1625], loss: 1.060, per_step_time: 1472ms, lr: 1.4424842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:11,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43396 samples/s/p 2:50:55 } +2024-07-25 22:20:14,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1161/ 1625], loss: 1.329, per_step_time: 1471ms, lr: 1.4418632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:14,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43723 samples/s/p 2:50:46 } +2024-07-25 22:20:17,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1163/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 1.441242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:17,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43624 samples/s/p 2:50:45 } +2024-07-25 22:20:20,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1165/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 1.4406206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:20,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43285 samples/s/p 2:50:48 } +2024-07-25 22:20:23,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1167/ 1625], loss: 1.212, per_step_time: 1472ms, lr: 1.4399996e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:23,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43475 samples/s/p 2:50:42 } +2024-07-25 22:20:26,522 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1169/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 1.4393786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:26,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43369 samples/s/p 2:50:41 } +2024-07-25 22:20:29,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1171/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 1.4387574e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:29,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43910 samples/s/p 2:50:28 } +2024-07-25 22:20:32,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1173/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.4381362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:32,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43278 samples/s/p 2:50:37 } +2024-07-25 22:20:35,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1175/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 1.4375152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:35,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43237 samples/s/p 2:50:34 } +2024-07-25 22:20:38,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1177/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.4368942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:38,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43612 samples/s/p 2:50:24 } +2024-07-25 22:20:41,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1179/ 
1625], loss: 1.121, per_step_time: 1472ms, lr: 1.4362731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:41,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43308 samples/s/p 2:50:27 } +2024-07-25 22:20:44,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1181/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 1.435652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:44,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43641 samples/s/p 2:50:18 } +2024-07-25 22:20:47,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1183/ 1625], loss: 1.148, per_step_time: 1474ms, lr: 1.4350312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:47,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.42625 samples/s/p 2:50:34 } +2024-07-25 22:20:50,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1185/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 1.4344101e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:50,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43386 samples/s/p 2:50:17 } +2024-07-25 22:20:53,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1187/ 1625], loss: 1.237, per_step_time: 1474ms, lr: 1.4337891e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:53,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.42497 samples/s/p 2:50:31 } +2024-07-25 22:20:56,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1189/ 1625], loss: 1.042, per_step_time: 1471ms, lr: 1.4331683e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 22:20:56,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43719 samples/s/p 2:50:05 } +2024-07-25 22:20:58,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1191/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 1.4325473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:58,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43409 samples/s/p 2:50:08 } +2024-07-25 22:21:01,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1193/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.4319266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:01,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43654 samples/s/p 2:50:00 } +2024-07-25 22:21:04,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1195/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 1.4313056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:04,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43954 samples/s/p 2:49:52 } +2024-07-25 22:21:07,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1197/ 1625], loss: 1.136, per_step_time: 1474ms, lr: 1.43068455e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:07,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.42437 samples/s/p 2:50:17 } +2024-07-25 22:21:10,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1199/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.4300639e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:10,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 57.4% |████████████████████████████ | 5.43756 samples/s/p 2:49:49 } +2024-07-25 22:21:13,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1201/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 1.4294431e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:13,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43287 samples/s/p 2:49:55 } +2024-07-25 22:21:16,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1203/ 1625], loss: 0.930, per_step_time: 1471ms, lr: 1.4288221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:16,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43578 samples/s/p 2:49:47 } +2024-07-25 22:21:19,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1205/ 1625], loss: 1.274, per_step_time: 1471ms, lr: 1.4282015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:19,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43701 samples/s/p 2:49:42 } +2024-07-25 22:21:22,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1207/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 1.4275809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:22,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43503 samples/s/p 2:49:42 } +2024-07-25 22:21:25,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1209/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 1.42696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:25,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43293 samples/s/p 2:49:43 } +2024-07-25 22:21:28,507 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1211/ 1625], loss: 1.000, per_step_time: 1470ms, lr: 1.42633935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:28,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43936 samples/s/p 2:49:28 } +2024-07-25 22:21:31,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1213/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 1.4257189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:31,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43928 samples/s/p 2:49:26 } +2024-07-25 22:21:34,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1215/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 1.425098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:34,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43301 samples/s/p 2:49:34 } +2024-07-25 22:21:37,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1217/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 1.4244773e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:37,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43824 samples/s/p 2:49:22 } +2024-07-25 22:21:40,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1219/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.423857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:40,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43815 samples/s/p 2:49:19 } +2024-07-25 22:21:43,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1221/ 
1625], loss: 0.899, per_step_time: 1471ms, lr: 1.4232365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:43,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43744 samples/s/p 2:49:17 } +2024-07-25 22:21:46,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1223/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 1.4226158e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:46,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43309 samples/s/p 2:49:22 } +2024-07-25 22:21:49,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1225/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.4219952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:49,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43566 samples/s/p 2:49:15 } +2024-07-25 22:21:52,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1227/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.4213749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:52,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43398 samples/s/p 2:49:15 } +2024-07-25 22:21:55,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1229/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 1.4207542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:55,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.42998 samples/s/p 2:49:19 } +2024-07-25 22:21:58,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1231/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 1.4201337e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:21:58,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43786 samples/s/p 2:49:02 } +2024-07-25 22:22:00,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1233/ 1625], loss: 0.931, per_step_time: 1470ms, lr: 1.4195134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:00,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.44039 samples/s/p 2:48:54 } +2024-07-25 22:22:03,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1235/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 1.4188929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:03,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43425 samples/s/p 2:49:03 } +2024-07-25 22:22:06,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1237/ 1625], loss: 1.022, per_step_time: 1471ms, lr: 1.4182727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:06,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43822 samples/s/p 2:48:52 } +2024-07-25 22:22:09,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1239/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 1.4176523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:09,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.44053 samples/s/p 2:48:45 } +2024-07-25 22:22:12,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1241/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 1.4170318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:12,764 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43735 samples/s/p 2:48:48 } +2024-07-25 22:22:15,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1243/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 1.4164116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:15,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43219 samples/s/p 2:48:55 } +2024-07-25 22:22:18,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1245/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 1.4157913e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:18,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43436 samples/s/p 2:48:48 } +2024-07-25 22:22:21,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1247/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 1.41517085e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:21,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43159 samples/s/p 2:48:50 } +2024-07-25 22:22:24,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1249/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 1.41455075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:24,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43818 samples/s/p 2:48:35 } +2024-07-25 22:22:27,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1251/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 1.4139307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:27,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% 
|████████████████████████████ | 5.43564 samples/s/p 2:48:36 } +2024-07-25 22:22:30,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1253/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 1.4133103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:30,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.42987 samples/s/p 2:48:44 } +2024-07-25 22:22:33,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1255/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 1.4126901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:33,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43821 samples/s/p 2:48:26 } +2024-07-25 22:22:36,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1257/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 1.4120702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:36,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43260 samples/s/p 2:48:33 } +2024-07-25 22:22:39,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1259/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.4114499e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:39,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43408 samples/s/p 2:48:28 } +2024-07-25 22:22:42,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1261/ 1625], loss: 1.102, per_step_time: 1474ms, lr: 1.4108297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:42,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.42646 samples/s/p 2:48:39 } +2024-07-25 22:22:45,235 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1263/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.4102098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:45,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43358 samples/s/p 2:48:23 } +2024-07-25 22:22:48,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1265/ 1625], loss: 1.264, per_step_time: 1472ms, lr: 1.4095896e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:48,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43475 samples/s/p 2:48:17 } +2024-07-25 22:22:51,140 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1267/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 1.4089698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:51,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43110 samples/s/p 2:48:21 } +2024-07-25 22:22:54,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1269/ 1625], loss: 1.280, per_step_time: 1470ms, lr: 1.4083497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:54,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.44192 samples/s/p 2:47:58 } +2024-07-25 22:22:57,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1271/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.40773e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:57,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43481 samples/s/p 2:48:09 } +2024-07-25 22:22:59,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1273/ 
1625], loss: 1.070, per_step_time: 1471ms, lr: 1.4071099e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:59,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43748 samples/s/p 2:48:01 } +2024-07-25 22:23:02,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1275/ 1625], loss: 1.249, per_step_time: 1470ms, lr: 1.40649e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:02,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43911 samples/s/p 2:47:55 } +2024-07-25 22:23:05,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1277/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 1.4058703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:05,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.43450 samples/s/p 2:48:00 } +2024-07-25 22:23:08,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1279/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 1.4052503e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:08,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.44030 samples/s/p 2:47:47 } +2024-07-25 22:23:11,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1281/ 1625], loss: 1.175, per_step_time: 1470ms, lr: 1.4046305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:11,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.43974 samples/s/p 2:47:45 } +2024-07-25 22:23:14,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1283/ 1625], loss: 1.002, per_step_time: 1469ms, lr: 1.4040107e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 22:23:14,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.44382 samples/s/p 2:47:34 } +2024-07-25 22:23:17,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1285/ 1625], loss: 1.079, per_step_time: 1470ms, lr: 1.4033908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:17,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.44144 samples/s/p 2:47:36 } +2024-07-25 22:23:20,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1287/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 1.4027712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:20,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.43901 samples/s/p 2:47:37 } +2024-07-25 22:23:23,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1289/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 1.4021515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:23,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.43111 samples/s/p 2:47:49 } +2024-07-25 22:23:26,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1291/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 1.4015315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:26,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.44198 samples/s/p 2:47:26 } +2024-07-25 22:23:29,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1293/ 1625], loss: 1.012, per_step_time: 1473ms, lr: 1.4009121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:29,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
58.0% |████████████████████████████ | 5.43059 samples/s/p 2:47:44 } +2024-07-25 22:23:32,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1295/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 1.4002926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:32,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.43736 samples/s/p 2:47:29 } +2024-07-25 22:23:35,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1297/ 1625], loss: 1.238, per_step_time: 1470ms, lr: 1.3996728e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:35,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.43960 samples/s/p 2:47:21 } +2024-07-25 22:23:38,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1299/ 1625], loss: 1.187, per_step_time: 1474ms, lr: 1.3990531e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:38,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.42440 samples/s/p 2:47:47 } +2024-07-25 22:23:41,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1301/ 1625], loss: 1.221, per_step_time: 1470ms, lr: 1.3984339e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:41,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.43944 samples/s/p 2:47:16 } +2024-07-25 22:23:44,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1303/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 1.39781405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:44,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.43978 samples/s/p 2:47:12 } +2024-07-25 
22:23:47,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1305/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.3971946e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:47,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.43339 samples/s/p 2:47:21 } +2024-07-25 22:23:50,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1307/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 1.3965752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:50,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.43666 samples/s/p 2:47:12 } +2024-07-25 22:23:53,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1309/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 1.3959557e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:53,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43470 samples/s/p 2:47:13 } +2024-07-25 22:23:56,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1311/ 1625], loss: 1.327, per_step_time: 1474ms, lr: 1.3953364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:56,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.42692 samples/s/p 2:47:24 } +2024-07-25 22:23:58,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1313/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 1.39471695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:58,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43741 samples/s/p 2:47:02 } +2024-07-25 22:24:01,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
6/ 10], step:[ 1315/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 1.3940975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:01,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43968 samples/s/p 2:46:55 } +2024-07-25 22:24:04,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1317/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 1.3934783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:04,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43866 samples/s/p 2:46:54 } +2024-07-25 22:24:07,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1319/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 1.3928589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:07,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43726 samples/s/p 2:46:53 } +2024-07-25 22:24:10,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1321/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 1.3922399e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:10,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43569 samples/s/p 2:46:53 } +2024-07-25 22:24:13,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1323/ 1625], loss: 1.333, per_step_time: 1472ms, lr: 1.3916205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:13,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43129 samples/s/p 2:46:58 } +2024-07-25 22:24:16,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1325/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 1.3910014e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:16,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43573 samples/s/p 2:46:47 } +2024-07-25 22:24:19,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1327/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.3903823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:19,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43308 samples/s/p 2:46:49 } +2024-07-25 22:24:22,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1329/ 1625], loss: 1.335, per_step_time: 1470ms, lr: 1.3897629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:22,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.44183 samples/s/p 2:46:30 } +2024-07-25 22:24:25,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1331/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 1.3891439e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:25,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43621 samples/s/p 2:46:38 } +2024-07-25 22:24:28,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1333/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 1.3885248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:28,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43501 samples/s/p 2:46:37 } +2024-07-25 22:24:31,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1335/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 1.38790565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:31,447 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43902 samples/s/p 2:46:27 } +2024-07-25 22:24:34,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1337/ 1625], loss: 1.012, per_step_time: 1472ms, lr: 1.3872867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:34,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43227 samples/s/p 2:46:36 } +2024-07-25 22:24:37,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1339/ 1625], loss: 1.116, per_step_time: 1470ms, lr: 1.3866679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:37,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43951 samples/s/p 2:46:20 } +2024-07-25 22:24:40,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1341/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 1.3860487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:40,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43407 samples/s/p 2:46:27 } +2024-07-25 22:24:43,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1343/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.3854297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:43,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43625 samples/s/p 2:46:20 } +2024-07-25 22:24:46,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1345/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 1.384811e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:46,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% 
|█████████████████████████████ | 5.43634 samples/s/p 2:46:17 } +2024-07-25 22:24:49,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1347/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 1.3841919e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:49,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43688 samples/s/p 2:46:13 } +2024-07-25 22:24:52,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1349/ 1625], loss: 1.235, per_step_time: 1473ms, lr: 1.3835732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:52,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43089 samples/s/p 2:46:21 } +2024-07-25 22:24:55,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1351/ 1625], loss: 1.178, per_step_time: 1469ms, lr: 1.3829544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:55,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.44406 samples/s/p 2:45:54 } +2024-07-25 22:24:58,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1353/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 1.38233545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:58,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.42929 samples/s/p 2:46:18 } +2024-07-25 22:25:00,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1355/ 1625], loss: 0.868, per_step_time: 1471ms, lr: 1.3817168e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:00,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43738 samples/s/p 2:46:00 } +2024-07-25 22:25:03,907 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1357/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.3810981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:03,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43257 samples/s/p 2:46:06 } +2024-07-25 22:25:06,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1359/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 1.3804793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:06,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43840 samples/s/p 2:45:52 } +2024-07-25 22:25:09,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1361/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 1.3798607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:09,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43395 samples/s/p 2:45:58 } +2024-07-25 22:25:12,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1363/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 1.3792423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:12,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43842 samples/s/p 2:45:47 } +2024-07-25 22:25:15,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1365/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 1.3786234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:15,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43679 samples/s/p 2:45:47 } +2024-07-25 22:25:18,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], 
step:[ 1367/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 1.3780049e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:18,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43756 samples/s/p 2:45:42 } +2024-07-25 22:25:21,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1369/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 1.3773865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:21,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43525 samples/s/p 2:45:43 } +2024-07-25 22:25:24,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1371/ 1625], loss: 1.344, per_step_time: 1472ms, lr: 1.376768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:24,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43251 samples/s/p 2:45:46 } +2024-07-25 22:25:27,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1373/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.3761493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:27,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43416 samples/s/p 2:45:40 } +2024-07-25 22:25:30,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1375/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 1.3755311e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:30,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43073 samples/s/p 2:45:43 } +2024-07-25 22:25:33,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1377/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 1.3749128e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:25:33,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43111 samples/s/p 2:45:39 } +2024-07-25 22:25:36,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1379/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 1.3742942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:36,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43056 samples/s/p 2:45:37 } +2024-07-25 22:25:39,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1381/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 1.3736759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:39,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43649 samples/s/p 2:45:24 } +2024-07-25 22:25:42,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1383/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 1.3730578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:42,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43497 samples/s/p 2:45:23 } +2024-07-25 22:25:45,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1385/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 1.3724393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:45,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43429 samples/s/p 2:45:22 } +2024-07-25 22:25:48,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1387/ 1625], loss: 1.092, per_step_time: 1470ms, lr: 1.371821e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:48,175 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43939 samples/s/p 2:45:09 } +2024-07-25 22:25:51,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1389/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.371203e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:51,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43830 samples/s/p 2:45:08 } +2024-07-25 22:25:54,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1391/ 1625], loss: 1.341, per_step_time: 1472ms, lr: 1.3705846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:54,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43431 samples/s/p 2:45:13 } +2024-07-25 22:25:57,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1393/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 1.3699666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:57,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43076 samples/s/p 2:45:16 } +2024-07-25 22:25:59,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1395/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.3693485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:59,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43340 samples/s/p 2:45:09 } +2024-07-25 22:26:02,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1397/ 1625], loss: 1.101, per_step_time: 1472ms, lr: 1.3687302e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:02,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% 
|█████████████████████████████ | 5.43427 samples/s/p 2:45:04 } +2024-07-25 22:26:05,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1399/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 1.3681123e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:05,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43481 samples/s/p 2:45:00 } +2024-07-25 22:26:08,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1401/ 1625], loss: 1.103, per_step_time: 1471ms, lr: 1.3674943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:08,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43490 samples/s/p 2:44:57 } +2024-07-25 22:26:11,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1403/ 1625], loss: 1.364, per_step_time: 1473ms, lr: 1.366876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:11,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43017 samples/s/p 2:45:03 } +2024-07-25 22:26:14,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1405/ 1625], loss: 0.935, per_step_time: 1470ms, lr: 1.3662583e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:14,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43930 samples/s/p 2:44:43 } +2024-07-25 22:26:17,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1407/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 1.3656406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:17,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43566 samples/s/p 2:44:47 } +2024-07-25 22:26:20,639 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1409/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 1.3650226e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:20,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43462 samples/s/p 2:44:46 } +2024-07-25 22:26:23,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1411/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 1.3644046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:23,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43947 samples/s/p 2:44:34 } +2024-07-25 22:26:26,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1413/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 1.363787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:26,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.42820 samples/s/p 2:44:52 } +2024-07-25 22:26:29,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1415/ 1625], loss: 1.102, per_step_time: 1475ms, lr: 1.363169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:29,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.42349 samples/s/p 2:44:57 } +2024-07-25 22:26:32,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1417/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.3625513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:32,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43720 samples/s/p 2:44:29 } +2024-07-25 22:26:35,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1419/ 1625], loss: 1.315, per_step_time: 1471ms, lr: 1.3619338e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:35,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43639 samples/s/p 2:44:28 } +2024-07-25 22:26:38,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1421/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 1.3613162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:38,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43662 samples/s/p 2:44:24 } +2024-07-25 22:26:41,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1423/ 1625], loss: 0.930, per_step_time: 1470ms, lr: 1.3606985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:41,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43919 samples/s/p 2:44:17 } +2024-07-25 22:26:44,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1425/ 1625], loss: 1.023, per_step_time: 1471ms, lr: 1.36008075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:44,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43671 samples/s/p 2:44:18 } +2024-07-25 22:26:47,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1427/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 1.3594635e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:47,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.44204 samples/s/p 2:44:06 } +2024-07-25 22:26:50,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1429/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.3588457e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:26:50,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43184 samples/s/p 2:44:21 } +2024-07-25 22:26:53,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1431/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 1.3582282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:53,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43037 samples/s/p 2:44:21 } +2024-07-25 22:26:56,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1433/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.3576108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:56,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43501 samples/s/p 2:44:10 } +2024-07-25 22:26:59,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1435/ 1625], loss: 1.258, per_step_time: 1471ms, lr: 1.3569933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:59,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43560 samples/s/p 2:44:06 } +2024-07-25 22:27:01,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1437/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 1.356376e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:01,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43574 samples/s/p 2:44:02 } +2024-07-25 22:27:04,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1439/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.35575865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:04,907 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43595 samples/s/p 2:43:59 } +2024-07-25 22:27:07,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1441/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 1.3551411e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:07,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43196 samples/s/p 2:44:03 } +2024-07-25 22:27:10,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1443/ 1625], loss: 1.201, per_step_time: 1474ms, lr: 1.3545241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:10,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.42600 samples/s/p 2:44:11 } +2024-07-25 22:27:13,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1445/ 1625], loss: 1.307, per_step_time: 1471ms, lr: 1.3539068e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:13,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43700 samples/s/p 2:43:48 } +2024-07-25 22:27:16,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1447/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 1.3532894e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:16,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43857 samples/s/p 2:43:43 } +2024-07-25 22:27:19,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1449/ 1625], loss: 1.323, per_step_time: 1475ms, lr: 1.3526724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:19,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% 
|█████████████████████████████ | 5.42304 samples/s/p 2:44:08 } +2024-07-25 22:27:22,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1451/ 1625], loss: 1.318, per_step_time: 1470ms, lr: 1.3520554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:22,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43964 samples/s/p 2:43:35 } +2024-07-25 22:27:25,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1453/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.3514381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:25,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43561 samples/s/p 2:43:39 } +2024-07-25 22:27:28,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1455/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 1.350821e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:28,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43512 samples/s/p 2:43:37 } +2024-07-25 22:27:31,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1457/ 1625], loss: 1.119, per_step_time: 1470ms, lr: 1.3502042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:31,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43907 samples/s/p 2:43:27 } +2024-07-25 22:27:34,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1459/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 1.349587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:34,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.42851 samples/s/p 2:43:43 } +2024-07-25 22:27:37,381 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1461/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 1.34897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:37,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.42854 samples/s/p 2:43:40 } +2024-07-25 22:27:40,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1463/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 1.3483533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:40,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43340 samples/s/p 2:43:28 } +2024-07-25 22:27:43,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1465/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 1.3477362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:43,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43736 samples/s/p 2:43:18 } +2024-07-25 22:27:46,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1467/ 1625], loss: 1.072, per_step_time: 1474ms, lr: 1.3471195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:46,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.42732 samples/s/p 2:43:34 } +2024-07-25 22:27:49,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1469/ 1625], loss: 1.321, per_step_time: 1472ms, lr: 1.3465027e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:49,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43195 samples/s/p 2:43:22 } +2024-07-25 22:27:52,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1471/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 1.3458862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:52,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.43508 samples/s/p 2:43:14 } +2024-07-25 22:27:55,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1473/ 1625], loss: 1.191, per_step_time: 1473ms, lr: 1.3452693e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:55,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.42880 samples/s/p 2:43:22 } +2024-07-25 22:27:58,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1475/ 1625], loss: 1.164, per_step_time: 1473ms, lr: 1.34465245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:58,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.42989 samples/s/p 2:43:17 } +2024-07-25 22:28:01,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1477/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 1.344036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:01,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.42909 samples/s/p 2:43:16 } +2024-07-25 22:28:03,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1479/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 1.3434192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:03,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.43662 samples/s/p 2:42:59 } +2024-07-25 22:28:06,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1481/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 1.3428028e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:28:06,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.43618 samples/s/p 2:42:57 } +2024-07-25 22:28:09,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1483/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 1.3421862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:09,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.43230 samples/s/p 2:43:01 } +2024-07-25 22:28:12,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1485/ 1625], loss: 1.308, per_step_time: 1473ms, lr: 1.3415694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:12,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.42823 samples/s/p 2:43:05 } +2024-07-25 22:28:15,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1487/ 1625], loss: 1.019, per_step_time: 1470ms, lr: 1.3409533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:15,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.44041 samples/s/p 2:42:41 } +2024-07-25 22:28:18,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1489/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.3403368e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:18,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43838 samples/s/p 2:42:41 } +2024-07-25 22:28:21,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1491/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 1.3397202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:21,662 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43201 samples/s/p 2:42:50 } +2024-07-25 22:28:24,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1493/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 1.3391041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:24,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43597 samples/s/p 2:42:40 } +2024-07-25 22:28:27,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1495/ 1625], loss: 1.274, per_step_time: 1470ms, lr: 1.3384878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:27,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.44092 samples/s/p 2:42:28 } +2024-07-25 22:28:30,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1497/ 1625], loss: 1.022, per_step_time: 1471ms, lr: 1.3378714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:30,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43567 samples/s/p 2:42:34 } +2024-07-25 22:28:33,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1499/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 1.33725525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:33,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.44024 samples/s/p 2:42:23 } +2024-07-25 22:28:36,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1501/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 1.3366392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:36,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% 
|█████████████████████████████ | 5.43771 samples/s/p 2:42:25 } +2024-07-25 22:28:39,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1503/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 1.3360228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:39,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43426 samples/s/p 2:42:28 } +2024-07-25 22:28:42,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1505/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.3354069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:42,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43655 samples/s/p 2:42:21 } +2024-07-25 22:28:45,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1507/ 1625], loss: 1.030, per_step_time: 1469ms, lr: 1.3347908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:45,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.44470 samples/s/p 2:42:03 } +2024-07-25 22:28:48,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1509/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 1.3341745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:48,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43527 samples/s/p 2:42:17 } +2024-07-25 22:28:51,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1511/ 1625], loss: 1.040, per_step_time: 1473ms, lr: 1.3335588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:51,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.42966 samples/s/p 2:42:25 } +2024-07-25 22:28:54,112 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1513/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.3329428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:54,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43356 samples/s/p 2:42:15 } +2024-07-25 22:28:57,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1515/ 1625], loss: 1.112, per_step_time: 1470ms, lr: 1.3323266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:57,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.44036 samples/s/p 2:41:59 } +2024-07-25 22:29:00,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1517/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.331711e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:00,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43744 samples/s/p 2:42:02 } +2024-07-25 22:29:02,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1519/ 1625], loss: 0.962, per_step_time: 1471ms, lr: 1.3310952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:02,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43842 samples/s/p 2:41:57 } +2024-07-25 22:29:05,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1521/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 1.3304794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:05,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43458 samples/s/p 2:42:01 } +2024-07-25 22:29:08,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1523/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 1.3298636e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:08,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.44067 samples/s/p 2:41:47 } +2024-07-25 22:29:11,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1525/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.329248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:11,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43199 samples/s/p 2:42:00 } +2024-07-25 22:29:14,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1527/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.3286323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:14,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43230 samples/s/p 2:41:56 } +2024-07-25 22:29:17,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1529/ 1625], loss: 1.232, per_step_time: 1470ms, lr: 1.3280165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:17,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43966 samples/s/p 2:41:40 } +2024-07-25 22:29:20,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1531/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 1.3274011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:20,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43202 samples/s/p 2:41:51 } +2024-07-25 22:29:23,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1533/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 1.3267857e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:29:23,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43400 samples/s/p 2:41:44 } +2024-07-25 22:29:26,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1535/ 1625], loss: 1.312, per_step_time: 1473ms, lr: 1.32617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:26,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43108 samples/s/p 2:41:47 } +2024-07-25 22:29:29,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1537/ 1625], loss: 1.220, per_step_time: 1473ms, lr: 1.3255545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:29,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.42938 samples/s/p 2:41:47 } +2024-07-25 22:29:32,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1539/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.3249392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:32,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43377 samples/s/p 2:41:36 } +2024-07-25 22:29:35,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1541/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 1.3243237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:35,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43672 samples/s/p 2:41:28 } +2024-07-25 22:29:38,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1543/ 1625], loss: 1.092, per_step_time: 1470ms, lr: 1.3237083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:38,372 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.44008 samples/s/p 2:41:19 } +2024-07-25 22:29:41,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1545/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 1.32309315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:41,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43489 samples/s/p 2:41:25 } +2024-07-25 22:29:44,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1547/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 1.3224778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:44,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43278 samples/s/p 2:41:26 } +2024-07-25 22:29:47,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1549/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.3218627e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:47,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43374 samples/s/p 2:41:21 } +2024-07-25 22:29:50,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1551/ 1625], loss: 1.002, per_step_time: 1472ms, lr: 1.3212475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:50,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43445 samples/s/p 2:41:17 } +2024-07-25 22:29:53,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1553/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 1.3206322e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:53,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% 
|█████████████████████████████ | 5.43607 samples/s/p 2:41:11 } +2024-07-25 22:29:56,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1555/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 1.3200172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:56,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.43605 samples/s/p 2:41:08 } +2024-07-25 22:29:59,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1557/ 1625], loss: 1.169, per_step_time: 1473ms, lr: 1.3194022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:59,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.42990 samples/s/p 2:41:16 } +2024-07-25 22:30:01,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1559/ 1625], loss: 1.376, per_step_time: 1474ms, lr: 1.31878705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:01,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.42635 samples/s/p 2:41:20 } +2024-07-25 22:30:04,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1561/ 1625], loss: 1.270, per_step_time: 1473ms, lr: 1.3181722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:04,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.42902 samples/s/p 2:41:12 } +2024-07-25 22:30:07,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1563/ 1625], loss: 1.315, per_step_time: 1470ms, lr: 1.3175575e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:07,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.43905 samples/s/p 2:40:51 } +2024-07-25 22:30:10,848 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1565/ 1625], loss: 1.237, per_step_time: 1473ms, lr: 1.3169424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:10,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.42755 samples/s/p 2:41:09 } +2024-07-25 22:30:13,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1567/ 1625], loss: 1.276, per_step_time: 1472ms, lr: 1.3163276e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:13,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.43111 samples/s/p 2:40:59 } +2024-07-25 22:30:16,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1569/ 1625], loss: 0.974, per_step_time: 1472ms, lr: 1.315713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:16,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43260 samples/s/p 2:40:54 } +2024-07-25 22:30:19,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1571/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 1.3150981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:19,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43831 samples/s/p 2:40:41 } +2024-07-25 22:30:22,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1573/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 1.3144833e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:22,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43540 samples/s/p 2:40:43 } +2024-07-25 22:30:25,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1575/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.3138689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:25,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43679 samples/s/p 2:40:38 } +2024-07-25 22:30:28,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1577/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.3132543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:28,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43509 samples/s/p 2:40:38 } +2024-07-25 22:30:31,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1579/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.3126396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:31,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43578 samples/s/p 2:40:33 } +2024-07-25 22:30:34,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1581/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.31202505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:34,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43125 samples/s/p 2:40:39 } +2024-07-25 22:30:37,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1583/ 1625], loss: 1.098, per_step_time: 1473ms, lr: 1.3114108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:37,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43070 samples/s/p 2:40:37 } +2024-07-25 22:30:40,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1585/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 1.3107961e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:30:40,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43426 samples/s/p 2:40:27 } +2024-07-25 22:30:43,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1587/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 1.3101817e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:43,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43441 samples/s/p 2:40:24 } +2024-07-25 22:30:46,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1589/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 1.3095676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:46,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43906 samples/s/p 2:40:13 } +2024-07-25 22:30:49,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1591/ 1625], loss: 1.035, per_step_time: 1471ms, lr: 1.30895305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:49,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43525 samples/s/p 2:40:17 } +2024-07-25 22:30:52,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1593/ 1625], loss: 1.059, per_step_time: 1475ms, lr: 1.3083389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:52,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.42252 samples/s/p 2:40:36 } +2024-07-25 22:30:55,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1595/ 1625], loss: 1.291, per_step_time: 1472ms, lr: 1.3077247e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:55,124 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43335 samples/s/p 2:40:14 } +2024-07-25 22:30:58,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1597/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 1.3071103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:58,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43474 samples/s/p 2:40:09 } +2024-07-25 22:31:01,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1599/ 1625], loss: 1.297, per_step_time: 1473ms, lr: 1.3064964e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:01,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43046 samples/s/p 2:40:13 } +2024-07-25 22:31:03,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1601/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 1.3058823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:03,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43489 samples/s/p 2:40:03 } +2024-07-25 22:31:06,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1603/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 1.30526805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:06,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.44035 samples/s/p 2:39:50 } +2024-07-25 22:31:09,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1605/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.3046542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:09,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% 
|█████████████████████████████ | 5.43350 samples/s/p 2:39:59 } +2024-07-25 22:31:12,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1607/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 1.3040404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:12,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43447 samples/s/p 2:39:55 } +2024-07-25 22:31:15,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1609/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 1.3034263e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:15,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43254 samples/s/p 2:39:55 } +2024-07-25 22:31:18,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1611/ 1625], loss: 1.346, per_step_time: 1472ms, lr: 1.3028125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:18,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43435 samples/s/p 2:39:49 } +2024-07-25 22:31:21,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1613/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 1.3021988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:21,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43449 samples/s/p 2:39:46 } +2024-07-25 22:31:24,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1615/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 1.301585e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:24,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43548 samples/s/p 2:39:41 } +2024-07-25 22:31:27,584 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1617/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 1.3009712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:27,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.44116 samples/s/p 2:39:28 } +2024-07-25 22:31:30,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1619/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 1.3003577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:30,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.43021 samples/s/p 2:39:44 } +2024-07-25 22:31:33,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1621/ 1625], loss: 1.197, per_step_time: 1473ms, lr: 1.2997442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:33,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.43054 samples/s/p 2:39:41 } +2024-07-25 22:31:36,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1623/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 1.2991304e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:36,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.43760 samples/s/p 2:39:25 } +2024-07-25 22:31:39,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1625/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 1.2985169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:39,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.43108 samples/s/p 2:39:34 } +2024-07-25 22:31:42,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
2/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 1.2979036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:42,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.43723 samples/s/p 2:39:20 } +2024-07-25 22:31:45,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 4/ 1625], loss: 1.063, per_step_time: 1470ms, lr: 1.29729e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:45,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.43961 samples/s/p 2:39:13 } +2024-07-25 22:31:48,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 6/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 1.2966765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:48,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.43617 samples/s/p 2:39:16 } +2024-07-25 22:31:51,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 8/ 1625], loss: 1.054, per_step_time: 1470ms, lr: 1.2960634e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:51,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.44044 samples/s/p 2:39:06 } +2024-07-25 22:31:54,140 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 10/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 1.2954499e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:54,140 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43806 samples/s/p 2:39:07 } +2024-07-25 22:31:57,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 12/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 1.2948367e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 22:31:57,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43976 samples/s/p 2:39:01 } +2024-07-25 22:32:00,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 14/ 1625], loss: 1.305, per_step_time: 1469ms, lr: 1.2942235e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:00,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.44364 samples/s/p 2:38:51 } +2024-07-25 22:32:02,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 16/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 1.2936102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:02,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43459 samples/s/p 2:39:04 } +2024-07-25 22:32:05,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 18/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 1.2929972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:05,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43905 samples/s/p 2:38:54 } +2024-07-25 22:32:08,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 20/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 1.29238415e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:08,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43554 samples/s/p 2:38:57 } +2024-07-25 22:32:11,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 22/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 1.2917709e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:11,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 60.1% |██████████████████████████████ | 5.43307 samples/s/p 2:38:58 } +2024-07-25 22:32:14,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 24/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 1.29115815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:14,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43347 samples/s/p 2:38:54 } +2024-07-25 22:32:17,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 26/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 1.2905453e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:17,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43315 samples/s/p 2:38:52 } +2024-07-25 22:32:20,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 28/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 1.2899323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:20,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43722 samples/s/p 2:38:42 } +2024-07-25 22:32:23,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 30/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 1.2893195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:23,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43483 samples/s/p 2:38:43 } +2024-07-25 22:32:26,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 32/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 1.2887069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:26,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43642 samples/s/p 2:38:38 } +2024-07-25 
22:32:29,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 34/ 1625], loss: 1.296, per_step_time: 1473ms, lr: 1.288094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:29,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43058 samples/s/p 2:38:45 } +2024-07-25 22:32:32,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 36/ 1625], loss: 0.999, per_step_time: 1472ms, lr: 1.28748125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:32,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43432 samples/s/p 2:38:35 } +2024-07-25 22:32:35,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 38/ 1625], loss: 1.306, per_step_time: 1473ms, lr: 1.2868688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:35,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.42986 samples/s/p 2:38:40 } +2024-07-25 22:32:38,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 40/ 1625], loss: 1.321, per_step_time: 1470ms, lr: 1.286256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:38,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43893 samples/s/p 2:38:21 } +2024-07-25 22:32:41,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 42/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 1.2856436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:41,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43364 samples/s/p 2:38:28 } +2024-07-25 22:32:44,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 
10], step:[ 44/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.2850312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:44,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43551 samples/s/p 2:38:21 } +2024-07-25 22:32:47,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 46/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.2844189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:47,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43804 samples/s/p 2:38:14 } +2024-07-25 22:32:50,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 48/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 1.2838063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:50,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43399 samples/s/p 2:38:18 } +2024-07-25 22:32:53,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 50/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 1.2831941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:53,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43111 samples/s/p 2:38:20 } +2024-07-25 22:32:53,156 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 22:33:28,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 52/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 1.2825818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:28,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43999 samples/s/p 2:38:02 } +2024-07-25 22:33:31,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 54/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.2819694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:31,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43302 samples/s/p 2:38:11 } +2024-07-25 22:33:34,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 56/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 1.2813573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:34,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43013 samples/s/p 2:38:13 } +2024-07-25 22:33:37,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 58/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 1.2807452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:37,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43215 samples/s/p 2:38:07 } +2024-07-25 22:33:40,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 60/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 1.280133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:40,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43209 samples/s/p 2:38:04 } +2024-07-25 22:33:43,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 62/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 1.2795211e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:43,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43234 samples/s/p 2:38:00 } +2024-07-25 22:33:46,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 64/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 1.2789093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:46,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43816 samples/s/p 2:37:47 } +2024-07-25 22:33:49,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 66/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 1.2782971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:49,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43408 samples/s/p 2:37:52 } +2024-07-25 22:33:52,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 68/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.2776852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:52,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43160 samples/s/p 2:37:53 } +2024-07-25 22:33:55,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 70/ 1625], loss: 1.314, per_step_time: 1471ms, lr: 1.2770735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:55,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43554 samples/s/p 2:37:43 } +2024-07-25 22:33:58,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 72/ 1625], loss: 1.026, per_step_time: 1469ms, lr: 1.2764615e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:58,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.44398 samples/s/p 2:37:26 } +2024-07-25 22:34:01,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 74/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 1.2758497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:01,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43818 samples/s/p 2:37:33 } +2024-07-25 22:34:04,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 76/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 1.2752383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:04,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43674 samples/s/p 2:37:32 } +2024-07-25 22:34:07,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 78/ 1625], loss: 1.090, per_step_time: 1473ms, lr: 1.27462645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:07,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.42800 samples/s/p 2:37:44 } +2024-07-25 22:34:10,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 80/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.274015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:10,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43767 samples/s/p 2:37:25 } +2024-07-25 22:34:13,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 82/ 1625], loss: 1.343, per_step_time: 1470ms, lr: 1.27340345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:13,207 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43926 samples/s/p 2:37:19 } +2024-07-25 22:34:16,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 84/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 1.2727917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:16,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43374 samples/s/p 2:37:26 } +2024-07-25 22:34:19,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 86/ 1625], loss: 1.037, per_step_time: 1472ms, lr: 1.27218045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:19,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43118 samples/s/p 2:37:27 } +2024-07-25 22:34:22,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 88/ 1625], loss: 1.059, per_step_time: 1471ms, lr: 1.2715691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:22,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43490 samples/s/p 2:37:18 } +2024-07-25 22:34:25,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 90/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.27095755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:25,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43278 samples/s/p 2:37:18 } +2024-07-25 22:34:27,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 92/ 1625], loss: 0.967, per_step_time: 1471ms, lr: 1.2703464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:27,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% 
|██████████████████████████████ | 5.43659 samples/s/p 2:37:09 } +2024-07-25 22:34:30,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 94/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 1.2697354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:30,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43777 samples/s/p 2:37:04 } +2024-07-25 22:34:33,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 96/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.2691242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:33,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43298 samples/s/p 2:37:09 } +2024-07-25 22:34:36,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 98/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 1.2685128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:37,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43460 samples/s/p 2:37:04 } +2024-07-25 22:34:40,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 100/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 1.2679019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:40,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43840 samples/s/p 2:36:54 } +2024-07-25 22:34:43,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 102/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 1.2672909e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:43,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43283 samples/s/p 2:37:01 } +2024-07-25 22:34:46,165 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 104/ 1625], loss: 0.993, per_step_time: 1470ms, lr: 1.2666797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:46,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.44031 samples/s/p 2:36:45 } +2024-07-25 22:34:49,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 106/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 1.266069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:49,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43441 samples/s/p 2:36:52 } +2024-07-25 22:34:52,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 108/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 1.2654583e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:52,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43354 samples/s/p 2:36:51 } +2024-07-25 22:34:55,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 110/ 1625], loss: 1.074, per_step_time: 1470ms, lr: 1.2648473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:55,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43923 samples/s/p 2:36:38 } +2024-07-25 22:34:57,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 112/ 1625], loss: 1.006, per_step_time: 1472ms, lr: 1.2642366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:57,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43158 samples/s/p 2:36:48 } +2024-07-25 22:35:00,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
114/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 1.263626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:00,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43352 samples/s/p 2:36:42 } +2024-07-25 22:35:03,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 116/ 1625], loss: 1.261, per_step_time: 1470ms, lr: 1.2630152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:03,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43985 samples/s/p 2:36:28 } +2024-07-25 22:35:06,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 118/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 1.2624045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:06,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43372 samples/s/p 2:36:36 } +2024-07-25 22:35:09,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 120/ 1625], loss: 1.198, per_step_time: 1473ms, lr: 1.2617941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:09,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.42874 samples/s/p 2:36:41 } +2024-07-25 22:35:12,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 122/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 1.2611835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:12,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43571 samples/s/p 2:36:26 } +2024-07-25 22:35:15,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 124/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 1.2605732e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:35:15,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43181 samples/s/p 2:36:30 } +2024-07-25 22:35:18,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 126/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 1.2599628e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:18,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43798 samples/s/p 2:36:17 } +2024-07-25 22:35:21,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 128/ 1625], loss: 0.983, per_step_time: 1471ms, lr: 1.2593522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:21,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43542 samples/s/p 2:36:18 } +2024-07-25 22:35:24,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 130/ 1625], loss: 0.971, per_step_time: 1470ms, lr: 1.2587421e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:24,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.44070 samples/s/p 2:36:06 } +2024-07-25 22:35:27,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 132/ 1625], loss: 1.032, per_step_time: 1471ms, lr: 1.25813185e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:27,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43639 samples/s/p 2:36:10 } +2024-07-25 22:35:30,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 134/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 1.2575216e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:30,428 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43727 samples/s/p 2:36:06 } +2024-07-25 22:35:33,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 136/ 1625], loss: 0.975, per_step_time: 1472ms, lr: 1.2569116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:33,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43450 samples/s/p 2:36:08 } +2024-07-25 22:35:36,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 138/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.2563017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:36,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43207 samples/s/p 2:36:09 } +2024-07-25 22:35:39,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 140/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 1.2556915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:39,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43596 samples/s/p 2:35:59 } +2024-07-25 22:35:42,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 142/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 1.2550816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:42,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.44008 samples/s/p 2:35:49 } +2024-07-25 22:35:45,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 144/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 1.2544717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:45,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% 
|██████████████████████████████ | 5.43302 samples/s/p 2:35:59 } +2024-07-25 22:35:48,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 146/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 1.2538619e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:48,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43549 samples/s/p 2:35:51 } +2024-07-25 22:35:51,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 148/ 1625], loss: 1.145, per_step_time: 1470ms, lr: 1.2532519e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:51,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43939 samples/s/p 2:35:42 } +2024-07-25 22:35:54,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 150/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 1.2526423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:54,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43315 samples/s/p 2:35:50 } +2024-07-25 22:35:56,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 152/ 1625], loss: 1.047, per_step_time: 1472ms, lr: 1.2520328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:56,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43439 samples/s/p 2:35:44 } +2024-07-25 22:35:59,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 154/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 1.2514231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:59,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43494 samples/s/p 2:35:41 } +2024-07-25 22:36:02,887 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 156/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 1.2508134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:02,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43543 samples/s/p 2:35:37 } +2024-07-25 22:36:05,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 158/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 1.2502041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:05,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43525 samples/s/p 2:35:34 } +2024-07-25 22:36:08,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 160/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.2495944e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:08,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43192 samples/s/p 2:35:37 } +2024-07-25 22:36:11,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 162/ 1625], loss: 1.198, per_step_time: 1470ms, lr: 1.248985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:11,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.44087 samples/s/p 2:35:19 } +2024-07-25 22:36:14,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 164/ 1625], loss: 1.026, per_step_time: 1473ms, lr: 1.2483758e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:14,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.42857 samples/s/p 2:35:37 } +2024-07-25 22:36:17,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
166/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 1.2477663e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:17,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43278 samples/s/p 2:35:27 } +2024-07-25 22:36:20,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 168/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.24715725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:20,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43263 samples/s/p 2:35:24 } +2024-07-25 22:36:23,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 170/ 1625], loss: 1.299, per_step_time: 1474ms, lr: 1.2465481e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:23,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.42704 samples/s/p 2:35:31 } +2024-07-25 22:36:26,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 172/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 1.2459387e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:26,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43216 samples/s/p 2:35:19 } +2024-07-25 22:36:29,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 174/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 1.2453298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:29,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43507 samples/s/p 2:35:11 } +2024-07-25 22:36:32,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 176/ 1625], loss: 1.009, per_step_time: 1472ms, lr: 1.2447208e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:36:32,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43174 samples/s/p 2:35:14 } +2024-07-25 22:36:35,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 178/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 1.2441116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:35,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.42951 samples/s/p 2:35:15 } +2024-07-25 22:36:38,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 180/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 1.2435029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:38,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43767 samples/s/p 2:34:58 } +2024-07-25 22:36:41,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 182/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.2428942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:41,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43323 samples/s/p 2:35:02 } +2024-07-25 22:36:44,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 184/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 1.2422852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:44,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43628 samples/s/p 2:34:54 } +2024-07-25 22:36:47,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 186/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 1.24167655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:47,166 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43555 samples/s/p 2:34:52 } +2024-07-25 22:36:50,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 188/ 1625], loss: 1.239, per_step_time: 1470ms, lr: 1.241068e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:50,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43924 samples/s/p 2:34:43 } +2024-07-25 22:36:53,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 190/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 1.2404592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:53,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43332 samples/s/p 2:34:50 } +2024-07-25 22:36:56,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 192/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.23985055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:56,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43159 samples/s/p 2:34:50 } +2024-07-25 22:36:58,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 194/ 1625], loss: 1.022, per_step_time: 1470ms, lr: 1.2392423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:58,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43858 samples/s/p 2:34:35 } +2024-07-25 22:37:01,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 196/ 1625], loss: 0.987, per_step_time: 1471ms, lr: 1.2386339e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:01,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% 
|██████████████████████████████ | 5.43734 samples/s/p 2:34:35 } +2024-07-25 22:37:04,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 198/ 1625], loss: 1.417, per_step_time: 1472ms, lr: 1.2380254e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:04,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43176 samples/s/p 2:34:41 } +2024-07-25 22:37:07,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 200/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 1.237417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:07,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43735 samples/s/p 2:34:29 } +2024-07-25 22:37:10,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 202/ 1625], loss: 1.109, per_step_time: 1470ms, lr: 1.2368088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:10,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43965 samples/s/p 2:34:22 } +2024-07-25 22:37:13,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 204/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 1.2362005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:13,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.43161 samples/s/p 2:34:33 } +2024-07-25 22:37:16,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 206/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 1.2355923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:16,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.43691 samples/s/p 2:34:21 } +2024-07-25 22:37:19,620 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 208/ 1625], loss: 1.164, per_step_time: 1470ms, lr: 1.2349844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:19,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.44049 samples/s/p 2:34:12 } +2024-07-25 22:37:22,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 210/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 1.2343762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:22,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.43312 samples/s/p 2:34:21 } +2024-07-25 22:37:25,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 212/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 1.2337684e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:25,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.43105 samples/s/p 2:34:22 } +2024-07-25 22:37:28,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 214/ 1625], loss: 1.160, per_step_time: 1474ms, lr: 1.2331604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:28,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.42675 samples/s/p 2:34:26 } +2024-07-25 22:37:31,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 216/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 1.2325523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:31,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.43651 samples/s/p 2:34:07 } +2024-07-25 22:37:34,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
218/ 1625], loss: 1.169, per_step_time: 1474ms, lr: 1.2319448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:34,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.42708 samples/s/p 2:34:20 } +2024-07-25 22:37:37,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 220/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 1.2313371e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:37,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43607 samples/s/p 2:34:01 } +2024-07-25 22:37:40,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 222/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 1.2307292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:40,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.42893 samples/s/p 2:34:11 } +2024-07-25 22:37:43,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 224/ 1625], loss: 0.964, per_step_time: 1483ms, lr: 1.2301216e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:43,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.39267 samples/s/p 2:35:10 } +2024-07-25 22:37:46,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 226/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 1.22951415e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:46,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43482 samples/s/p 2:33:55 } +2024-07-25 22:37:49,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 228/ 1625], loss: 1.149, per_step_time: 1469ms, lr: 1.2289065e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:37:49,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.44254 samples/s/p 2:33:39 } +2024-07-25 22:37:52,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 230/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 1.2282991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:52,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43703 samples/s/p 2:33:45 } +2024-07-25 22:37:55,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 232/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 1.2276918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:55,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43786 samples/s/p 2:33:41 } +2024-07-25 22:37:58,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 234/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 1.2270843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:58,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43255 samples/s/p 2:33:47 } +2024-07-25 22:38:00,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 236/ 1625], loss: 1.137, per_step_time: 1469ms, lr: 1.2264772e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:00,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.44353 samples/s/p 2:33:25 } +2024-07-25 22:38:03,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 238/ 1625], loss: 1.280, per_step_time: 1472ms, lr: 1.2258699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:03,916 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43341 samples/s/p 2:33:39 } +2024-07-25 22:38:06,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 240/ 1625], loss: 1.173, per_step_time: 1473ms, lr: 1.2252626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:06,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43098 samples/s/p 2:33:41 } +2024-07-25 22:38:09,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 242/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 1.2246556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:09,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.44018 samples/s/p 2:33:22 } +2024-07-25 22:38:12,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 244/ 1625], loss: 1.029, per_step_time: 1472ms, lr: 1.2240485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:12,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43459 samples/s/p 2:33:29 } +2024-07-25 22:38:15,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 246/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 1.2234417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:15,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43178 samples/s/p 2:33:30 } +2024-07-25 22:38:18,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 248/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.2228347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:18,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% 
|██████████████████████████████ | 5.43771 samples/s/p 2:33:17 } +2024-07-25 22:38:21,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 250/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 1.222228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:21,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43524 samples/s/p 2:33:19 } +2024-07-25 22:38:24,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 252/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 1.2216211e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:24,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43461 samples/s/p 2:33:17 } +2024-07-25 22:38:27,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 254/ 1625], loss: 1.171, per_step_time: 1485ms, lr: 1.2210142e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:27,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.38674 samples/s/p 2:34:36 } +2024-07-25 22:38:30,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 256/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 1.22040765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:30,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43705 samples/s/p 2:33:07 } +2024-07-25 22:38:33,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 258/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 1.2198011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:33,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43341 samples/s/p 2:33:10 } +2024-07-25 22:38:36,401 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 260/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 1.2191943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:36,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43846 samples/s/p 2:32:59 } +2024-07-25 22:38:39,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 262/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 1.218588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:39,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43177 samples/s/p 2:33:07 } +2024-07-25 22:38:42,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 264/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.21798175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:42,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43607 samples/s/p 2:32:57 } +2024-07-25 22:38:45,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 266/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 1.2173752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:45,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43097 samples/s/p 2:33:02 } +2024-07-25 22:38:48,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 268/ 1625], loss: 1.041, per_step_time: 1470ms, lr: 1.2167689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:48,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43893 samples/s/p 2:32:46 } +2024-07-25 22:38:51,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], 
step:[ 270/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 1.2161628e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:51,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.44171 samples/s/p 2:32:38 } +2024-07-25 22:38:54,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 272/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.2155563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:54,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43540 samples/s/p 2:32:46 } +2024-07-25 22:38:57,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 274/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 1.2149503e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:57,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43312 samples/s/p 2:32:47 } +2024-07-25 22:39:00,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 276/ 1625], loss: 1.289, per_step_time: 1471ms, lr: 1.2143444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:00,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43826 samples/s/p 2:32:35 } +2024-07-25 22:39:02,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 278/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 1.2137382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:02,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43848 samples/s/p 2:32:32 } +2024-07-25 22:39:05,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 280/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.2131324e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:39:05,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43684 samples/s/p 2:32:32 } +2024-07-25 22:39:08,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 282/ 1625], loss: 0.942, per_step_time: 1471ms, lr: 1.2125265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:08,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43619 samples/s/p 2:32:30 } +2024-07-25 22:39:11,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 284/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 1.2119205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:11,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43595 samples/s/p 2:32:27 } +2024-07-25 22:39:14,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 286/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 1.2113149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:14,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.42857 samples/s/p 2:32:37 } +2024-07-25 22:39:17,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 288/ 1625], loss: 1.149, per_step_time: 1473ms, lr: 1.2107092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:17,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.42996 samples/s/p 2:32:32 } +2024-07-25 22:39:20,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 290/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 1.2101034e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:20,668 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.43415 samples/s/p 2:32:22 } +2024-07-25 22:39:23,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 292/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 1.209498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:23,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.43412 samples/s/p 2:32:19 } +2024-07-25 22:39:26,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 294/ 1625], loss: 1.100, per_step_time: 1473ms, lr: 1.2088927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:26,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.42797 samples/s/p 2:32:26 } +2024-07-25 22:39:29,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 296/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.2082872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:29,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.43620 samples/s/p 2:32:09 } +2024-07-25 22:39:32,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 298/ 1625], loss: 1.039, per_step_time: 1472ms, lr: 1.2076816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:32,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.43253 samples/s/p 2:32:13 } +2024-07-25 22:39:35,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 300/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 1.20707655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:35,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% 
|██████████████████████████████ | 5.43691 samples/s/p 2:32:02 } +2024-07-25 22:39:38,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 302/ 1625], loss: 1.079, per_step_time: 1471ms, lr: 1.2064713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:38,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.43663 samples/s/p 2:32:00 } +2024-07-25 22:39:41,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 304/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.2058658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:41,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.43611 samples/s/p 2:31:58 } +2024-07-25 22:39:44,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 306/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 1.2052609e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:44,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.43475 samples/s/p 2:31:57 } +2024-07-25 22:39:47,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 308/ 1625], loss: 1.281, per_step_time: 1473ms, lr: 1.204656e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:47,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.42972 samples/s/p 2:32:03 } +2024-07-25 22:39:50,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 310/ 1625], loss: 1.238, per_step_time: 1469ms, lr: 1.2040508e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:50,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.44291 samples/s/p 2:31:38 } +2024-07-25 22:39:53,129 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 312/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 1.2034459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:53,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.43557 samples/s/p 2:31:47 } +2024-07-25 22:39:56,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 314/ 1625], loss: 1.315, per_step_time: 1470ms, lr: 1.2028412e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:56,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.44052 samples/s/p 2:31:36 } +2024-07-25 22:39:59,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 316/ 1625], loss: 1.227, per_step_time: 1473ms, lr: 1.2022362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:59,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.42967 samples/s/p 2:31:51 } +2024-07-25 22:40:01,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 318/ 1625], loss: 0.986, per_step_time: 1471ms, lr: 1.2016315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:01,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.43701 samples/s/p 2:31:36 } +2024-07-25 22:40:04,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 320/ 1625], loss: 1.050, per_step_time: 1470ms, lr: 1.20102695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:04,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.44074 samples/s/p 2:31:26 } +2024-07-25 22:40:07,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
322/ 1625], loss: 1.316, per_step_time: 1473ms, lr: 1.2004221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:07,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.43046 samples/s/p 2:31:41 } +2024-07-25 22:40:10,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 324/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 1.1998178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:10,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.43197 samples/s/p 2:31:35 } +2024-07-25 22:40:13,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 326/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 1.1992133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:13,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.43780 samples/s/p 2:31:23 } +2024-07-25 22:40:16,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 328/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 1.1986087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:16,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.43376 samples/s/p 2:31:26 } +2024-07-25 22:40:19,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 330/ 1625], loss: 1.036, per_step_time: 1472ms, lr: 1.1980044e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:19,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.43455 samples/s/p 2:31:22 } +2024-07-25 22:40:22,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 332/ 1625], loss: 1.238, per_step_time: 1474ms, lr: 1.1974002e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:40:22,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.42737 samples/s/p 2:31:31 } +2024-07-25 22:40:25,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 334/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.1967958e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:25,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43361 samples/s/p 2:31:18 } +2024-07-25 22:40:28,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 336/ 1625], loss: 1.379, per_step_time: 1472ms, lr: 1.1961917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:28,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43416 samples/s/p 2:31:14 } +2024-07-25 22:40:31,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 338/ 1625], loss: 0.951, per_step_time: 1471ms, lr: 1.1955879e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:31,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43696 samples/s/p 2:31:06 } +2024-07-25 22:40:34,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 340/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 1.1949837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:34,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43505 samples/s/p 2:31:07 } +2024-07-25 22:40:37,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 342/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 1.1943797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:37,400 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43533 samples/s/p 2:31:03 } +2024-07-25 22:40:40,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 344/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 1.1937759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:40,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43243 samples/s/p 2:31:05 } +2024-07-25 22:40:43,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 346/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 1.1931721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:43,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43266 samples/s/p 2:31:02 } +2024-07-25 22:40:46,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 348/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.1925681e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:46,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43618 samples/s/p 2:30:53 } +2024-07-25 22:40:49,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 350/ 1625], loss: 1.044, per_step_time: 1473ms, lr: 1.1919647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:49,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.42910 samples/s/p 2:31:02 } +2024-07-25 22:40:52,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 352/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 1.1913612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:52,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% 
|███████████████████████████████ | 5.43333 samples/s/p 2:30:52 } +2024-07-25 22:40:55,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 354/ 1625], loss: 1.036, per_step_time: 1472ms, lr: 1.1907574e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:55,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43421 samples/s/p 2:30:47 } +2024-07-25 22:40:58,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 356/ 1625], loss: 1.104, per_step_time: 1469ms, lr: 1.1901539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:58,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.44220 samples/s/p 2:30:31 } +2024-07-25 22:41:01,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 358/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.1895506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:01,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43178 samples/s/p 2:30:46 } +2024-07-25 22:41:03,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 360/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 1.1889471e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:03,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43701 samples/s/p 2:30:34 } +2024-07-25 22:41:06,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 362/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 1.1883438e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:06,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43639 samples/s/p 2:30:32 } +2024-07-25 
22:41:09,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 364/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 1.1877407e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:09,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43193 samples/s/p 2:30:36 } +2024-07-25 22:41:12,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 366/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 1.1871373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:12,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43463 samples/s/p 2:30:29 } +2024-07-25 22:41:15,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 368/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 1.1865344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:15,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43507 samples/s/p 2:30:25 } +2024-07-25 22:41:18,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 370/ 1625], loss: 1.003, per_step_time: 1472ms, lr: 1.1859313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:18,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43399 samples/s/p 2:30:24 } +2024-07-25 22:41:21,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 372/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 1.1853283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:21,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43870 samples/s/p 2:30:13 } +2024-07-25 22:41:24,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 374/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 1.1847255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:24,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43163 samples/s/p 2:30:22 } +2024-07-25 22:41:27,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 376/ 1625], loss: 0.970, per_step_time: 1472ms, lr: 1.1841228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:27,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43423 samples/s/p 2:30:15 } +2024-07-25 22:41:30,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 378/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 1.1835199e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:30,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43156 samples/s/p 2:30:16 } +2024-07-25 22:41:33,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 380/ 1625], loss: 1.070, per_step_time: 1473ms, lr: 1.1829171e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:33,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.42814 samples/s/p 2:30:19 } +2024-07-25 22:41:36,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 382/ 1625], loss: 1.006, per_step_time: 1471ms, lr: 1.1823147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:36,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43791 samples/s/p 2:30:00 } +2024-07-25 22:41:39,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 384/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 
1.181712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:39,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43870 samples/s/p 2:29:56 } +2024-07-25 22:41:42,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 386/ 1625], loss: 1.296, per_step_time: 1471ms, lr: 1.1811094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:42,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43712 samples/s/p 2:29:55 } +2024-07-25 22:41:45,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 388/ 1625], loss: 1.060, per_step_time: 1468ms, lr: 1.1805072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:45,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.44634 samples/s/p 2:29:37 } +2024-07-25 22:41:48,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 390/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 1.1799047e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:48,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43396 samples/s/p 2:29:55 } +2024-07-25 22:41:51,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 392/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 1.1793026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:51,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43555 samples/s/p 2:29:49 } +2024-07-25 22:41:54,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 394/ 1625], loss: 1.350, per_step_time: 1471ms, lr: 1.1787003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:54,127 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43525 samples/s/p 2:29:47 } +2024-07-25 22:41:57,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 396/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 1.1780983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:57,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43428 samples/s/p 2:29:45 } +2024-07-25 22:42:00,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 398/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.1774961e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:00,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43142 samples/s/p 2:29:47 } +2024-07-25 22:42:02,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 400/ 1625], loss: 1.342, per_step_time: 1472ms, lr: 1.1768941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:02,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43166 samples/s/p 2:29:44 } +2024-07-25 22:42:05,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 402/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 1.17629215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:05,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43747 samples/s/p 2:29:31 } +2024-07-25 22:42:08,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 404/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.17569025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:08,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% 
|███████████████████████████████ | 5.43492 samples/s/p 2:29:33 } +2024-07-25 22:42:11,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 406/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 1.1750886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:11,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43309 samples/s/p 2:29:33 } +2024-07-25 22:42:14,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 408/ 1625], loss: 1.109, per_step_time: 1469ms, lr: 1.1744868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:14,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.44302 samples/s/p 2:29:13 } +2024-07-25 22:42:17,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 410/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 1.173885e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:17,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.44054 samples/s/p 2:29:14 } +2024-07-25 22:42:20,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 412/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 1.17328345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:20,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43231 samples/s/p 2:29:25 } +2024-07-25 22:42:23,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 414/ 1625], loss: 1.055, per_step_time: 1471ms, lr: 1.1726819e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:23,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43630 samples/s/p 2:29:16 } +2024-07-25 
22:42:26,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 416/ 1625], loss: 1.134, per_step_time: 1482ms, lr: 1.1720804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:26,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.39632 samples/s/p 2:30:19 } +2024-07-25 22:42:29,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 418/ 1625], loss: 1.040, per_step_time: 1471ms, lr: 1.1714791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:29,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.43713 samples/s/p 2:29:08 } +2024-07-25 22:42:32,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 420/ 1625], loss: 1.119, per_step_time: 1473ms, lr: 1.1708779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:32,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.42820 samples/s/p 2:29:20 } +2024-07-25 22:42:35,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 422/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 1.1702766e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:35,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.43167 samples/s/p 2:29:11 } +2024-07-25 22:42:38,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 424/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 1.1696753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:38,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.43644 samples/s/p 2:29:01 } +2024-07-25 22:42:41,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 426/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.1690743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:41,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.43471 samples/s/p 2:29:01 } +2024-07-25 22:42:44,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 428/ 1625], loss: 1.312, per_step_time: 1477ms, lr: 1.1684731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:44,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.41582 samples/s/p 2:29:29 } +2024-07-25 22:42:47,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 430/ 1625], loss: 1.188, per_step_time: 1470ms, lr: 1.1678721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:47,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.44005 samples/s/p 2:28:46 } +2024-07-25 22:42:50,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 432/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 1.1672715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:50,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43488 samples/s/p 2:28:51 } +2024-07-25 22:42:53,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 434/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.1666704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:53,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43336 samples/s/p 2:28:51 } +2024-07-25 22:42:56,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 436/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 
1.1660698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:56,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43422 samples/s/p 2:28:47 } +2024-07-25 22:42:59,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 438/ 1625], loss: 1.297, per_step_time: 1472ms, lr: 1.1654692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:59,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43466 samples/s/p 2:28:43 } +2024-07-25 22:43:02,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 440/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 1.16486835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:02,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43526 samples/s/p 2:28:39 } +2024-07-25 22:43:04,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 442/ 1625], loss: 1.134, per_step_time: 1470ms, lr: 1.164268e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:04,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43891 samples/s/p 2:28:30 } +2024-07-25 22:43:07,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 444/ 1625], loss: 0.998, per_step_time: 1472ms, lr: 1.1636675e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:07,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43454 samples/s/p 2:28:34 } +2024-07-25 22:43:10,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 446/ 1625], loss: 1.330, per_step_time: 1471ms, lr: 1.1630674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:10,881 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43513 samples/s/p 2:28:30 } +2024-07-25 22:43:13,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 448/ 1625], loss: 1.176, per_step_time: 1472ms, lr: 1.1624667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:13,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43216 samples/s/p 2:28:32 } +2024-07-25 22:43:16,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 450/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 1.1618667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:16,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43291 samples/s/p 2:28:28 } +2024-07-25 22:43:19,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 452/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.1612665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:19,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43696 samples/s/p 2:28:19 } +2024-07-25 22:43:22,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 454/ 1625], loss: 1.051, per_step_time: 1470ms, lr: 1.1606662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:22,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.44002 samples/s/p 2:28:11 } +2024-07-25 22:43:25,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 456/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 1.1600662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:25,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% 
|███████████████████████████████ | 5.44080 samples/s/p 2:28:06 } +2024-07-25 22:43:28,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 458/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 1.1594662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:28,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43141 samples/s/p 2:28:19 } +2024-07-25 22:43:31,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 460/ 1625], loss: 1.064, per_step_time: 1470ms, lr: 1.1588663e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:31,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43938 samples/s/p 2:28:03 } +2024-07-25 22:43:34,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 462/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 1.1582666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:34,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43811 samples/s/p 2:28:02 } +2024-07-25 22:43:37,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 464/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 1.157667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:37,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.44112 samples/s/p 2:27:54 } +2024-07-25 22:43:40,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 466/ 1625], loss: 1.144, per_step_time: 1470ms, lr: 1.1570671e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:40,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.44027 samples/s/p 2:27:53 } +2024-07-25 
22:43:43,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 468/ 1625], loss: 1.305, per_step_time: 1474ms, lr: 1.1564674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:43,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.42521 samples/s/p 2:28:14 } +2024-07-25 22:43:46,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 470/ 1625], loss: 1.021, per_step_time: 1469ms, lr: 1.1558682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:46,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.44318 samples/s/p 2:27:42 } +2024-07-25 22:43:49,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 472/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.15526855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:49,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.43280 samples/s/p 2:27:56 } +2024-07-25 22:43:52,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 474/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.1546691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:52,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.43490 samples/s/p 2:27:50 } +2024-07-25 22:43:55,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 476/ 1625], loss: 1.129, per_step_time: 1473ms, lr: 1.1540699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:55,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.43090 samples/s/p 2:27:53 } +2024-07-25 22:43:58,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 478/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 1.1534705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:58,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.43780 samples/s/p 2:27:39 } +2024-07-25 22:44:01,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 480/ 1625], loss: 1.042, per_step_time: 1471ms, lr: 1.1528715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:01,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43541 samples/s/p 2:27:40 } +2024-07-25 22:44:03,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 482/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 1.1522724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:03,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43773 samples/s/p 2:27:33 } +2024-07-25 22:44:06,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 484/ 1625], loss: 1.166, per_step_time: 1470ms, lr: 1.1516731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:06,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.44002 samples/s/p 2:27:27 } +2024-07-25 22:44:09,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 486/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 1.1510744e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:09,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43489 samples/s/p 2:27:32 } +2024-07-25 22:44:12,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 488/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 
1.1504755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:12,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43898 samples/s/p 2:27:22 } +2024-07-25 22:44:15,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 490/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.1498765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:15,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43315 samples/s/p 2:27:29 } +2024-07-25 22:44:18,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 492/ 1625], loss: 1.266, per_step_time: 1473ms, lr: 1.149278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:18,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.42906 samples/s/p 2:27:33 } +2024-07-25 22:44:21,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 494/ 1625], loss: 1.193, per_step_time: 1473ms, lr: 1.1486794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:21,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43104 samples/s/p 2:27:26 } +2024-07-25 22:44:24,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 496/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 1.1480808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:24,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.43525 samples/s/p 2:27:17 } +2024-07-25 22:44:27,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 498/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 1.1474822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:27,601 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.43035 samples/s/p 2:27:22 } +2024-07-25 22:44:30,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 500/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 1.1468839e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:30,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.43005 samples/s/p 2:27:19 } +2024-07-25 22:44:33,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 502/ 1625], loss: 1.107, per_step_time: 1473ms, lr: 1.1462855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:33,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.42891 samples/s/p 2:27:18 } +2024-07-25 22:44:36,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 504/ 1625], loss: 1.083, per_step_time: 1473ms, lr: 1.1456871e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:36,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.42928 samples/s/p 2:27:15 } +2024-07-25 22:44:39,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 506/ 1625], loss: 1.135, per_step_time: 1482ms, lr: 1.145089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:39,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.39695 samples/s/p 2:28:05 } +2024-07-25 22:44:42,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 508/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 1.144491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:42,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% 
|███████████████████████████████ | 5.43001 samples/s/p 2:27:07 } +2024-07-25 22:44:45,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 510/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 1.1438929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:45,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.43282 samples/s/p 2:27:00 } +2024-07-25 22:44:48,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 512/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 1.1432948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:48,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43715 samples/s/p 2:26:50 } +2024-07-25 22:44:51,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 514/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 1.1426971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:51,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43442 samples/s/p 2:26:51 } +2024-07-25 22:44:54,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 516/ 1625], loss: 1.334, per_step_time: 1470ms, lr: 1.142099e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:54,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.44132 samples/s/p 2:26:37 } +2024-07-25 22:44:57,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 518/ 1625], loss: 1.101, per_step_time: 1469ms, lr: 1.14150125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:57,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.44344 samples/s/p 2:26:31 } +2024-07-25 
22:45:00,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 520/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 1.1409037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:00,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43489 samples/s/p 2:26:42 } +2024-07-25 22:45:03,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 522/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 1.140306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:03,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43889 samples/s/p 2:26:32 } +2024-07-25 22:45:05,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 524/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.1397086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:05,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43759 samples/s/p 2:26:32 } +2024-07-25 22:45:08,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 526/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 1.1391111e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:08,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43540 samples/s/p 2:26:32 } +2024-07-25 22:45:11,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 528/ 1625], loss: 1.398, per_step_time: 1471ms, lr: 1.1385136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:11,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43652 samples/s/p 2:26:27 } +2024-07-25 22:45:14,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 530/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 1.1379165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:14,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.44105 samples/s/p 2:26:17 } +2024-07-25 22:45:17,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 532/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 1.1373192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:17,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.43959 samples/s/p 2:26:17 } +2024-07-25 22:45:20,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 534/ 1625], loss: 1.329, per_step_time: 1472ms, lr: 1.136722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:20,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.43381 samples/s/p 2:26:23 } +2024-07-25 22:45:23,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 536/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.136125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:23,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.43315 samples/s/p 2:26:21 } +2024-07-25 22:45:26,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 538/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 1.13552815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:26,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.42768 samples/s/p 2:26:27 } +2024-07-25 22:45:29,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 540/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 
1.134931e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:29,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.43151 samples/s/p 2:26:18 } +2024-07-25 22:45:32,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 542/ 1625], loss: 1.105, per_step_time: 1469ms, lr: 1.1343341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:32,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.44268 samples/s/p 2:25:57 } +2024-07-25 22:45:35,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 544/ 1625], loss: 1.318, per_step_time: 1472ms, lr: 1.1337375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:35,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.43235 samples/s/p 2:26:11 } +2024-07-25 22:45:38,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 546/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 1.1331409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:38,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43103 samples/s/p 2:26:10 } +2024-07-25 22:45:41,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 548/ 1625], loss: 1.302, per_step_time: 1471ms, lr: 1.1325442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:41,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43725 samples/s/p 2:25:57 } +2024-07-25 22:45:44,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 550/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 1.13194765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:44,348 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43154 samples/s/p 2:26:03 } +2024-07-25 22:45:47,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 552/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.1313513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:47,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43827 samples/s/p 2:25:49 } +2024-07-25 22:45:50,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 554/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 1.13075475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:50,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43533 samples/s/p 2:25:51 } +2024-07-25 22:45:53,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 556/ 1625], loss: 1.206, per_step_time: 1470ms, lr: 1.1301585e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:53,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43957 samples/s/p 2:25:41 } +2024-07-25 22:45:56,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 558/ 1625], loss: 1.312, per_step_time: 1473ms, lr: 1.1295624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:56,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43080 samples/s/p 2:25:53 } +2024-07-25 22:45:59,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 560/ 1625], loss: 1.206, per_step_time: 1472ms, lr: 1.1289661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:59,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% 
|███████████████████████████████ | 5.43311 samples/s/p 2:25:46 } +2024-07-25 22:46:02,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 562/ 1625], loss: 1.105, per_step_time: 1470ms, lr: 1.12837015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:02,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.44158 samples/s/p 2:25:29 } +2024-07-25 22:46:05,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 564/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 1.1277741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:05,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43341 samples/s/p 2:25:40 } +2024-07-25 22:46:07,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 566/ 1625], loss: 1.033, per_step_time: 1472ms, lr: 1.127178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:07,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43382 samples/s/p 2:25:36 } +2024-07-25 22:46:10,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 568/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 1.1265823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:10,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43805 samples/s/p 2:25:26 } +2024-07-25 22:46:13,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 570/ 1625], loss: 1.018, per_step_time: 1471ms, lr: 1.1259866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:13,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43743 samples/s/p 2:25:24 } +2024-07-25 
22:46:16,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 572/ 1625], loss: 1.291, per_step_time: 1472ms, lr: 1.1253907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:16,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43449 samples/s/p 2:25:26 } +2024-07-25 22:46:19,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 574/ 1625], loss: 1.051, per_step_time: 1470ms, lr: 1.1247953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:19,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43918 samples/s/p 2:25:16 } +2024-07-25 22:46:22,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 576/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 1.1241998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:22,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43672 samples/s/p 2:25:17 } +2024-07-25 22:46:25,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 578/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 1.1236043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:25,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.42755 samples/s/p 2:25:28 } +2024-07-25 22:46:28,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 580/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.1230089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:28,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43425 samples/s/p 2:25:15 } +2024-07-25 22:46:31,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 582/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 1.1224138e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:31,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.42909 samples/s/p 2:25:20 } +2024-07-25 22:46:34,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 584/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.1218183e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:34,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43403 samples/s/p 2:25:09 } +2024-07-25 22:46:37,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 586/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 1.12122325e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:37,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43251 samples/s/p 2:25:09 } +2024-07-25 22:46:40,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 588/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.12062835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:40,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43768 samples/s/p 2:24:57 } +2024-07-25 22:46:43,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 590/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 1.1200332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:43,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43092 samples/s/p 2:25:05 } +2024-07-25 22:46:46,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 592/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 
1.1194385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:46,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43496 samples/s/p 2:24:56 } +2024-07-25 22:46:49,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 594/ 1625], loss: 0.902, per_step_time: 1469ms, lr: 1.11884365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:49,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.44580 samples/s/p 2:24:36 } +2024-07-25 22:46:52,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 596/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.118249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:52,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.43663 samples/s/p 2:24:47 } +2024-07-25 22:46:55,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 598/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 1.1176542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:55,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.43920 samples/s/p 2:24:40 } +2024-07-25 22:46:58,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 600/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 1.1170596e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:58,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.43093 samples/s/p 2:24:50 } +2024-07-25 22:47:01,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 602/ 1625], loss: 1.317, per_step_time: 1474ms, lr: 1.1164652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:01,074 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.42611 samples/s/p 2:24:55 } +2024-07-25 22:47:04,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 604/ 1625], loss: 1.273, per_step_time: 1473ms, lr: 1.1158707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:04,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.43018 samples/s/p 2:24:46 } +2024-07-25 22:47:06,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 606/ 1625], loss: 1.083, per_step_time: 1470ms, lr: 1.1152764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:06,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.43983 samples/s/p 2:24:27 } +2024-07-25 22:47:09,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 608/ 1625], loss: 1.287, per_step_time: 1470ms, lr: 1.1146822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:09,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.44043 samples/s/p 2:24:24 } +2024-07-25 22:47:12,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 610/ 1625], loss: 1.255, per_step_time: 1472ms, lr: 1.1140879e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:12,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43165 samples/s/p 2:24:35 } +2024-07-25 22:47:15,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 612/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.1134939e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:15,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% 
|███████████████████████████████ | 5.43685 samples/s/p 2:24:23 } +2024-07-25 22:47:18,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 614/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 1.1128999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:18,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43695 samples/s/p 2:24:20 } +2024-07-25 22:47:21,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 616/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.1123058e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:21,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43317 samples/s/p 2:24:23 } +2024-07-25 22:47:24,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 618/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.111712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:24,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43330 samples/s/p 2:24:20 } +2024-07-25 22:47:27,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 620/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 1.1111185e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:27,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43309 samples/s/p 2:24:18 } +2024-07-25 22:47:30,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 622/ 1625], loss: 1.071, per_step_time: 1470ms, lr: 1.1105246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:30,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43926 samples/s/p 2:24:05 } +2024-07-25 
22:47:33,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 624/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 1.109931e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:33,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43547 samples/s/p 2:24:08 } +2024-07-25 22:47:36,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 626/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 1.1093375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:36,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43215 samples/s/p 2:24:10 } +2024-07-25 22:47:39,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 628/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.108744e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:39,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43156 samples/s/p 2:24:08 } +2024-07-25 22:47:42,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 630/ 1625], loss: 0.976, per_step_time: 1469ms, lr: 1.1081505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:42,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.44248 samples/s/p 2:23:48 } +2024-07-25 22:47:45,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 632/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 1.10755755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:45,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43564 samples/s/p 2:23:56 } +2024-07-25 22:47:48,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 634/ 1625], loss: 1.039, per_step_time: 1472ms, lr: 1.1069641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:48,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43473 samples/s/p 2:23:54 } +2024-07-25 22:47:51,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 636/ 1625], loss: 1.036, per_step_time: 1471ms, lr: 1.1063711e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:51,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43534 samples/s/p 2:23:50 } +2024-07-25 22:47:54,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 638/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.105778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:54,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.44060 samples/s/p 2:23:39 } +2024-07-25 22:47:57,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 640/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 1.10518495e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:57,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43500 samples/s/p 2:23:45 } +2024-07-25 22:48:00,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 642/ 1625], loss: 1.280, per_step_time: 1472ms, lr: 1.1045922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:00,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.43294 samples/s/p 2:23:45 } +2024-07-25 22:48:03,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 644/ 1625], loss: 1.153, per_step_time: 1482ms, lr: 
1.1039994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:03,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.39509 samples/s/p 2:24:43 } +2024-07-25 22:48:06,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 646/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 1.1034069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:06,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.43439 samples/s/p 2:23:37 } +2024-07-25 22:48:08,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 648/ 1625], loss: 1.085, per_step_time: 1469ms, lr: 1.1028141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:08,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.44412 samples/s/p 2:23:19 } +2024-07-25 22:48:11,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 650/ 1625], loss: 1.193, per_step_time: 1470ms, lr: 1.1022217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:11,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43911 samples/s/p 2:23:24 } +2024-07-25 22:48:14,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 652/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 1.1016292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:14,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43281 samples/s/p 2:23:31 } +2024-07-25 22:48:17,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 654/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 1.10103665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:17,812 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43080 samples/s/p 2:23:31 } +2024-07-25 22:48:20,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 656/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 1.1004445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:20,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43821 samples/s/p 2:23:16 } +2024-07-25 22:48:23,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 658/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.0998522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:23,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43298 samples/s/p 2:23:22 } +2024-07-25 22:48:26,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 660/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 1.09926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:26,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43402 samples/s/p 2:23:17 } +2024-07-25 22:48:29,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 662/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 1.098668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:29,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43690 samples/s/p 2:23:10 } +2024-07-25 22:48:32,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 664/ 1625], loss: 1.258, per_step_time: 1471ms, lr: 1.0980762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:32,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% 
|████████████████████████████████ | 5.43525 samples/s/p 2:23:09 } +2024-07-25 22:48:35,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 666/ 1625], loss: 1.298, per_step_time: 1471ms, lr: 1.0974843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:35,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43519 samples/s/p 2:23:07 } +2024-07-25 22:48:38,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 668/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.0968924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:38,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43701 samples/s/p 2:23:01 } +2024-07-25 22:48:41,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 670/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 1.0963008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:41,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.44162 samples/s/p 2:22:50 } +2024-07-25 22:48:44,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 672/ 1625], loss: 1.151, per_step_time: 1473ms, lr: 1.095709e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:44,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.42992 samples/s/p 2:23:06 } +2024-07-25 22:48:47,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 674/ 1625], loss: 1.031, per_step_time: 1471ms, lr: 1.0951174e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:47,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43521 samples/s/p 2:22:55 } +2024-07-25 
22:48:50,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 676/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 1.0945262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:50,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43490 samples/s/p 2:22:52 } +2024-07-25 22:48:53,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 678/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.0939346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:53,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43828 samples/s/p 2:22:44 } +2024-07-25 22:48:56,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 680/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 1.0933434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:56,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43367 samples/s/p 2:22:48 } +2024-07-25 22:48:59,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 682/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 1.0927522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:59,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43049 samples/s/p 2:22:50 } +2024-07-25 22:49:02,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 684/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 1.0921609e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:02,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43486 samples/s/p 2:22:41 } +2024-07-25 22:49:05,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 7/ 10], step:[ 686/ 1625], loss: 1.262, per_step_time: 1472ms, lr: 1.0915701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:05,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43131 samples/s/p 2:22:43 } +2024-07-25 22:49:07,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 688/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.0909791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:07,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43271 samples/s/p 2:22:38 } +2024-07-25 22:49:10,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 690/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.0903882e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:10,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43699 samples/s/p 2:22:28 } +2024-07-25 22:49:13,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 692/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 1.0897974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:13,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43883 samples/s/p 2:22:23 } +2024-07-25 22:49:16,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 694/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.08920685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:16,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43640 samples/s/p 2:22:23 } +2024-07-25 22:49:19,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 696/ 1625], loss: 1.368, per_step_time: 1472ms, lr: 
1.088616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:19,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43458 samples/s/p 2:22:23 } +2024-07-25 22:49:22,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 698/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 1.0880255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:22,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43579 samples/s/p 2:22:18 } +2024-07-25 22:49:25,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 700/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 1.0874353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:25,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43536 samples/s/p 2:22:16 } +2024-07-25 22:49:28,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 702/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 1.086845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:28,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43273 samples/s/p 2:22:17 } +2024-07-25 22:49:31,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 704/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.0862545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:31,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43448 samples/s/p 2:22:12 } +2024-07-25 22:49:34,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 706/ 1625], loss: 1.132, per_step_time: 1473ms, lr: 1.0856644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:34,539 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43078 samples/s/p 2:22:15 } +2024-07-25 22:49:37,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 708/ 1625], loss: 1.209, per_step_time: 1473ms, lr: 1.0850745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:37,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.42947 samples/s/p 2:22:14 } +2024-07-25 22:49:40,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 710/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 1.0844842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:40,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.43843 samples/s/p 2:21:57 } +2024-07-25 22:49:43,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 712/ 1625], loss: 1.160, per_step_time: 1470ms, lr: 1.0838942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:43,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.43867 samples/s/p 2:21:53 } +2024-07-25 22:49:46,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 714/ 1625], loss: 1.252, per_step_time: 1473ms, lr: 1.0833046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:46,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.42886 samples/s/p 2:22:06 } +2024-07-25 22:49:49,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 716/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 1.0827147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:49,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% 
|████████████████████████████████ | 5.43384 samples/s/p 2:21:55 } +2024-07-25 22:49:52,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 718/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 1.0821252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:52,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.43734 samples/s/p 2:21:47 } +2024-07-25 22:49:55,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 720/ 1625], loss: 1.165, per_step_time: 1469ms, lr: 1.08153545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:55,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.44578 samples/s/p 2:21:30 } +2024-07-25 22:49:58,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 722/ 1625], loss: 1.249, per_step_time: 1470ms, lr: 1.0809458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:58,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.43947 samples/s/p 2:21:37 } +2024-07-25 22:50:01,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 724/ 1625], loss: 1.125, per_step_time: 1473ms, lr: 1.0803566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:01,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43085 samples/s/p 2:21:48 } +2024-07-25 22:50:04,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 726/ 1625], loss: 0.949, per_step_time: 1472ms, lr: 1.0797673e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:04,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43252 samples/s/p 2:21:42 } +2024-07-25 
22:50:06,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 728/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 1.0791779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:06,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43385 samples/s/p 2:21:37 } +2024-07-25 22:50:09,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 730/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.0785889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:09,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43841 samples/s/p 2:21:27 } +2024-07-25 22:50:12,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 732/ 1625], loss: 1.101, per_step_time: 1474ms, lr: 1.0779999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:12,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.42602 samples/s/p 2:21:44 } +2024-07-25 22:50:15,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 734/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.0774107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:15,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.44012 samples/s/p 2:21:19 } +2024-07-25 22:50:18,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 736/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 1.0768219e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:18,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43084 samples/s/p 2:21:30 } +2024-07-25 22:50:21,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 7/ 10], step:[ 738/ 1625], loss: 1.001, per_step_time: 1470ms, lr: 1.0762332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:21,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.44085 samples/s/p 2:21:12 } +2024-07-25 22:50:24,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 740/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.0756443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:24,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43598 samples/s/p 2:21:16 } +2024-07-25 22:50:27,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 742/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 1.0750557e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:27,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43169 samples/s/p 2:21:20 } +2024-07-25 22:50:30,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 744/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 1.0744673e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:30,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43692 samples/s/p 2:21:09 } +2024-07-25 22:50:33,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 746/ 1625], loss: 1.217, per_step_time: 1473ms, lr: 1.0738787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:33,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.42903 samples/s/p 2:21:18 } +2024-07-25 22:50:36,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 748/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 
1.0732904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:36,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43337 samples/s/p 2:21:09 } +2024-07-25 22:50:39,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 750/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.0727022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:39,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43636 samples/s/p 2:21:01 } +2024-07-25 22:50:42,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 752/ 1625], loss: 1.028, per_step_time: 1472ms, lr: 1.0721141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:42,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43280 samples/s/p 2:21:04 } +2024-07-25 22:50:45,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 754/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 1.0715258e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:45,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43637 samples/s/p 2:20:55 } +2024-07-25 22:50:48,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 756/ 1625], loss: 0.860, per_step_time: 1471ms, lr: 1.0709378e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:48,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.43848 samples/s/p 2:20:49 } +2024-07-25 22:50:51,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 758/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 1.07035e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:51,270 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.42993 samples/s/p 2:20:59 } +2024-07-25 22:50:54,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 760/ 1625], loss: 1.199, per_step_time: 1469ms, lr: 1.069762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:54,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.44226 samples/s/p 2:20:37 } +2024-07-25 22:50:57,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 762/ 1625], loss: 1.022, per_step_time: 1473ms, lr: 1.0691743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:57,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.43022 samples/s/p 2:20:53 } +2024-07-25 22:51:00,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 764/ 1625], loss: 1.092, per_step_time: 1473ms, lr: 1.0685868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:00,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.42996 samples/s/p 2:20:50 } +2024-07-25 22:51:03,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 766/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 1.067999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:03,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.43244 samples/s/p 2:20:44 } +2024-07-25 22:51:06,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 768/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 1.0674116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:06,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% 
|████████████████████████████████ | 5.42910 samples/s/p 2:20:46 } +2024-07-25 22:51:08,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 770/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 1.0668243e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:08,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.43197 samples/s/p 2:20:38 } +2024-07-25 22:51:11,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 772/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 1.0662368e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:11,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43777 samples/s/p 2:20:26 } +2024-07-25 22:51:14,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 774/ 1625], loss: 1.005, per_step_time: 1472ms, lr: 1.0656497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:14,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43283 samples/s/p 2:20:31 } +2024-07-25 22:51:17,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 776/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 1.0650628e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:17,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43117 samples/s/p 2:20:31 } +2024-07-25 22:51:20,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 778/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.0644755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:20,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43786 samples/s/p 2:20:18 } +2024-07-25 
22:51:23,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 780/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 1.0638886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:23,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43028 samples/s/p 2:20:26 } +2024-07-25 22:51:26,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 782/ 1625], loss: 0.979, per_step_time: 1471ms, lr: 1.0633018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:26,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43577 samples/s/p 2:20:15 } +2024-07-25 22:51:29,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 784/ 1625], loss: 1.250, per_step_time: 1473ms, lr: 1.062715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:29,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43103 samples/s/p 2:20:19 } +2024-07-25 22:51:32,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 786/ 1625], loss: 1.246, per_step_time: 1473ms, lr: 1.0621283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:32,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43013 samples/s/p 2:20:18 } +2024-07-25 22:51:35,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 788/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 1.0615418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:35,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43216 samples/s/p 2:20:12 } +2024-07-25 22:51:38,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 790/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 1.0609552e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:38,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43497 samples/s/p 2:20:04 } +2024-07-25 22:51:41,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 792/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 1.0603689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:41,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43755 samples/s/p 2:19:57 } +2024-07-25 22:51:44,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 794/ 1625], loss: 1.330, per_step_time: 1473ms, lr: 1.0597825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:44,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43094 samples/s/p 2:20:05 } +2024-07-25 22:51:47,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 796/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.0591963e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:47,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43224 samples/s/p 2:20:00 } +2024-07-25 22:51:50,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 798/ 1625], loss: 1.408, per_step_time: 1472ms, lr: 1.0586102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:50,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43332 samples/s/p 2:19:55 } +2024-07-25 22:51:53,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 800/ 1625], loss: 0.949, per_step_time: 1471ms, lr: 
1.0580241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:53,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43697 samples/s/p 2:19:47 } +2024-07-25 22:51:56,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 802/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 1.0574383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:56,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43380 samples/s/p 2:19:48 } +2024-07-25 22:51:59,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 804/ 1625], loss: 1.417, per_step_time: 1471ms, lr: 1.0568523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:59,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43703 samples/s/p 2:19:41 } +2024-07-25 22:52:02,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 806/ 1625], loss: 1.361, per_step_time: 1472ms, lr: 1.0562667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:02,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43149 samples/s/p 2:19:46 } +2024-07-25 22:52:05,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 808/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 1.055681e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:05,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43537 samples/s/p 2:19:37 } +2024-07-25 22:52:08,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 810/ 1625], loss: 0.900, per_step_time: 1470ms, lr: 1.05509525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:08,013 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.44008 samples/s/p 2:19:27 } +2024-07-25 22:52:10,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 812/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 1.0545098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:10,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43579 samples/s/p 2:19:31 } +2024-07-25 22:52:13,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 814/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 1.0539245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:13,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43285 samples/s/p 2:19:32 } +2024-07-25 22:52:16,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 816/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 1.0533389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:16,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43673 samples/s/p 2:19:23 } +2024-07-25 22:52:19,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 818/ 1625], loss: 1.343, per_step_time: 1471ms, lr: 1.05275385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:19,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43558 samples/s/p 2:19:22 } +2024-07-25 22:52:22,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 820/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 1.0521689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:22,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% 
|████████████████████████████████ | 5.43847 samples/s/p 2:19:15 } +2024-07-25 22:52:25,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 822/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.0515838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:25,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43496 samples/s/p 2:19:17 } +2024-07-25 22:52:28,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 824/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 1.0509987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:28,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43355 samples/s/p 2:19:16 } +2024-07-25 22:52:31,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 826/ 1625], loss: 1.294, per_step_time: 1474ms, lr: 1.0504141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:31,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.42543 samples/s/p 2:19:26 } +2024-07-25 22:52:34,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 828/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 1.0498291e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:34,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43225 samples/s/p 2:19:13 } +2024-07-25 22:52:37,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 830/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 1.0492444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:37,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43572 samples/s/p 2:19:04 } +2024-07-25 
22:52:40,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 832/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 1.0486599e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:40,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43512 samples/s/p 2:19:02 } +2024-07-25 22:52:43,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 834/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 1.0480753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:43,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43708 samples/s/p 2:18:56 } +2024-07-25 22:52:46,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 836/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.04749115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:46,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43951 samples/s/p 2:18:50 } +2024-07-25 22:52:49,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 838/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 1.0469068e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:49,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43551 samples/s/p 2:18:53 } +2024-07-25 22:52:52,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 840/ 1625], loss: 1.130, per_step_time: 1470ms, lr: 1.04632245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:52,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43867 samples/s/p 2:18:45 } +2024-07-25 22:52:55,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 7/ 10], step:[ 842/ 1625], loss: 1.301, per_step_time: 1470ms, lr: 1.0457384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:55,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43910 samples/s/p 2:18:41 } +2024-07-25 22:52:58,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 844/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 1.0451544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:58,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.44066 samples/s/p 2:18:36 } +2024-07-25 22:53:01,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 846/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 1.0445704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:01,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43581 samples/s/p 2:18:41 } +2024-07-25 22:53:04,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 848/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.0439867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:04,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43818 samples/s/p 2:18:34 } +2024-07-25 22:53:07,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 850/ 1625], loss: 1.063, per_step_time: 1469ms, lr: 1.043403e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:07,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.44315 samples/s/p 2:18:24 } +2024-07-25 22:53:09,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 852/ 1625], loss: 1.396, per_step_time: 1472ms, lr: 
1.0428194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:09,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43407 samples/s/p 2:18:34 } +2024-07-25 22:53:12,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 854/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.0422356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:12,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43526 samples/s/p 2:18:30 } +2024-07-25 22:53:15,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 856/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 1.0416523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:15,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43897 samples/s/p 2:18:21 } +2024-07-25 22:53:18,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 858/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 1.0410689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:18,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43452 samples/s/p 2:18:25 } +2024-07-25 22:53:21,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 860/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 1.0404857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:21,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43552 samples/s/p 2:18:20 } +2024-07-25 22:53:24,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 862/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 1.0399025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:24,720 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.44052 samples/s/p 2:18:10 } +2024-07-25 22:53:27,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 864/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.0393195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:27,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43780 samples/s/p 2:18:11 } +2024-07-25 22:53:30,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 866/ 1625], loss: 1.066, per_step_time: 1472ms, lr: 1.03873645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:30,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43157 samples/s/p 2:18:18 } +2024-07-25 22:53:33,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 868/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.0381535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:33,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43539 samples/s/p 2:18:09 } +2024-07-25 22:53:36,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 870/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.03757075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:36,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.43409 samples/s/p 2:18:08 } +2024-07-25 22:53:39,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 872/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 1.036988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:39,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% 
|████████████████████████████████ | 5.43742 samples/s/p 2:18:00 } +2024-07-25 22:53:42,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 874/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 1.0364055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:42,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.43853 samples/s/p 2:17:55 } +2024-07-25 22:53:45,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 876/ 1625], loss: 1.165, per_step_time: 1469ms, lr: 1.035823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:45,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.44344 samples/s/p 2:17:45 } +2024-07-25 22:53:48,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 878/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 1.03524035e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:48,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.43742 samples/s/p 2:17:51 } +2024-07-25 22:53:51,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 880/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 1.0346582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:51,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.44124 samples/s/p 2:17:42 } +2024-07-25 22:53:54,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 882/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 1.0340759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:54,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.44165 samples/s/p 2:17:39 } +2024-07-25 
22:53:57,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 884/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 1.0334936e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:57,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.43321 samples/s/p 2:17:49 } +2024-07-25 22:54:00,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 886/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 1.0329118e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:00,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43385 samples/s/p 2:17:45 } +2024-07-25 22:54:03,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 888/ 1625], loss: 1.220, per_step_time: 1473ms, lr: 1.03233e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:03,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43031 samples/s/p 2:17:47 } +2024-07-25 22:54:06,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 890/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 1.031748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:06,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43486 samples/s/p 2:17:37 } +2024-07-25 22:54:08,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 892/ 1625], loss: 0.970, per_step_time: 1472ms, lr: 1.0311662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:08,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43159 samples/s/p 2:17:39 } +2024-07-25 22:54:11,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 894/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 1.0305846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:11,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43202 samples/s/p 2:17:36 } +2024-07-25 22:54:14,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 896/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 1.0300029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:14,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.44186 samples/s/p 2:17:18 } +2024-07-25 22:54:17,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 898/ 1625], loss: 1.080, per_step_time: 1473ms, lr: 1.0294214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:17,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43037 samples/s/p 2:17:32 } +2024-07-25 22:54:20,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 900/ 1625], loss: 1.331, per_step_time: 1473ms, lr: 1.0288402e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:20,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.42838 samples/s/p 2:17:32 } +2024-07-25 22:54:23,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 902/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 1.0282591e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:23,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43777 samples/s/p 2:17:15 } +2024-07-25 22:54:26,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 904/ 1625], loss: 1.455, per_step_time: 1470ms, lr: 
1.0276777e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:26,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.44109 samples/s/p 2:17:07 } +2024-07-25 22:54:29,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 906/ 1625], loss: 1.311, per_step_time: 1471ms, lr: 1.0270966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:29,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43642 samples/s/p 2:17:11 } +2024-07-25 22:54:32,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 908/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 1.0265158e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:32,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.44014 samples/s/p 2:17:03 } +2024-07-25 22:54:35,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 910/ 1625], loss: 1.239, per_step_time: 1473ms, lr: 1.0259348e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:35,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43038 samples/s/p 2:17:15 } +2024-07-25 22:54:38,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 912/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 1.025354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:38,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43559 samples/s/p 2:17:04 } +2024-07-25 22:54:41,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 914/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 1.0247734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:41,436 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43300 samples/s/p 2:17:05 } +2024-07-25 22:54:44,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 916/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 1.0241926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:44,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.44118 samples/s/p 2:16:49 } +2024-07-25 22:54:47,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 918/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 1.0236123e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:47,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.44210 samples/s/p 2:16:45 } +2024-07-25 22:54:50,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 920/ 1625], loss: 1.292, per_step_time: 1471ms, lr: 1.0230318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:50,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43492 samples/s/p 2:16:53 } +2024-07-25 22:54:53,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 922/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 1.0224514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:53,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43987 samples/s/p 2:16:43 } +2024-07-25 22:54:56,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 924/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 1.0218713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:56,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% 
|████████████████████████████████ | 5.43126 samples/s/p 2:16:53 } +2024-07-25 22:54:59,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 926/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 1.0212912e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:59,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43446 samples/s/p 2:16:45 } +2024-07-25 22:55:02,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 928/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.020711e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:02,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43722 samples/s/p 2:16:38 } +2024-07-25 22:55:05,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 930/ 1625], loss: 1.301, per_step_time: 1471ms, lr: 1.0201312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:05,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43701 samples/s/p 2:16:35 } +2024-07-25 22:55:07,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 932/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 1.0195516e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:07,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43677 samples/s/p 2:16:33 } +2024-07-25 22:55:10,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 934/ 1625], loss: 1.258, per_step_time: 1475ms, lr: 1.0189717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:10,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.42216 samples/s/p 2:16:52 } +2024-07-25 
22:55:13,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 936/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 1.01839205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:13,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43051 samples/s/p 2:16:36 } +2024-07-25 22:55:16,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 938/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 1.0178127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:16,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43450 samples/s/p 2:16:27 } +2024-07-25 22:55:19,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 940/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 1.017233e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:19,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43487 samples/s/p 2:16:24 } +2024-07-25 22:55:22,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 942/ 1625], loss: 1.010, per_step_time: 1471ms, lr: 1.0166537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:22,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43597 samples/s/p 2:16:19 } +2024-07-25 22:55:25,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 944/ 1625], loss: 1.362, per_step_time: 1473ms, lr: 1.0160747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:25,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.42979 samples/s/p 2:16:25 } +2024-07-25 22:55:28,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 7/ 10], step:[ 946/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 1.0154953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:28,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.44038 samples/s/p 2:16:07 } +2024-07-25 22:55:31,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 948/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 1.0149164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:31,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43391 samples/s/p 2:16:13 } +2024-07-25 22:55:34,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 950/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 1.0143374e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:34,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43803 samples/s/p 2:16:04 } +2024-07-25 22:55:37,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 952/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.0137587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:37,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43672 samples/s/p 2:16:03 } +2024-07-25 22:55:40,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 954/ 1625], loss: 1.328, per_step_time: 1470ms, lr: 1.0131798e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:40,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.44119 samples/s/p 2:15:54 } +2024-07-25 22:55:43,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 956/ 1625], loss: 1.227, per_step_time: 1473ms, lr: 
1.0126013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:43,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43079 samples/s/p 2:16:06 } +2024-07-25 22:55:46,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 958/ 1625], loss: 1.029, per_step_time: 1470ms, lr: 1.0120229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:46,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43879 samples/s/p 2:15:51 } +2024-07-25 22:55:49,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 960/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 1.0114442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:49,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43504 samples/s/p 2:15:54 } +2024-07-25 22:55:52,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 962/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.0108661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:52,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43459 samples/s/p 2:15:52 } +2024-07-25 22:55:55,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 964/ 1625], loss: 1.234, per_step_time: 1469ms, lr: 1.0102878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:55,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.44264 samples/s/p 2:15:37 } +2024-07-25 22:55:58,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 966/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 1.0097095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:58,151 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43650 samples/s/p 2:15:43 } +2024-07-25 22:56:01,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 968/ 1625], loss: 1.263, per_step_time: 1470ms, lr: 1.0091317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:01,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.44044 samples/s/p 2:15:34 } +2024-07-25 22:56:04,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 970/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 1.0085536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:04,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.43419 samples/s/p 2:15:41 } +2024-07-25 22:56:07,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 972/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 1.0079756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:07,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.43364 samples/s/p 2:15:38 } +2024-07-25 22:56:09,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 974/ 1625], loss: 1.064, per_step_time: 1470ms, lr: 1.0073981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:09,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.43863 samples/s/p 2:15:28 } +2024-07-25 22:56:12,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 976/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.00682055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:12,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% 
|█████████████████████████████████ | 5.43440 samples/s/p 2:15:31 } +2024-07-25 22:56:15,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 978/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 1.0062429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:15,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.43831 samples/s/p 2:15:23 } +2024-07-25 22:56:18,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 980/ 1625], loss: 0.984, per_step_time: 1472ms, lr: 1.0056654e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:18,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.43393 samples/s/p 2:15:26 } +2024-07-25 22:56:21,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 982/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 1.0050881e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:21,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.43190 samples/s/p 2:15:26 } +2024-07-25 22:56:24,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 984/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 1.0045107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:24,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43567 samples/s/p 2:15:18 } +2024-07-25 22:56:27,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 986/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.0039336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:27,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43477 samples/s/p 2:15:16 } 
+2024-07-25 22:56:30,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 988/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 1.0033567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:30,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43383 samples/s/p 2:15:15 } +2024-07-25 22:56:33,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 990/ 1625], loss: 1.237, per_step_time: 1473ms, lr: 1.0027797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:33,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.42901 samples/s/p 2:15:19 } +2024-07-25 22:56:36,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 992/ 1625], loss: 1.053, per_step_time: 1472ms, lr: 1.00220295e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:36,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43115 samples/s/p 2:15:13 } +2024-07-25 22:56:39,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 994/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 1.00162615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:39,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43115 samples/s/p 2:15:10 } +2024-07-25 22:56:42,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 996/ 1625], loss: 1.059, per_step_time: 1471ms, lr: 1.00104935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:42,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43758 samples/s/p 2:14:57 } +2024-07-25 22:56:45,370 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 998/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 1.0004731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:45,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43539 samples/s/p 2:14:58 } +2024-07-25 22:56:48,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1000/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 9.998966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:48,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43794 samples/s/p 2:14:51 } +2024-07-25 22:56:51,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1002/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 9.993204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:51,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.44126 samples/s/p 2:14:43 } +2024-07-25 22:56:54,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1004/ 1625], loss: 1.277, per_step_time: 1471ms, lr: 9.9874405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:54,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43730 samples/s/p 2:14:46 } +2024-07-25 22:56:57,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1006/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 9.981681e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:57,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43558 samples/s/p 2:14:45 } +2024-07-25 22:57:00,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
7/ 10], step:[ 1008/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 9.975919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:00,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43170 samples/s/p 2:14:48 } +2024-07-25 22:57:03,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1010/ 1625], loss: 1.025, per_step_time: 1472ms, lr: 9.970159e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:03,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43112 samples/s/p 2:14:46 } +2024-07-25 22:57:06,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1012/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 9.964402e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:06,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43979 samples/s/p 2:14:30 } +2024-07-25 22:57:08,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1014/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 9.958644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:08,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43475 samples/s/p 2:14:35 } +2024-07-25 22:57:11,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1016/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 9.952889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:11,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43796 samples/s/p 2:14:27 } +2024-07-25 22:57:14,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1018/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 
9.9471345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:14,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43682 samples/s/p 2:14:26 } +2024-07-25 22:57:17,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1020/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 9.941381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:17,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43591 samples/s/p 2:14:24 } +2024-07-25 22:57:20,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1022/ 1625], loss: 1.217, per_step_time: 1470ms, lr: 9.935626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:20,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43954 samples/s/p 2:14:16 } +2024-07-25 22:57:23,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1024/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 9.929874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:23,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43287 samples/s/p 2:14:23 } +2024-07-25 22:57:26,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1026/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 9.924124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:26,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43390 samples/s/p 2:14:19 } +2024-07-25 22:57:29,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1028/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 9.918373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:57:29,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43312 samples/s/p 2:14:17 } +2024-07-25 22:57:32,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1030/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 9.9126255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:32,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43765 samples/s/p 2:14:07 } +2024-07-25 22:57:35,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1032/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 9.906877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:35,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43300 samples/s/p 2:14:11 } +2024-07-25 22:57:38,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1034/ 1625], loss: 1.413, per_step_time: 1471ms, lr: 9.901129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:38,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43622 samples/s/p 2:14:03 } +2024-07-25 22:57:41,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1036/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 9.895383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:41,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43837 samples/s/p 2:13:57 } +2024-07-25 22:57:44,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1038/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 9.88964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:44,379 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 66.4% |█████████████████████████████████ | 5.43409 samples/s/p 2:14:01 } +2024-07-25 22:57:47,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1040/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 9.883894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:47,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43417 samples/s/p 2:13:58 } +2024-07-25 22:57:50,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1042/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 9.878152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:50,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43653 samples/s/p 2:13:51 } +2024-07-25 22:57:53,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1044/ 1625], loss: 1.017, per_step_time: 1472ms, lr: 9.872412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:53,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43452 samples/s/p 2:13:51 } +2024-07-25 22:57:56,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1046/ 1625], loss: 1.119, per_step_time: 1473ms, lr: 9.866669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:56,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.42798 samples/s/p 2:13:58 } +2024-07-25 22:57:59,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1048/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 9.860931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:59,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43365 samples/s/p 
2:13:47 } +2024-07-25 22:58:02,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1050/ 1625], loss: 0.856, per_step_time: 1471ms, lr: 9.855194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:02,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43820 samples/s/p 2:13:37 } +2024-07-25 22:58:05,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1052/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 9.849455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:05,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43803 samples/s/p 2:13:34 } +2024-07-25 22:58:07,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1054/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 9.843717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:07,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43312 samples/s/p 2:13:38 } +2024-07-25 22:58:10,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1056/ 1625], loss: 1.144, per_step_time: 1469ms, lr: 9.837982e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:10,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.44253 samples/s/p 2:13:22 } +2024-07-25 22:58:13,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1058/ 1625], loss: 1.321, per_step_time: 1472ms, lr: 9.83225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:13,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43437 samples/s/p 2:13:31 } +2024-07-25 22:58:16,839 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1060/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 9.826515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:16,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43468 samples/s/p 2:13:27 } +2024-07-25 22:58:19,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1062/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 9.820782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:19,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43290 samples/s/p 2:13:27 } +2024-07-25 22:58:22,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1064/ 1625], loss: 1.202, per_step_time: 1472ms, lr: 9.815052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:22,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43250 samples/s/p 2:13:25 } +2024-07-25 22:58:25,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1066/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 9.8093205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:25,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.44053 samples/s/p 2:13:10 } +2024-07-25 22:58:28,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1068/ 1625], loss: 1.151, per_step_time: 1475ms, lr: 9.803592e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:28,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.42315 samples/s/p 2:13:33 } +2024-07-25 22:58:31,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
7/ 10], step:[ 1070/ 1625], loss: 1.212, per_step_time: 1472ms, lr: 9.797865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:31,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43200 samples/s/p 2:13:17 } +2024-07-25 22:58:34,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1072/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 9.792137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:34,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43830 samples/s/p 2:13:04 } +2024-07-25 22:58:37,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1074/ 1625], loss: 1.028, per_step_time: 1471ms, lr: 9.786411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:37,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43595 samples/s/p 2:13:05 } +2024-07-25 22:58:40,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1076/ 1625], loss: 1.238, per_step_time: 1476ms, lr: 9.780687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:40,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.41892 samples/s/p 2:13:27 } +2024-07-25 22:58:43,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1078/ 1625], loss: 0.977, per_step_time: 1471ms, lr: 9.774961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:43,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43675 samples/s/p 2:12:58 } +2024-07-25 22:58:46,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1080/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 
9.769238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:46,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43679 samples/s/p 2:12:55 } +2024-07-25 22:58:49,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1082/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 9.7635175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:49,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.43572 samples/s/p 2:12:53 } +2024-07-25 22:58:52,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1084/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 9.757795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:52,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.43680 samples/s/p 2:12:49 } +2024-07-25 22:58:55,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1086/ 1625], loss: 1.128, per_step_time: 1470ms, lr: 9.752076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:55,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.44039 samples/s/p 2:12:41 } +2024-07-25 22:58:58,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1088/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 9.74636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:58,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.44136 samples/s/p 2:12:36 } +2024-07-25 22:59:01,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1090/ 1625], loss: 1.035, per_step_time: 1470ms, lr: 9.74064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:59:01,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.44091 samples/s/p 2:12:34 } +2024-07-25 22:59:04,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1092/ 1625], loss: 0.914, per_step_time: 1470ms, lr: 9.734924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:04,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.44125 samples/s/p 2:12:31 } +2024-07-25 22:59:07,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1094/ 1625], loss: 1.004, per_step_time: 1471ms, lr: 9.72921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:07,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.43641 samples/s/p 2:12:35 } +2024-07-25 22:59:09,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1096/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 9.723492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:09,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.43479 samples/s/p 2:12:34 } +2024-07-25 22:59:12,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1098/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 9.71778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:12,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.43147 samples/s/p 2:12:36 } +2024-07-25 22:59:15,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1100/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 9.712069e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:15,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 66.8% |█████████████████████████████████ | 5.43438 samples/s/p 2:12:29 } +2024-07-25 22:59:18,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1102/ 1625], loss: 1.088, per_step_time: 1473ms, lr: 9.706359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:18,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.43043 samples/s/p 2:12:32 } +2024-07-25 22:59:21,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1104/ 1625], loss: 1.245, per_step_time: 1474ms, lr: 9.700648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:21,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.42556 samples/s/p 2:12:36 } +2024-07-25 22:59:24,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1106/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 9.694939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:24,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.43144 samples/s/p 2:12:24 } +2024-07-25 22:59:27,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1108/ 1625], loss: 1.100, per_step_time: 1475ms, lr: 9.689233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:27,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.42264 samples/s/p 2:12:34 } +2024-07-25 22:59:30,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1110/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 9.683524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:30,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.43392 samples/s/p 2:12:15 } 
+2024-07-25 22:59:33,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1112/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 9.677818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:33,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.43427 samples/s/p 2:12:11 } +2024-07-25 22:59:36,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1114/ 1625], loss: 1.146, per_step_time: 1470ms, lr: 9.672114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:36,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43881 samples/s/p 2:12:02 } +2024-07-25 22:59:39,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1116/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 9.66641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:39,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43719 samples/s/p 2:12:01 } +2024-07-25 22:59:42,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1118/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 9.660708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:42,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43575 samples/s/p 2:12:00 } +2024-07-25 22:59:45,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1120/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 9.655007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:45,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43743 samples/s/p 2:11:55 } +2024-07-25 22:59:48,331 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1122/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 9.649304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:48,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43556 samples/s/p 2:11:55 } +2024-07-25 22:59:51,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1124/ 1625], loss: 1.076, per_step_time: 1470ms, lr: 9.643607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:51,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43870 samples/s/p 2:11:47 } +2024-07-25 22:59:54,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1126/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 9.637908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:54,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.42855 samples/s/p 2:11:59 } +2024-07-25 22:59:57,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1128/ 1625], loss: 1.062, per_step_time: 1473ms, lr: 9.632209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:57,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.42827 samples/s/p 2:11:57 } +2024-07-25 23:00:00,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1130/ 1625], loss: 1.277, per_step_time: 1472ms, lr: 9.626515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:00,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43131 samples/s/p 2:11:49 } +2024-07-25 23:00:03,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
7/ 10], step:[ 1132/ 1625], loss: 1.204, per_step_time: 1470ms, lr: 9.620821e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:03,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43951 samples/s/p 2:11:34 } +2024-07-25 23:00:06,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1134/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 9.615126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:06,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43220 samples/s/p 2:11:42 } +2024-07-25 23:00:09,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1136/ 1625], loss: 1.150, per_step_time: 1474ms, lr: 9.609432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:09,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.42673 samples/s/p 2:11:47 } +2024-07-25 23:00:11,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1138/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 9.603742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:11,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43888 samples/s/p 2:11:26 } +2024-07-25 23:00:14,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1140/ 1625], loss: 0.999, per_step_time: 1471ms, lr: 9.5980495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:14,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43717 samples/s/p 2:11:26 } +2024-07-25 23:00:17,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1142/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 
9.592361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:17,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43688 samples/s/p 2:11:23 } +2024-07-25 23:00:20,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1144/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 9.586673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:20,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43145 samples/s/p 2:11:28 } +2024-07-25 23:00:23,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1146/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 9.580984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:23,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.43010 samples/s/p 2:11:27 } +2024-07-25 23:00:26,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1148/ 1625], loss: 1.032, per_step_time: 1471ms, lr: 9.5752985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:26,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.43800 samples/s/p 2:11:13 } +2024-07-25 23:00:29,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1150/ 1625], loss: 1.355, per_step_time: 1470ms, lr: 9.569613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:29,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.43911 samples/s/p 2:11:08 } +2024-07-25 23:00:32,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1152/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 9.563931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:00:32,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.42969 samples/s/p 2:11:19 } +2024-07-25 23:00:35,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1154/ 1625], loss: 1.064, per_step_time: 1469ms, lr: 9.558246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:35,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.44249 samples/s/p 2:10:58 } +2024-07-25 23:00:38,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1156/ 1625], loss: 0.959, per_step_time: 1472ms, lr: 9.552564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:38,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.43198 samples/s/p 2:11:10 } +2024-07-25 23:00:41,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1158/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 9.546885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:41,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.43230 samples/s/p 2:11:07 } +2024-07-25 23:00:44,415 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1160/ 1625], loss: 1.109, per_step_time: 1473ms, lr: 9.541203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:44,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.42843 samples/s/p 2:11:09 } +2024-07-25 23:00:47,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1162/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 9.535527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:47,364 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 67.2% |█████████████████████████████████ | 5.43821 samples/s/p 2:10:52 } +2024-07-25 23:00:50,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1164/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 9.529848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:50,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43374 samples/s/p 2:10:56 } +2024-07-25 23:00:53,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1166/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 9.52417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:53,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43184 samples/s/p 2:10:55 } +2024-07-25 23:00:56,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1168/ 1625], loss: 1.204, per_step_time: 1473ms, lr: 9.518497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:56,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.42823 samples/s/p 2:10:58 } +2024-07-25 23:00:59,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1170/ 1625], loss: 1.179, per_step_time: 1469ms, lr: 9.5128225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:59,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.44309 samples/s/p 2:10:33 } +2024-07-25 23:01:02,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1172/ 1625], loss: 1.204, per_step_time: 1470ms, lr: 9.507149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:02,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43853 samples/s/p 
2:10:37 } +2024-07-25 23:01:05,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1174/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 9.5014775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:05,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43537 samples/s/p 2:10:39 } +2024-07-25 23:01:08,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1176/ 1625], loss: 0.935, per_step_time: 1469ms, lr: 9.495808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:08,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.44572 samples/s/p 2:10:21 } +2024-07-25 23:01:10,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1178/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 9.490135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:10,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43533 samples/s/p 2:10:33 } +2024-07-25 23:01:13,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1180/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 9.484467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:13,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43466 samples/s/p 2:10:31 } +2024-07-25 23:01:16,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1182/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 9.478801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:16,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43547 samples/s/p 2:10:27 } +2024-07-25 23:01:19,821 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1184/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 9.473134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:19,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43058 samples/s/p 2:10:31 } +2024-07-25 23:01:22,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1186/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 9.46747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:22,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43556 samples/s/p 2:10:21 } +2024-07-25 23:01:25,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1188/ 1625], loss: 1.081, per_step_time: 1470ms, lr: 9.461806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:25,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43941 samples/s/p 2:10:12 } +2024-07-25 23:01:28,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1190/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 9.45614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:28,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43303 samples/s/p 2:10:18 } +2024-07-25 23:01:31,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1192/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 9.450478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:31,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.42794 samples/s/p 2:10:23 } +2024-07-25 23:01:34,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 
10], step:[ 1194/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 9.4448205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:34,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43365 samples/s/p 2:10:12 } +2024-07-25 23:01:37,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1196/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 9.439157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:37,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43713 samples/s/p 2:10:04 } +2024-07-25 23:01:40,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1198/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 9.433498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:40,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43639 samples/s/p 2:10:02 } +2024-07-25 23:01:43,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1200/ 1625], loss: 1.250, per_step_time: 1473ms, lr: 9.427843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:43,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.42865 samples/s/p 2:10:10 } +2024-07-25 23:01:46,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1202/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 9.422187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:46,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43572 samples/s/p 2:09:57 } +2024-07-25 23:01:49,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1204/ 1625], loss: 1.308, per_step_time: 1471ms, lr: 
9.416531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:49,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43680 samples/s/p 2:09:52 } +2024-07-25 23:01:52,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1206/ 1625], loss: 1.291, per_step_time: 1473ms, lr: 9.410877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:52,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.42865 samples/s/p 2:10:01 } +2024-07-25 23:01:55,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1208/ 1625], loss: 0.939, per_step_time: 1472ms, lr: 9.405225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:55,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43324 samples/s/p 2:09:52 } +2024-07-25 23:01:58,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1210/ 1625], loss: 0.981, per_step_time: 1471ms, lr: 9.399572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:58,200 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43631 samples/s/p 2:09:44 } +2024-07-25 23:02:01,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1212/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 9.393922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:01,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43444 samples/s/p 2:09:44 } +2024-07-25 23:02:04,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1214/ 1625], loss: 1.097, per_step_time: 1470ms, lr: 9.388271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:02:04,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.44179 samples/s/p 2:09:30 } +2024-07-25 23:02:07,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1216/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 9.382622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:07,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43452 samples/s/p 2:09:38 } +2024-07-25 23:02:09,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1218/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 9.376975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:09,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.44160 samples/s/p 2:09:25 } +2024-07-25 23:02:12,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1220/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 9.371329e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:12,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43826 samples/s/p 2:09:27 } +2024-07-25 23:02:15,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1222/ 1625], loss: 1.106, per_step_time: 1470ms, lr: 9.365684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:15,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43978 samples/s/p 2:09:22 } +2024-07-25 23:02:18,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1224/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 9.36004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:18,845 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 67.5% |█████████████████████████████████ | 5.43643 samples/s/p 2:09:23 } +2024-07-25 23:02:21,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1226/ 1625], loss: 0.925, per_step_time: 1471ms, lr: 9.354397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:21,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43718 samples/s/p 2:09:19 } +2024-07-25 23:02:24,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1228/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 9.348755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:24,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43967 samples/s/p 2:09:13 } +2024-07-25 23:02:27,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1230/ 1625], loss: 0.979, per_step_time: 1469ms, lr: 9.3431145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:27,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.44353 samples/s/p 2:09:04 } +2024-07-25 23:02:30,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1232/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 9.337477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:30,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.44011 samples/s/p 2:09:06 } +2024-07-25 23:02:33,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1234/ 1625], loss: 1.056, per_step_time: 1473ms, lr: 9.331837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:33,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43069 samples/s/p 
2:09:17 } +2024-07-25 23:02:36,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1236/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 9.326199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:36,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43231 samples/s/p 2:09:12 } +2024-07-25 23:02:39,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1238/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 9.320565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:39,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43195 samples/s/p 2:09:09 } +2024-07-25 23:02:42,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1240/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 9.314927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:42,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43543 samples/s/p 2:09:01 } +2024-07-25 23:02:45,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1242/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 9.309294e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:45,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43198 samples/s/p 2:09:03 } +2024-07-25 23:02:48,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1244/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 9.303664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:48,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43576 samples/s/p 2:08:55 } +2024-07-25 23:02:51,301 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1246/ 1625], loss: 1.291, per_step_time: 1472ms, lr: 9.29803e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:51,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43465 samples/s/p 2:08:54 } +2024-07-25 23:02:54,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1248/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 9.292402e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:54,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43765 samples/s/p 2:08:46 } +2024-07-25 23:02:57,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1250/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 9.286772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:57,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43598 samples/s/p 2:08:46 } +2024-07-25 23:03:00,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1252/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 9.281144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:00,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43099 samples/s/p 2:08:50 } +2024-07-25 23:03:03,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1254/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 9.275517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:03,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43954 samples/s/p 2:08:35 } +2024-07-25 23:03:06,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
7/ 10], step:[ 1256/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 9.269891e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:06,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.44060 samples/s/p 2:08:30 } +2024-07-25 23:03:09,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1258/ 1625], loss: 1.270, per_step_time: 1473ms, lr: 9.264267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:09,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.42969 samples/s/p 2:08:43 } +2024-07-25 23:03:11,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1260/ 1625], loss: 1.134, per_step_time: 1470ms, lr: 9.258643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:11,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43902 samples/s/p 2:08:27 } +2024-07-25 23:03:14,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1262/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 9.25302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:14,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43144 samples/s/p 2:08:35 } +2024-07-25 23:03:17,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1264/ 1625], loss: 1.306, per_step_time: 1470ms, lr: 9.247399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:17,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43852 samples/s/p 2:08:22 } +2024-07-25 23:03:20,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1266/ 1625], loss: 1.116, per_step_time: 1469ms, lr: 
9.2417795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:20,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.44219 samples/s/p 2:08:13 } +2024-07-25 23:03:23,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1268/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 9.236161e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:23,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43440 samples/s/p 2:08:22 } +2024-07-25 23:03:26,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1270/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 9.230546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:26,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43448 samples/s/p 2:08:18 } +2024-07-25 23:03:29,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1272/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 9.2249265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:29,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43785 samples/s/p 2:08:11 } +2024-07-25 23:03:32,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1274/ 1625], loss: 1.331, per_step_time: 1471ms, lr: 9.21931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:32,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43838 samples/s/p 2:08:07 } +2024-07-25 23:03:35,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1276/ 1625], loss: 1.114, per_step_time: 1473ms, lr: 9.2137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:03:35,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.42917 samples/s/p 2:08:17 } +2024-07-25 23:03:38,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1278/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 9.208084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:38,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43524 samples/s/p 2:08:06 } +2024-07-25 23:03:41,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1280/ 1625], loss: 1.120, per_step_time: 1470ms, lr: 9.202471e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:41,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43922 samples/s/p 2:07:57 } +2024-07-25 23:03:44,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1282/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 9.196864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:44,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43560 samples/s/p 2:07:59 } +2024-07-25 23:03:47,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1284/ 1625], loss: 1.076, per_step_time: 1472ms, lr: 9.191251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:47,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43425 samples/s/p 2:07:58 } +2024-07-25 23:03:50,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1286/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 9.1856455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:50,312 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 67.9% |█████████████████████████████████ | 5.43412 samples/s/p 2:07:55 } +2024-07-25 23:03:53,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1288/ 1625], loss: 1.146, per_step_time: 1475ms, lr: 9.180038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:53,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.42342 samples/s/p 2:08:08 } +2024-07-25 23:03:56,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1290/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 9.174429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:56,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43131 samples/s/p 2:07:54 } +2024-07-25 23:03:59,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1292/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 9.168827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:59,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.43252 samples/s/p 2:07:49 } +2024-07-25 23:04:02,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1294/ 1625], loss: 1.087, per_step_time: 1473ms, lr: 9.163223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:02,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.42923 samples/s/p 2:07:51 } +2024-07-25 23:04:05,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1296/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 9.157618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:05,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.43597 samples/s/p 
2:07:38 } +2024-07-25 23:04:08,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1298/ 1625], loss: 1.007, per_step_time: 1470ms, lr: 9.152019e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:08,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.43866 samples/s/p 2:07:31 } +2024-07-25 23:04:10,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1300/ 1625], loss: 1.401, per_step_time: 1471ms, lr: 9.146418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:10,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43812 samples/s/p 2:07:29 } +2024-07-25 23:04:13,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1302/ 1625], loss: 1.007, per_step_time: 1472ms, lr: 9.140819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:13,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43475 samples/s/p 2:07:31 } +2024-07-25 23:04:16,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1304/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 9.13522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:16,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43479 samples/s/p 2:07:28 } +2024-07-25 23:04:19,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1306/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 9.129623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:19,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43472 samples/s/p 2:07:25 } +2024-07-25 23:04:22,783 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1308/ 1625], loss: 0.967, per_step_time: 1472ms, lr: 9.124028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:22,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43117 samples/s/p 2:07:27 } +2024-07-25 23:04:25,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1310/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 9.118434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:25,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.44050 samples/s/p 2:07:11 } +2024-07-25 23:04:28,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1312/ 1625], loss: 1.311, per_step_time: 1472ms, lr: 9.112841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:28,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43335 samples/s/p 2:07:18 } +2024-07-25 23:04:31,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1314/ 1625], loss: 1.136, per_step_time: 1470ms, lr: 9.107252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:31,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43980 samples/s/p 2:07:06 } +2024-07-25 23:04:34,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1316/ 1625], loss: 1.073, per_step_time: 1472ms, lr: 9.101657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:34,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43290 samples/s/p 2:07:13 } +2024-07-25 23:04:37,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 1318/ 1625], loss: 1.202, per_step_time: 1470ms, lr: 9.0960675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:37,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43861 samples/s/p 2:07:02 } +2024-07-25 23:04:40,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1320/ 1625], loss: 1.109, per_step_time: 1474ms, lr: 9.090482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:40,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.42417 samples/s/p 2:07:19 } +2024-07-25 23:04:43,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1322/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 9.084893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:43,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43503 samples/s/p 2:07:01 } +2024-07-25 23:04:46,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1324/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 9.079306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:46,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43201 samples/s/p 2:07:02 } +2024-07-25 23:04:49,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1326/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 9.073725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:49,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43568 samples/s/p 2:06:54 } +2024-07-25 23:04:52,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1328/ 1625], loss: 1.125, per_step_time: 
1472ms, lr: 9.068137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:52,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43225 samples/s/p 2:06:56 } +2024-07-25 23:04:55,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1330/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 9.062558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:55,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43585 samples/s/p 2:06:48 } +2024-07-25 23:04:58,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1332/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 9.056976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:58,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.44114 samples/s/p 2:06:38 } +2024-07-25 23:05:01,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1334/ 1625], loss: 1.368, per_step_time: 1471ms, lr: 9.051393e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:01,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43556 samples/s/p 2:06:43 } +2024-07-25 23:05:04,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1336/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 9.045816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:04,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43710 samples/s/p 2:06:38 } +2024-07-25 23:05:07,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1338/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 9.040239e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:05:07,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43194 samples/s/p 2:06:42 } +2024-07-25 23:05:09,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1340/ 1625], loss: 0.975, per_step_time: 1471ms, lr: 9.034659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:10,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43511 samples/s/p 2:06:35 } +2024-07-25 23:05:12,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1342/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 9.029087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:12,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43599 samples/s/p 2:06:30 } +2024-07-25 23:05:15,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1344/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 9.023513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:15,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43464 samples/s/p 2:06:29 } +2024-07-25 23:05:18,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1346/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 9.017939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:18,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43757 samples/s/p 2:06:22 } +2024-07-25 23:05:21,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1348/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 9.012367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:21,802 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43591 samples/s/p 2:06:22 } +2024-07-25 23:05:24,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1350/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 9.006797e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:24,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43775 samples/s/p 2:06:16 } +2024-07-25 23:05:27,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1352/ 1625], loss: 1.252, per_step_time: 1470ms, lr: 9.001227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:27,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.44012 samples/s/p 2:06:10 } +2024-07-25 23:05:30,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1354/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 8.995658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:30,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.42952 samples/s/p 2:06:22 } +2024-07-25 23:05:33,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1356/ 1625], loss: 1.074, per_step_time: 1474ms, lr: 8.990091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:33,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.42566 samples/s/p 2:06:24 } +2024-07-25 23:05:36,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1358/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 8.984529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:36,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% 
|██████████████████████████████████ | 5.43205 samples/s/p 2:06:12 } +2024-07-25 23:05:39,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1360/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 8.978961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:39,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.44067 samples/s/p 2:05:57 } +2024-07-25 23:05:42,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1362/ 1625], loss: 1.137, per_step_time: 1470ms, lr: 8.973397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:42,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.43854 samples/s/p 2:05:57 } +2024-07-25 23:05:45,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1364/ 1625], loss: 0.968, per_step_time: 1473ms, lr: 8.967838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:45,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.42754 samples/s/p 2:06:10 } +2024-07-25 23:05:48,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1366/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 8.962274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:48,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.43132 samples/s/p 2:06:02 } +2024-07-25 23:05:51,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1368/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 8.956715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:51,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.43571 samples/s/p 2:05:53 } 
+2024-07-25 23:05:54,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1370/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 8.951159e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:54,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.43860 samples/s/p 2:05:46 } +2024-07-25 23:05:57,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1372/ 1625], loss: 1.034, per_step_time: 1468ms, lr: 8.945599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:57,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.44686 samples/s/p 2:05:31 } +2024-07-25 23:06:00,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1374/ 1625], loss: 0.906, per_step_time: 1471ms, lr: 8.940045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:00,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43747 samples/s/p 2:05:41 } +2024-07-25 23:06:03,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1376/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 8.93449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:03,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43673 samples/s/p 2:05:39 } +2024-07-25 23:06:06,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1378/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 8.928933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:06,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43187 samples/s/p 2:05:43 } +2024-07-25 23:06:09,017 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1380/ 1625], loss: 1.162, per_step_time: 1473ms, lr: 8.923384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:09,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43035 samples/s/p 2:05:42 } +2024-07-25 23:06:11,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1382/ 1625], loss: 1.143, per_step_time: 1474ms, lr: 8.917832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:11,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.42607 samples/s/p 2:05:45 } +2024-07-25 23:06:14,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1384/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 8.912279e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:14,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43439 samples/s/p 2:05:31 } +2024-07-25 23:06:17,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1386/ 1625], loss: 1.258, per_step_time: 1473ms, lr: 8.906733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:17,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43045 samples/s/p 2:05:33 } +2024-07-25 23:06:20,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1388/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 8.9011855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:20,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43795 samples/s/p 2:05:20 } +2024-07-25 23:06:23,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 1390/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 8.8956385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:23,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43965 samples/s/p 2:05:15 } +2024-07-25 23:06:26,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1392/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 8.890093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:26,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43708 samples/s/p 2:05:15 } +2024-07-25 23:06:29,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1394/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 8.884548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:29,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43508 samples/s/p 2:05:15 } +2024-07-25 23:06:32,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1396/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 8.879007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:32,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43606 samples/s/p 2:05:11 } +2024-07-25 23:06:35,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1398/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 8.873465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:35,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.42943 samples/s/p 2:05:17 } +2024-07-25 23:06:38,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1400/ 1625], loss: 1.202, per_step_time: 
1470ms, lr: 8.8679235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:38,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43928 samples/s/p 2:05:00 } +2024-07-25 23:06:41,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1402/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 8.862388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:41,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43014 samples/s/p 2:05:10 } +2024-07-25 23:06:44,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1404/ 1625], loss: 1.314, per_step_time: 1472ms, lr: 8.856847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:44,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43128 samples/s/p 2:05:06 } +2024-07-25 23:06:47,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1406/ 1625], loss: 0.921, per_step_time: 1470ms, lr: 8.851311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:47,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.44121 samples/s/p 2:04:49 } +2024-07-25 23:06:50,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1408/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 8.845777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:50,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.43893 samples/s/p 2:04:49 } +2024-07-25 23:06:53,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1410/ 1625], loss: 1.035, per_step_time: 1474ms, lr: 8.840241e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:06:53,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.42719 samples/s/p 2:05:02 } +2024-07-25 23:06:56,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1412/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 8.834708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:56,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.43842 samples/s/p 2:04:44 } +2024-07-25 23:06:59,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1414/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 8.829178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:59,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.42901 samples/s/p 2:04:54 } +2024-07-25 23:07:02,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1416/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 8.823646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:02,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.43697 samples/s/p 2:04:40 } +2024-07-25 23:07:05,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1418/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 8.81812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:05,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.43801 samples/s/p 2:04:36 } +2024-07-25 23:07:08,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1420/ 1625], loss: 1.044, per_step_time: 1470ms, lr: 8.81259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:08,039 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.44016 samples/s/p 2:04:30 } +2024-07-25 23:07:10,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1422/ 1625], loss: 1.141, per_step_time: 1469ms, lr: 8.80706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:10,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.44436 samples/s/p 2:04:21 } +2024-07-25 23:07:13,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1424/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 8.801538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:13,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43146 samples/s/p 2:04:36 } +2024-07-25 23:07:16,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1426/ 1625], loss: 1.248, per_step_time: 1469ms, lr: 8.796013e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:16,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.44229 samples/s/p 2:04:18 } +2024-07-25 23:07:19,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1428/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 8.79049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:19,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43988 samples/s/p 2:04:18 } +2024-07-25 23:07:22,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1430/ 1625], loss: 1.459, per_step_time: 1470ms, lr: 8.7849685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:22,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% 
|██████████████████████████████████ | 5.43891 samples/s/p 2:04:17 } +2024-07-25 23:07:25,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1432/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 8.779447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:25,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43748 samples/s/p 2:04:16 } +2024-07-25 23:07:28,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1434/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 8.773927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:28,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43171 samples/s/p 2:04:21 } +2024-07-25 23:07:31,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1436/ 1625], loss: 1.156, per_step_time: 1473ms, lr: 8.76841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:31,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43067 samples/s/p 2:04:19 } +2024-07-25 23:07:34,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1438/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 8.762892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:34,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43423 samples/s/p 2:04:12 } +2024-07-25 23:07:37,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1440/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 8.757377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:37,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43327 samples/s/p 2:04:10 } 
+2024-07-25 23:07:40,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1442/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 8.751863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:40,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43164 samples/s/p 2:04:09 } +2024-07-25 23:07:43,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1444/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 8.746349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:43,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43316 samples/s/p 2:04:04 } +2024-07-25 23:07:46,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1446/ 1625], loss: 1.224, per_step_time: 1471ms, lr: 8.740837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:46,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43818 samples/s/p 2:03:54 } +2024-07-25 23:07:49,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1448/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 8.7353255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:49,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43062 samples/s/p 2:04:02 } +2024-07-25 23:07:52,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1450/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 8.729817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:52,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43762 samples/s/p 2:03:49 } +2024-07-25 23:07:52,300 - 
mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-25 23:08:28,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1452/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 8.724312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:28,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43482 samples/s/p 2:03:50 } +2024-07-25 23:08:31,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1454/ 1625], loss: 1.010, per_step_time: 1474ms, lr: 8.718801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:31,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.42420 samples/s/p 2:04:02 } +2024-07-25 23:08:34,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1456/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 8.713299e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:34,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.42821 samples/s/p 2:03:53 } +2024-07-25 23:08:37,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1458/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 8.707794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:37,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.44152 samples/s/p 2:03:32 } +2024-07-25 23:08:40,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1460/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 8.702288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:40,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.44040 
samples/s/p 2:03:31 } +2024-07-25 23:08:43,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1462/ 1625], loss: 0.991, per_step_time: 1471ms, lr: 8.696789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:43,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.43778 samples/s/p 2:03:31 } +2024-07-25 23:08:46,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1464/ 1625], loss: 1.277, per_step_time: 1477ms, lr: 8.691288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:46,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.41383 samples/s/p 2:04:01 } +2024-07-25 23:08:49,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1466/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 8.685786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:49,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.43394 samples/s/p 2:03:31 } +2024-07-25 23:08:52,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1468/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 8.680291e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:52,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.43587 samples/s/p 2:03:25 } +2024-07-25 23:08:55,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1470/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 8.674794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:55,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.43608 samples/s/p 2:03:22 } +2024-07-25 23:08:58,301 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1472/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 8.669298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:58,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43496 samples/s/p 2:03:20 } +2024-07-25 23:09:01,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1474/ 1625], loss: 1.186, per_step_time: 1473ms, lr: 8.663804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:01,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43049 samples/s/p 2:03:24 } +2024-07-25 23:09:04,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1476/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 8.658311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:04,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43417 samples/s/p 2:03:16 } +2024-07-25 23:09:07,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1478/ 1625], loss: 1.037, per_step_time: 1472ms, lr: 8.652818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:07,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43478 samples/s/p 2:03:12 } +2024-07-25 23:09:10,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1480/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 8.647328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:10,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.42800 samples/s/p 2:03:18 } +2024-07-25 23:09:13,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 1482/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 8.641839e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:13,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.42883 samples/s/p 2:03:14 } +2024-07-25 23:09:16,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1484/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 8.63635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:16,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43251 samples/s/p 2:03:06 } +2024-07-25 23:09:18,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1486/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 8.630864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:18,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43677 samples/s/p 2:02:57 } +2024-07-25 23:09:21,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1488/ 1625], loss: 0.997, per_step_time: 1471ms, lr: 8.625377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:21,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43643 samples/s/p 2:02:55 } +2024-07-25 23:09:24,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1490/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 8.619893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:24,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43108 samples/s/p 2:02:59 } +2024-07-25 23:09:27,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1492/ 1625], loss: 1.212, per_step_time: 
1471ms, lr: 8.614409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:27,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43841 samples/s/p 2:02:46 } +2024-07-25 23:09:30,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1494/ 1625], loss: 0.945, per_step_time: 1474ms, lr: 8.6089285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:30,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.42570 samples/s/p 2:03:01 } +2024-07-25 23:09:33,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1496/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 8.603447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:33,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43587 samples/s/p 2:02:44 } +2024-07-25 23:09:36,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1498/ 1625], loss: 1.109, per_step_time: 1471ms, lr: 8.597967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:36,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43515 samples/s/p 2:02:42 } +2024-07-25 23:09:39,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1500/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 8.592493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:39,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43991 samples/s/p 2:02:33 } +2024-07-25 23:09:42,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1502/ 1625], loss: 1.362, per_step_time: 1471ms, lr: 8.587017e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:09:42,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43551 samples/s/p 2:02:36 } +2024-07-25 23:09:45,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1504/ 1625], loss: 1.001, per_step_time: 1471ms, lr: 8.581538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:45,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.43841 samples/s/p 2:02:29 } +2024-07-25 23:09:48,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1506/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 8.576068e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:48,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.43643 samples/s/p 2:02:28 } +2024-07-25 23:09:51,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1508/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 8.570594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:51,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.42966 samples/s/p 2:02:35 } +2024-07-25 23:09:54,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1510/ 1625], loss: 1.236, per_step_time: 1474ms, lr: 8.565119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:54,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.42600 samples/s/p 2:02:37 } +2024-07-25 23:09:57,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1512/ 1625], loss: 1.259, per_step_time: 1473ms, lr: 8.559652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:57,342 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.42826 samples/s/p 2:02:31 } +2024-07-25 23:10:00,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1514/ 1625], loss: 0.986, per_step_time: 1469ms, lr: 8.554183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:00,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.44432 samples/s/p 2:02:06 } +2024-07-25 23:10:03,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1516/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 8.548715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:03,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.43871 samples/s/p 2:02:11 } +2024-07-25 23:10:06,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1518/ 1625], loss: 1.097, per_step_time: 1470ms, lr: 8.543249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:06,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.43872 samples/s/p 2:02:08 } +2024-07-25 23:10:09,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1520/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 8.537784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:09,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.44100 samples/s/p 2:02:02 } +2024-07-25 23:10:12,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1522/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 8.532321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:12,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% 
|██████████████████████████████████ | 5.43109 samples/s/p 2:02:12 } +2024-07-25 23:10:15,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1524/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 8.5268575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:15,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43395 samples/s/p 2:02:05 } +2024-07-25 23:10:17,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1526/ 1625], loss: 1.011, per_step_time: 1471ms, lr: 8.521397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:17,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43671 samples/s/p 2:01:59 } +2024-07-25 23:10:20,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1528/ 1625], loss: 0.987, per_step_time: 1472ms, lr: 8.515936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:20,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43352 samples/s/p 2:02:00 } +2024-07-25 23:10:23,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1530/ 1625], loss: 1.117, per_step_time: 1470ms, lr: 8.5104775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:23,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43917 samples/s/p 2:01:49 } +2024-07-25 23:10:26,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1532/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 8.505021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:26,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43471 samples/s/p 2:01:52 } 
+2024-07-25 23:10:29,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1534/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 8.499564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:29,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43747 samples/s/p 2:01:46 } +2024-07-25 23:10:32,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1536/ 1625], loss: 1.032, per_step_time: 1471ms, lr: 8.494109e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:32,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.43800 samples/s/p 2:01:42 } +2024-07-25 23:10:35,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1538/ 1625], loss: 1.328, per_step_time: 1473ms, lr: 8.488656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:35,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.42955 samples/s/p 2:01:51 } +2024-07-25 23:10:38,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1540/ 1625], loss: 1.013, per_step_time: 1470ms, lr: 8.483204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:38,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.43893 samples/s/p 2:01:35 } +2024-07-25 23:10:41,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1542/ 1625], loss: 1.068, per_step_time: 1472ms, lr: 8.477753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:41,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.43159 samples/s/p 2:01:42 } +2024-07-25 23:10:44,544 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1544/ 1625], loss: 0.986, per_step_time: 1471ms, lr: 8.472306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:44,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.43642 samples/s/p 2:01:33 } +2024-07-25 23:10:47,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1546/ 1625], loss: 1.187, per_step_time: 1474ms, lr: 8.4668545e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:47,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.42715 samples/s/p 2:01:42 } +2024-07-25 23:10:50,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1548/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 8.461408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:50,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.43208 samples/s/p 2:01:32 } +2024-07-25 23:10:53,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1550/ 1625], loss: 1.124, per_step_time: 1482ms, lr: 8.455965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:53,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.39665 samples/s/p 2:02:17 } +2024-07-25 23:10:56,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1552/ 1625], loss: 1.251, per_step_time: 1473ms, lr: 8.45052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:56,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.42891 samples/s/p 2:01:31 } +2024-07-25 23:10:59,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 1554/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 8.445074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:59,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43555 samples/s/p 2:01:19 } +2024-07-25 23:11:02,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1556/ 1625], loss: 1.084, per_step_time: 1470ms, lr: 8.439636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:02,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43865 samples/s/p 2:01:12 } +2024-07-25 23:11:05,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1558/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 8.434195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:05,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43719 samples/s/p 2:01:11 } +2024-07-25 23:11:08,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1560/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 8.428756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:08,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43757 samples/s/p 2:01:07 } +2024-07-25 23:11:11,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1562/ 1625], loss: 1.217, per_step_time: 1470ms, lr: 8.423317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:11,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43915 samples/s/p 2:01:02 } +2024-07-25 23:11:14,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1564/ 1625], loss: 1.206, per_step_time: 
1471ms, lr: 8.41788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:14,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43596 samples/s/p 2:01:04 } +2024-07-25 23:11:17,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1566/ 1625], loss: 1.008, per_step_time: 1472ms, lr: 8.412446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:17,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43319 samples/s/p 2:01:04 } +2024-07-25 23:11:19,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1568/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 8.407012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:19,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43557 samples/s/p 2:00:58 } +2024-07-25 23:11:22,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1570/ 1625], loss: 1.127, per_step_time: 1474ms, lr: 8.401578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:22,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.42741 samples/s/p 2:01:06 } +2024-07-25 23:11:25,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1572/ 1625], loss: 1.227, per_step_time: 1469ms, lr: 8.396148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:25,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.44254 samples/s/p 2:00:43 } +2024-07-25 23:11:28,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1574/ 1625], loss: 1.042, per_step_time: 1470ms, lr: 8.390716e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:11:28,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43953 samples/s/p 2:00:44 } +2024-07-25 23:11:31,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1576/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 8.385287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:31,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43785 samples/s/p 2:00:44 } +2024-07-25 23:11:34,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1578/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 8.37986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:34,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43783 samples/s/p 2:00:41 } +2024-07-25 23:11:37,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1580/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 8.3744335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:37,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43616 samples/s/p 2:00:40 } +2024-07-25 23:11:40,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1582/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 8.369009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:40,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43744 samples/s/p 2:00:35 } +2024-07-25 23:11:43,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1584/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 8.363585e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:43,581 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43346 samples/s/p 2:00:38 } +2024-07-25 23:11:46,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1586/ 1625], loss: 1.240, per_step_time: 1476ms, lr: 8.358163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:46,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.41991 samples/s/p 2:00:53 } +2024-07-25 23:11:49,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1588/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 8.352746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:49,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43596 samples/s/p 2:00:28 } +2024-07-25 23:11:52,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1590/ 1625], loss: 1.150, per_step_time: 1472ms, lr: 8.347323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:52,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43400 samples/s/p 2:00:28 } +2024-07-25 23:11:55,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1592/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 8.3419045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:55,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43190 samples/s/p 2:00:28 } +2024-07-25 23:11:58,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1594/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 8.33649e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:58,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% 
|██████████████████████████████████ | 5.43044 samples/s/p 2:00:27 } +2024-07-25 23:12:01,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1596/ 1625], loss: 1.240, per_step_time: 1470ms, lr: 8.3310715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:01,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43981 samples/s/p 2:00:12 } +2024-07-25 23:12:04,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1598/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 8.325661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:04,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43683 samples/s/p 2:00:13 } +2024-07-25 23:12:07,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1600/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 8.320248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:07,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43575 samples/s/p 2:00:11 } +2024-07-25 23:12:10,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1602/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 8.314836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:10,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43709 samples/s/p 2:00:06 } +2024-07-25 23:12:13,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1604/ 1625], loss: 1.067, per_step_time: 1470ms, lr: 8.3094255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:13,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43964 samples/s/p 2:00:00 } 
+2024-07-25 23:12:16,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1606/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 8.304017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:16,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43353 samples/s/p 2:00:05 } +2024-07-25 23:12:19,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1608/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 8.298609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:19,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43083 samples/s/p 2:00:06 } +2024-07-25 23:12:21,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1610/ 1625], loss: 0.941, per_step_time: 1472ms, lr: 8.293203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:21,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43478 samples/s/p 1:59:58 } +2024-07-25 23:12:24,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1612/ 1625], loss: 1.206, per_step_time: 1470ms, lr: 8.287798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:24,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.44013 samples/s/p 1:59:48 } +2024-07-25 23:12:27,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1614/ 1625], loss: 1.266, per_step_time: 1476ms, lr: 8.282394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:27,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.41647 samples/s/p 2:00:16 } +2024-07-25 23:12:30,813 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1616/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 8.276991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:30,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43268 samples/s/p 1:59:52 } +2024-07-25 23:12:33,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1618/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 8.271591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:33,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.43625 samples/s/p 1:59:44 } +2024-07-25 23:12:36,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1620/ 1625], loss: 1.401, per_step_time: 1471ms, lr: 8.266191e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:36,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.43613 samples/s/p 1:59:41 } +2024-07-25 23:12:39,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1622/ 1625], loss: 1.037, per_step_time: 1471ms, lr: 8.260793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:39,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.43826 samples/s/p 1:59:35 } +2024-07-25 23:12:42,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1624/ 1625], loss: 1.285, per_step_time: 1474ms, lr: 8.255394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:42,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.42400 samples/s/p 1:59:51 } +2024-07-25 23:12:45,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 1/ 1625], loss: 1.079, per_step_time: 1471ms, lr: 8.250003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:45,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.43736 samples/s/p 1:59:31 } +2024-07-25 23:12:48,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 3/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 8.244605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:48,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.43580 samples/s/p 1:59:30 } +2024-07-25 23:12:51,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 5/ 1625], loss: 1.005, per_step_time: 1472ms, lr: 8.239212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:51,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.43408 samples/s/p 1:59:29 } +2024-07-25 23:12:54,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 7/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 8.233824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:54,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.44003 samples/s/p 1:59:18 } +2024-07-25 23:12:57,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 9/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 8.2284305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:57,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43614 samples/s/p 1:59:20 } +2024-07-25 23:13:00,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 11/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 
8.223042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:00,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43805 samples/s/p 1:59:15 } +2024-07-25 23:13:03,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 13/ 1625], loss: 1.318, per_step_time: 1471ms, lr: 8.217657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:03,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43815 samples/s/p 1:59:12 } +2024-07-25 23:13:06,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 15/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 8.212267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:06,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43585 samples/s/p 1:59:12 } +2024-07-25 23:13:09,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 17/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 8.2068855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:09,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43279 samples/s/p 1:59:13 } +2024-07-25 23:13:12,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 19/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 8.201501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:12,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43669 samples/s/p 1:59:05 } +2024-07-25 23:13:15,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 21/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 8.196116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:13:15,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.44097 samples/s/p 1:58:56 } +2024-07-25 23:13:18,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 23/ 1625], loss: 1.287, per_step_time: 1475ms, lr: 8.190739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:18,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.42332 samples/s/p 1:59:17 } +2024-07-25 23:13:20,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 25/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 8.185359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:20,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43405 samples/s/p 1:59:00 } +2024-07-25 23:13:23,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 27/ 1625], loss: 1.206, per_step_time: 1470ms, lr: 8.179981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:23,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.44081 samples/s/p 1:58:48 } +2024-07-25 23:13:26,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 29/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 8.174604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:26,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43791 samples/s/p 1:58:49 } +2024-07-25 23:13:29,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 31/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 8.169228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:29,829 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 70.2% |███████████████████████████████████ | 5.43249 samples/s/p 1:58:53 } +2024-07-25 23:13:32,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 33/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 8.163854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:32,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43669 samples/s/p 1:58:44 } +2024-07-25 23:13:35,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 35/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 8.158482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:35,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43491 samples/s/p 1:58:44 } +2024-07-25 23:13:38,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 37/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 8.153111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:38,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43513 samples/s/p 1:58:41 } +2024-07-25 23:13:41,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 39/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 8.14774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:41,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43523 samples/s/p 1:58:38 } +2024-07-25 23:13:44,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 41/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 8.1423705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:44,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43684 samples/s/p 
1:58:32 } +2024-07-25 23:13:47,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 43/ 1625], loss: 1.228, per_step_time: 1470ms, lr: 8.1370035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:47,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43876 samples/s/p 1:58:27 } +2024-07-25 23:13:50,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 45/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 8.13164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:50,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43695 samples/s/p 1:58:26 } +2024-07-25 23:13:53,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 47/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 8.126273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:53,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43634 samples/s/p 1:58:24 } +2024-07-25 23:13:56,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 49/ 1625], loss: 1.120, per_step_time: 1475ms, lr: 8.120909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:56,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.42340 samples/s/p 1:58:38 } +2024-07-25 23:13:59,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 51/ 1625], loss: 1.296, per_step_time: 1472ms, lr: 8.11555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:59,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43306 samples/s/p 1:58:23 } +2024-07-25 23:14:02,299 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 53/ 1625], loss: 1.118, per_step_time: 1475ms, lr: 8.110187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:02,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.42062 samples/s/p 1:58:36 } +2024-07-25 23:14:05,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 55/ 1625], loss: 1.382, per_step_time: 1471ms, lr: 8.104828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:05,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43693 samples/s/p 1:58:12 } +2024-07-25 23:14:08,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 57/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 8.099473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:08,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43381 samples/s/p 1:58:13 } +2024-07-25 23:14:11,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 59/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 8.094114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:11,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43677 samples/s/p 1:58:06 } +2024-07-25 23:14:14,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 61/ 1625], loss: 1.079, per_step_time: 1470ms, lr: 8.088761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:14,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.44008 samples/s/p 1:57:59 } +2024-07-25 23:14:17,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
8/ 10], step:[ 63/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 8.083408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:17,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43898 samples/s/p 1:57:57 } +2024-07-25 23:14:19,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 65/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 8.078052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:19,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43425 samples/s/p 1:58:01 } +2024-07-25 23:14:22,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 67/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 8.072704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:22,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43845 samples/s/p 1:57:52 } +2024-07-25 23:14:25,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 69/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 8.067355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:25,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43211 samples/s/p 1:57:57 } +2024-07-25 23:14:28,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 71/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 8.062004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:28,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43967 samples/s/p 1:57:45 } +2024-07-25 23:14:31,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 73/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 
8.05666e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:31,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43256 samples/s/p 1:57:51 } +2024-07-25 23:14:34,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 75/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 8.051315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:34,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.43283 samples/s/p 1:57:48 } +2024-07-25 23:14:37,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 77/ 1625], loss: 0.892, per_step_time: 1470ms, lr: 8.0459695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:37,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.44078 samples/s/p 1:57:34 } +2024-07-25 23:14:40,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 79/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 8.040627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:40,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.42795 samples/s/p 1:57:48 } +2024-07-25 23:14:43,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 81/ 1625], loss: 1.188, per_step_time: 1475ms, lr: 8.035286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:43,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.42091 samples/s/p 1:57:54 } +2024-07-25 23:14:46,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 83/ 1625], loss: 0.976, per_step_time: 1473ms, lr: 8.029945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:14:46,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.42907 samples/s/p 1:57:41 } +2024-07-25 23:14:49,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 85/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 8.024606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:49,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.43292 samples/s/p 1:57:33 } +2024-07-25 23:14:52,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 87/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 8.019269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:52,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.43609 samples/s/p 1:57:26 } +2024-07-25 23:14:55,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 89/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 8.013937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:55,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.43617 samples/s/p 1:57:23 } +2024-07-25 23:14:58,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 91/ 1625], loss: 0.993, per_step_time: 1472ms, lr: 8.008599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:58,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43146 samples/s/p 1:57:26 } +2024-07-25 23:15:01,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 93/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 8.003266e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:01,325 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 70.6% |███████████████████████████████████ | 5.43572 samples/s/p 1:57:17 } +2024-07-25 23:15:04,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 95/ 1625], loss: 1.204, per_step_time: 1468ms, lr: 7.997937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:04,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.44703 samples/s/p 1:57:00 } +2024-07-25 23:15:07,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 97/ 1625], loss: 1.009, per_step_time: 1472ms, lr: 7.992605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:07,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43474 samples/s/p 1:57:13 } +2024-07-25 23:15:10,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 99/ 1625], loss: 1.325, per_step_time: 1471ms, lr: 7.987275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:10,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43479 samples/s/p 1:57:10 } +2024-07-25 23:15:13,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 101/ 1625], loss: 0.903, per_step_time: 1473ms, lr: 7.981951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:13,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43023 samples/s/p 1:57:13 } +2024-07-25 23:15:16,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 103/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 7.976621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:16,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43697 samples/s/p 
1:57:01 } +2024-07-25 23:15:19,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 105/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 7.9713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:19,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43361 samples/s/p 1:57:02 } +2024-07-25 23:15:21,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 107/ 1625], loss: 1.100, per_step_time: 1470ms, lr: 7.965976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:21,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43989 samples/s/p 1:56:51 } +2024-07-25 23:15:24,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 109/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 7.960652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:24,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43006 samples/s/p 1:57:01 } +2024-07-25 23:15:27,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 111/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 7.955334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:27,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.44118 samples/s/p 1:56:44 } +2024-07-25 23:15:30,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 113/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 7.950014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:30,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43747 samples/s/p 1:56:46 } +2024-07-25 23:15:33,776 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 115/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 7.944696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:33,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.44058 samples/s/p 1:56:39 } +2024-07-25 23:15:36,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 117/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 7.93938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:36,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43463 samples/s/p 1:56:43 } +2024-07-25 23:15:39,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 119/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 7.934065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:39,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43448 samples/s/p 1:56:41 } +2024-07-25 23:15:42,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 121/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 7.928752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:42,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.42806 samples/s/p 1:56:46 } +2024-07-25 23:15:45,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 123/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 7.923439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:45,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.44131 samples/s/p 1:56:26 } +2024-07-25 23:15:48,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 125/ 1625], loss: 1.249, per_step_time: 1470ms, lr: 7.918128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:48,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.44074 samples/s/p 1:56:24 } +2024-07-25 23:15:51,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 127/ 1625], loss: 1.352, per_step_time: 1472ms, lr: 7.912819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:51,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43261 samples/s/p 1:56:31 } +2024-07-25 23:15:54,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 129/ 1625], loss: 1.101, per_step_time: 1473ms, lr: 7.907511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:54,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43069 samples/s/p 1:56:31 } +2024-07-25 23:15:57,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 131/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 7.902204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:57,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43078 samples/s/p 1:56:28 } +2024-07-25 23:16:00,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 133/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 7.8969015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:00,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43861 samples/s/p 1:56:15 } +2024-07-25 23:16:03,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 135/ 1625], loss: 1.298, per_step_time: 
1471ms, lr: 7.8915955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:03,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43813 samples/s/p 1:56:12 } +2024-07-25 23:16:06,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 137/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 7.886293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:06,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43810 samples/s/p 1:56:10 } +2024-07-25 23:16:09,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 139/ 1625], loss: 1.361, per_step_time: 1472ms, lr: 7.880994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:09,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43468 samples/s/p 1:56:11 } +2024-07-25 23:16:12,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 141/ 1625], loss: 0.940, per_step_time: 1471ms, lr: 7.875692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:12,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43521 samples/s/p 1:56:07 } +2024-07-25 23:16:15,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 143/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 7.870396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:15,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.44194 samples/s/p 1:55:56 } +2024-07-25 23:16:18,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 145/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 7.8651e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:16:18,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.44045 samples/s/p 1:55:55 } +2024-07-25 23:16:20,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 147/ 1625], loss: 1.226, per_step_time: 1473ms, lr: 7.859801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:20,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.42980 samples/s/p 1:56:06 } +2024-07-25 23:16:23,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 149/ 1625], loss: 0.906, per_step_time: 1470ms, lr: 7.85451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:23,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43903 samples/s/p 1:55:51 } +2024-07-25 23:16:26,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 151/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 7.8492185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:26,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43714 samples/s/p 1:55:50 } +2024-07-25 23:16:29,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 153/ 1625], loss: 1.019, per_step_time: 1472ms, lr: 7.843923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:29,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43471 samples/s/p 1:55:50 } +2024-07-25 23:16:32,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 155/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 7.838637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:32,785 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43936 samples/s/p 1:55:41 } +2024-07-25 23:16:35,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 157/ 1625], loss: 1.018, per_step_time: 1472ms, lr: 7.833349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:35,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43428 samples/s/p 1:55:45 } +2024-07-25 23:16:38,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 159/ 1625], loss: 1.267, per_step_time: 1470ms, lr: 7.828062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:38,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43971 samples/s/p 1:55:35 } +2024-07-25 23:16:41,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 161/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 7.822776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:41,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43778 samples/s/p 1:55:35 } +2024-07-25 23:16:44,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 163/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 7.817492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:44,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43409 samples/s/p 1:55:36 } +2024-07-25 23:16:47,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 165/ 1625], loss: 1.167, per_step_time: 1469ms, lr: 7.812209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:47,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% 
|███████████████████████████████████ | 5.44556 samples/s/p 1:55:19 } +2024-07-25 23:16:50,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 167/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 7.806928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:50,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43770 samples/s/p 1:55:26 } +2024-07-25 23:16:53,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 169/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 7.801648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:53,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43097 samples/s/p 1:55:32 } +2024-07-25 23:16:56,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 171/ 1625], loss: 1.289, per_step_time: 1471ms, lr: 7.7963705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:56,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.43616 samples/s/p 1:55:22 } +2024-07-25 23:16:59,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 173/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 7.791093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:59,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.43038 samples/s/p 1:55:26 } +2024-07-25 23:17:02,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 175/ 1625], loss: 1.149, per_step_time: 1469ms, lr: 7.785818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:02,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.44220 samples/s/p 1:55:08 } 
+2024-07-25 23:17:05,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 177/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 7.780546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:05,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.44204 samples/s/p 1:55:06 } +2024-07-25 23:17:08,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 179/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 7.77527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:08,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.43839 samples/s/p 1:55:07 } +2024-07-25 23:17:11,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 181/ 1625], loss: 1.099, per_step_time: 1470ms, lr: 7.77e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:11,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.44208 samples/s/p 1:55:00 } +2024-07-25 23:17:14,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 183/ 1625], loss: 1.064, per_step_time: 1470ms, lr: 7.764732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:14,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.44012 samples/s/p 1:54:59 } +2024-07-25 23:17:17,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 185/ 1625], loss: 1.031, per_step_time: 1470ms, lr: 7.7594605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:17,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.44027 samples/s/p 1:54:56 } +2024-07-25 23:17:19,972 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 187/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 7.754196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:19,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.44014 samples/s/p 1:54:53 } +2024-07-25 23:17:22,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 189/ 1625], loss: 1.061, per_step_time: 1473ms, lr: 7.748931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:22,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43090 samples/s/p 1:55:02 } +2024-07-25 23:17:25,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 191/ 1625], loss: 1.170, per_step_time: 1469ms, lr: 7.743663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:25,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.44462 samples/s/p 1:54:42 } +2024-07-25 23:17:28,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 193/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 7.738405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:28,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43143 samples/s/p 1:54:56 } +2024-07-25 23:17:31,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 195/ 1625], loss: 1.033, per_step_time: 1473ms, lr: 7.733143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:31,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43099 samples/s/p 1:54:53 } +2024-07-25 23:17:34,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 197/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 7.72788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:34,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43145 samples/s/p 1:54:50 } +2024-07-25 23:17:37,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 199/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 7.722625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:37,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43732 samples/s/p 1:54:39 } +2024-07-25 23:17:40,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 201/ 1625], loss: 1.314, per_step_time: 1472ms, lr: 7.717367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:40,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43430 samples/s/p 1:54:40 } +2024-07-25 23:17:43,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 203/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 7.712112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:43,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43443 samples/s/p 1:54:37 } +2024-07-25 23:17:46,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 205/ 1625], loss: 0.943, per_step_time: 1471ms, lr: 7.706858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:46,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43636 samples/s/p 1:54:32 } +2024-07-25 23:17:49,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 207/ 1625], loss: 1.187, per_step_time: 1472ms, 
lr: 7.701605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:49,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43238 samples/s/p 1:54:34 } +2024-07-25 23:17:52,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 209/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 7.696354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:52,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43001 samples/s/p 1:54:34 } +2024-07-25 23:17:55,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 211/ 1625], loss: 1.014, per_step_time: 1477ms, lr: 7.691104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:55,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.41283 samples/s/p 1:54:53 } +2024-07-25 23:17:58,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 213/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 7.685856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:58,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43365 samples/s/p 1:54:23 } +2024-07-25 23:18:01,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 215/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 7.680609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:01,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.44207 samples/s/p 1:54:10 } +2024-07-25 23:18:04,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 217/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 7.675363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:18:04,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43518 samples/s/p 1:54:16 } +2024-07-25 23:18:07,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 219/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 7.67012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:07,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43410 samples/s/p 1:54:14 } +2024-07-25 23:18:10,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 221/ 1625], loss: 1.104, per_step_time: 1470ms, lr: 7.664877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:10,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.44042 samples/s/p 1:54:03 } +2024-07-25 23:18:13,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 223/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 7.659636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:13,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.42904 samples/s/p 1:54:14 } +2024-07-25 23:18:16,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 225/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 7.654396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:16,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.43974 samples/s/p 1:53:58 } +2024-07-25 23:18:19,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 227/ 1625], loss: 0.939, per_step_time: 1471ms, lr: 7.649158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:19,005 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 71.4% |███████████████████████████████████ | 5.43796 samples/s/p 1:53:57 } +2024-07-25 23:18:21,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 229/ 1625], loss: 0.986, per_step_time: 1482ms, lr: 7.643921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:21,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.39577 samples/s/p 1:54:48 } +2024-07-25 23:18:24,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 231/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 7.638689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:24,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.44034 samples/s/p 1:53:48 } +2024-07-25 23:18:27,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 233/ 1625], loss: 1.245, per_step_time: 1470ms, lr: 7.6334545e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:27,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.44158 samples/s/p 1:53:44 } +2024-07-25 23:18:30,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 235/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 7.628219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:30,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.43414 samples/s/p 1:53:50 } +2024-07-25 23:18:33,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 237/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 7.6229917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:33,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43601 
samples/s/p 1:53:45 } +2024-07-25 23:18:36,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 239/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 7.617762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:36,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43496 samples/s/p 1:53:43 } +2024-07-25 23:18:39,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 241/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 7.6125307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:39,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43196 samples/s/p 1:53:44 } +2024-07-25 23:18:42,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 243/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 7.607307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:42,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43294 samples/s/p 1:53:40 } +2024-07-25 23:18:45,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 245/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 7.602082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:45,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43363 samples/s/p 1:53:36 } +2024-07-25 23:18:48,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 247/ 1625], loss: 1.175, per_step_time: 1470ms, lr: 7.5968583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:48,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43960 samples/s/p 1:53:26 } +2024-07-25 23:18:51,479 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 249/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 7.5916355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:51,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.44063 samples/s/p 1:53:22 } +2024-07-25 23:18:54,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 251/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 7.586415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:54,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43777 samples/s/p 1:53:22 } +2024-07-25 23:18:57,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 253/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 7.581196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:57,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43673 samples/s/p 1:53:21 } +2024-07-25 23:19:00,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 255/ 1625], loss: 1.045, per_step_time: 1470ms, lr: 7.575978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:00,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.44123 samples/s/p 1:53:12 } +2024-07-25 23:19:03,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 257/ 1625], loss: 0.994, per_step_time: 1470ms, lr: 7.5707617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:03,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.44092 samples/s/p 1:53:10 } +2024-07-25 23:19:06,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 259/ 1625], loss: 1.027, per_step_time: 1473ms, lr: 7.5655466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:06,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43089 samples/s/p 1:53:19 } +2024-07-25 23:19:09,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 261/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 7.5603334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:09,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43518 samples/s/p 1:53:11 } +2024-07-25 23:19:12,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 263/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 7.555121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:12,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43819 samples/s/p 1:53:04 } +2024-07-25 23:19:15,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 265/ 1625], loss: 1.027, per_step_time: 1470ms, lr: 7.54991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:15,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.44049 samples/s/p 1:52:58 } +2024-07-25 23:19:18,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 267/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 7.5447015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:18,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43427 samples/s/p 1:53:03 } +2024-07-25 23:19:20,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 269/ 1625], loss: 1.185, per_step_time: 
1472ms, lr: 7.5394933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:20,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43354 samples/s/p 1:53:01 } +2024-07-25 23:19:23,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 271/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 7.5342878e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:23,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43743 samples/s/p 1:52:53 } +2024-07-25 23:19:26,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 273/ 1625], loss: 1.193, per_step_time: 1471ms, lr: 7.529083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:26,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43682 samples/s/p 1:52:51 } +2024-07-25 23:19:29,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 275/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 7.5238827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:29,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43787 samples/s/p 1:52:47 } +2024-07-25 23:19:32,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 277/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 7.518678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:32,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43764 samples/s/p 1:52:44 } +2024-07-25 23:19:35,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 279/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 7.513478e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:19:35,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43516 samples/s/p 1:52:44 } +2024-07-25 23:19:38,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 281/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 7.508282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:38,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43443 samples/s/p 1:52:42 } +2024-07-25 23:19:41,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 283/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 7.5030853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:41,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43772 samples/s/p 1:52:35 } +2024-07-25 23:19:44,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 285/ 1625], loss: 1.018, per_step_time: 1470ms, lr: 7.4978893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:44,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.44046 samples/s/p 1:52:29 } +2024-07-25 23:19:47,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 287/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 7.492694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:47,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.43843 samples/s/p 1:52:29 } +2024-07-25 23:19:50,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 289/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 7.4875015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:50,478 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.43365 samples/s/p 1:52:32 } +2024-07-25 23:19:53,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 291/ 1625], loss: 1.135, per_step_time: 1475ms, lr: 7.4823097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:53,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.42130 samples/s/p 1:52:44 } +2024-07-25 23:19:56,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 293/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 7.4771206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:56,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.43197 samples/s/p 1:52:28 } +2024-07-25 23:19:59,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 295/ 1625], loss: 1.119, per_step_time: 1470ms, lr: 7.471932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:59,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.44073 samples/s/p 1:52:14 } +2024-07-25 23:20:02,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 297/ 1625], loss: 1.064, per_step_time: 1473ms, lr: 7.4667446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:02,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.43017 samples/s/p 1:52:24 } +2024-07-25 23:20:05,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 299/ 1625], loss: 1.055, per_step_time: 1471ms, lr: 7.4615587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:05,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
71.8% |███████████████████████████████████ | 5.43839 samples/s/p 1:52:11 } +2024-07-25 23:20:08,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 301/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 7.456376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:08,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43564 samples/s/p 1:52:11 } +2024-07-25 23:20:11,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 303/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 7.4511927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:11,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43462 samples/s/p 1:52:10 } +2024-07-25 23:20:14,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 305/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 7.446012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:14,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43644 samples/s/p 1:52:04 } +2024-07-25 23:20:17,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 307/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 7.4408326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:17,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.42741 samples/s/p 1:52:13 } +2024-07-25 23:20:20,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 309/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 7.435654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:20,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.42849 samples/s/p 
1:52:08 } +2024-07-25 23:20:22,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 311/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 7.430478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:22,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43733 samples/s/p 1:51:55 } +2024-07-25 23:20:25,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 313/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 7.4253053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:25,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43800 samples/s/p 1:51:51 } +2024-07-25 23:20:28,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 315/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 7.4201294e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:28,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43919 samples/s/p 1:51:46 } +2024-07-25 23:20:31,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 317/ 1625], loss: 1.017, per_step_time: 1471ms, lr: 7.4149575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:31,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.43584 samples/s/p 1:51:48 } +2024-07-25 23:20:34,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 319/ 1625], loss: 0.999, per_step_time: 1469ms, lr: 7.4097893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:34,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.44283 samples/s/p 1:51:36 } +2024-07-25 23:20:37,700 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 321/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 7.4046175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:37,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.43011 samples/s/p 1:51:49 } +2024-07-25 23:20:40,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 323/ 1625], loss: 1.174, per_step_time: 1474ms, lr: 7.39945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:40,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.42555 samples/s/p 1:51:51 } +2024-07-25 23:20:43,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 325/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 7.394287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:43,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43562 samples/s/p 1:51:36 } +2024-07-25 23:20:46,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 327/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 7.389119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:46,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43629 samples/s/p 1:51:32 } +2024-07-25 23:20:49,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 329/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 7.3839587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:49,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43402 samples/s/p 1:51:32 } +2024-07-25 23:20:52,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 331/ 1625], loss: 0.983, per_step_time: 1472ms, lr: 7.3787974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:52,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43391 samples/s/p 1:51:29 } +2024-07-25 23:20:55,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 333/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 7.373637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:55,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43394 samples/s/p 1:51:26 } +2024-07-25 23:20:58,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 335/ 1625], loss: 1.035, per_step_time: 1472ms, lr: 7.368479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:58,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43429 samples/s/p 1:51:23 } +2024-07-25 23:21:01,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 337/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 7.363322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:01,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43981 samples/s/p 1:51:13 } +2024-07-25 23:21:04,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 339/ 1625], loss: 1.283, per_step_time: 1470ms, lr: 7.3581655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:04,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43889 samples/s/p 1:51:11 } +2024-07-25 23:21:07,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 341/ 1625], loss: 1.095, per_step_time: 
1470ms, lr: 7.353012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:07,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43965 samples/s/p 1:51:08 } +2024-07-25 23:21:10,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 343/ 1625], loss: 1.290, per_step_time: 1473ms, lr: 7.347859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:10,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.42796 samples/s/p 1:51:19 } +2024-07-25 23:21:13,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 345/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 7.342708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:13,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43266 samples/s/p 1:51:10 } +2024-07-25 23:21:16,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 347/ 1625], loss: 1.077, per_step_time: 1469ms, lr: 7.337559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:16,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.44230 samples/s/p 1:50:56 } +2024-07-25 23:21:19,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 349/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 7.3324104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:19,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43226 samples/s/p 1:51:05 } +2024-07-25 23:21:21,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 351/ 1625], loss: 1.164, per_step_time: 1469ms, lr: 7.3272636e-06, overflow cond: False, loss_scale: 
1.0 +2024-07-25 23:21:21,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.44431 samples/s/p 1:50:47 } +2024-07-25 23:21:24,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 353/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 7.3221186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:24,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.43181 samples/s/p 1:51:00 } +2024-07-25 23:21:27,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 355/ 1625], loss: 1.153, per_step_time: 1469ms, lr: 7.3169754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:27,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.44417 samples/s/p 1:50:41 } +2024-07-25 23:21:30,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 357/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 7.311836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:30,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.43462 samples/s/p 1:50:50 } +2024-07-25 23:21:33,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 359/ 1625], loss: 1.053, per_step_time: 1475ms, lr: 7.3066926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:33,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.42025 samples/s/p 1:51:05 } +2024-07-25 23:21:36,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 361/ 1625], loss: 1.032, per_step_time: 1470ms, lr: 7.3015535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:36,719 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.44081 samples/s/p 1:50:37 } +2024-07-25 23:21:39,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 363/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 7.296419e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:39,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.43705 samples/s/p 1:50:38 } +2024-07-25 23:21:42,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 365/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 7.29128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:42,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.43600 samples/s/p 1:50:37 } +2024-07-25 23:21:45,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 367/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 7.2861453e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:45,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43901 samples/s/p 1:50:30 } +2024-07-25 23:21:48,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 369/ 1625], loss: 1.043, per_step_time: 1470ms, lr: 7.2810158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:48,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43908 samples/s/p 1:50:27 } +2024-07-25 23:21:51,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 371/ 1625], loss: 1.237, per_step_time: 1469ms, lr: 7.275881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:51,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
72.3% |████████████████████████████████████ | 5.44356 samples/s/p 1:50:19 } +2024-07-25 23:21:54,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 373/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 7.2707544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:54,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43647 samples/s/p 1:50:24 } +2024-07-25 23:21:57,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 375/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 7.2656258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:57,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43320 samples/s/p 1:50:25 } +2024-07-25 23:22:00,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 377/ 1625], loss: 1.169, per_step_time: 1469ms, lr: 7.2604957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:00,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.44326 samples/s/p 1:50:10 } +2024-07-25 23:22:03,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 379/ 1625], loss: 1.279, per_step_time: 1472ms, lr: 7.255374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:03,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43273 samples/s/p 1:50:20 } +2024-07-25 23:22:06,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 381/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 7.25025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:06,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43340 
samples/s/p 1:50:16 } +2024-07-25 23:22:09,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 383/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 7.245127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:09,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43727 samples/s/p 1:50:09 } +2024-07-25 23:22:12,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 385/ 1625], loss: 1.039, per_step_time: 1472ms, lr: 7.2400067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:12,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43401 samples/s/p 1:50:10 } +2024-07-25 23:22:15,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 387/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 7.2348876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:15,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43243 samples/s/p 1:50:09 } +2024-07-25 23:22:18,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 389/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 7.2297703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:18,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43975 samples/s/p 1:49:57 } +2024-07-25 23:22:20,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 391/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 7.2246526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:20,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43784 samples/s/p 1:49:56 } +2024-07-25 23:22:23,922 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 393/ 1625], loss: 1.149, per_step_time: 1473ms, lr: 7.219539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:23,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.42838 samples/s/p 1:50:05 } +2024-07-25 23:22:26,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 395/ 1625], loss: 0.985, per_step_time: 1471ms, lr: 7.214425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:26,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43531 samples/s/p 1:49:53 } +2024-07-25 23:22:29,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 397/ 1625], loss: 1.323, per_step_time: 1471ms, lr: 7.209314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:29,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43659 samples/s/p 1:49:49 } +2024-07-25 23:22:32,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 399/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 7.2042035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:32,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43378 samples/s/p 1:49:49 } +2024-07-25 23:22:35,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 401/ 1625], loss: 1.206, per_step_time: 1474ms, lr: 7.199098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:35,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.42429 samples/s/p 1:49:58 } +2024-07-25 23:22:38,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 8/ 10], step:[ 403/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 7.1939876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:38,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43138 samples/s/p 1:49:46 } +2024-07-25 23:22:41,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 405/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 7.1888826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:41,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43847 samples/s/p 1:49:35 } +2024-07-25 23:22:44,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 407/ 1625], loss: 1.280, per_step_time: 1471ms, lr: 7.183781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:44,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43692 samples/s/p 1:49:34 } +2024-07-25 23:22:47,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 409/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 7.1786762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:47,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43178 samples/s/p 1:49:37 } +2024-07-25 23:22:50,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 411/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 7.1735753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:50,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43607 samples/s/p 1:49:29 } +2024-07-25 23:22:53,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 413/ 1625], loss: 1.243, 
per_step_time: 1470ms, lr: 7.168479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:53,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.44013 samples/s/p 1:49:21 } +2024-07-25 23:22:56,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 415/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 7.163378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:56,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43701 samples/s/p 1:49:22 } +2024-07-25 23:22:59,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 417/ 1625], loss: 1.249, per_step_time: 1470ms, lr: 7.158285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:59,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.44008 samples/s/p 1:49:15 } +2024-07-25 23:23:02,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 419/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 7.15319e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:02,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43345 samples/s/p 1:49:20 } +2024-07-25 23:23:05,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 421/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 7.148094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:05,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43522 samples/s/p 1:49:15 } +2024-07-25 23:23:08,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 423/ 1625], loss: 1.299, per_step_time: 1470ms, lr: 7.1430045e-06, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 23:23:08,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43956 samples/s/p 1:49:07 } +2024-07-25 23:23:11,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 425/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 7.137915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:11,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.44054 samples/s/p 1:49:03 } +2024-07-25 23:23:14,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 427/ 1625], loss: 1.171, per_step_time: 1470ms, lr: 7.1328236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:14,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43862 samples/s/p 1:49:02 } +2024-07-25 23:23:17,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 429/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 7.127739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:17,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43836 samples/s/p 1:49:00 } +2024-07-25 23:23:19,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 431/ 1625], loss: 1.294, per_step_time: 1473ms, lr: 7.1226536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:19,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.42914 samples/s/p 1:49:08 } +2024-07-25 23:23:22,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 433/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 7.117569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:22,934 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.43672 samples/s/p 1:48:56 } +2024-07-25 23:23:25,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 435/ 1625], loss: 1.017, per_step_time: 1471ms, lr: 7.1124873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:25,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.43821 samples/s/p 1:48:51 } +2024-07-25 23:23:28,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 437/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 7.1074064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:28,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.43789 samples/s/p 1:48:48 } +2024-07-25 23:23:31,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 439/ 1625], loss: 1.191, per_step_time: 1469ms, lr: 7.102327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:31,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.44399 samples/s/p 1:48:38 } +2024-07-25 23:23:34,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 441/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 7.097249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:34,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.43621 samples/s/p 1:48:45 } +2024-07-25 23:23:37,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 443/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 7.092173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:37,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 72.7% |████████████████████████████████████ | 5.43606 samples/s/p 1:48:42 } +2024-07-25 23:23:40,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 445/ 1625], loss: 1.092, per_step_time: 1473ms, lr: 7.087101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:40,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.42914 samples/s/p 1:48:47 } +2024-07-25 23:23:43,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 447/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 7.082025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:43,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43648 samples/s/p 1:48:35 } +2024-07-25 23:23:46,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 449/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 7.076954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:46,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43880 samples/s/p 1:48:30 } +2024-07-25 23:23:49,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 451/ 1625], loss: 1.398, per_step_time: 1472ms, lr: 7.0718866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:49,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43320 samples/s/p 1:48:34 } +2024-07-25 23:23:52,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 453/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 7.066815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:52,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43486 
samples/s/p 1:48:29 } +2024-07-25 23:23:55,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 455/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 7.061751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:55,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43613 samples/s/p 1:48:24 } +2024-07-25 23:23:58,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 457/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 7.0566857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:58,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43709 samples/s/p 1:48:20 } +2024-07-25 23:24:01,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 459/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 7.0516194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:01,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43348 samples/s/p 1:48:21 } +2024-07-25 23:24:04,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 461/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 7.0465603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:04,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43344 samples/s/p 1:48:19 } +2024-07-25 23:24:07,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 463/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 7.0415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:07,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43955 samples/s/p 1:48:08 } +2024-07-25 23:24:10,137 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 465/ 1625], loss: 1.064, per_step_time: 1470ms, lr: 7.0364367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:10,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43981 samples/s/p 1:48:05 } +2024-07-25 23:24:13,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 467/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 7.0313827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:13,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43501 samples/s/p 1:48:08 } +2024-07-25 23:24:16,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 469/ 1625], loss: 1.008, per_step_time: 1473ms, lr: 7.026327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:16,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43109 samples/s/p 1:48:10 } +2024-07-25 23:24:18,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 471/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 7.0212723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:18,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43511 samples/s/p 1:48:02 } +2024-07-25 23:24:21,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 473/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 7.016219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:21,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43573 samples/s/p 1:47:58 } +2024-07-25 23:24:24,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 8/ 10], step:[ 475/ 1625], loss: 1.131, per_step_time: 1470ms, lr: 7.0111682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:24,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43979 samples/s/p 1:47:50 } +2024-07-25 23:24:27,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 477/ 1625], loss: 1.088, per_step_time: 1472ms, lr: 7.0061183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:27,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43144 samples/s/p 1:47:57 } +2024-07-25 23:24:30,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 479/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 7.00107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:30,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43358 samples/s/p 1:47:52 } +2024-07-25 23:24:33,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 481/ 1625], loss: 1.001, per_step_time: 1472ms, lr: 6.996024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:33,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43169 samples/s/p 1:47:51 } +2024-07-25 23:24:36,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 483/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 6.9909815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:36,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43231 samples/s/p 1:47:47 } +2024-07-25 23:24:39,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 485/ 1625], loss: 1.283, 
per_step_time: 1473ms, lr: 6.985936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:39,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.42821 samples/s/p 1:47:49 } +2024-07-25 23:24:42,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 487/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 6.980893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:42,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43370 samples/s/p 1:47:40 } +2024-07-25 23:24:45,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 489/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 6.975856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:45,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43577 samples/s/p 1:47:35 } +2024-07-25 23:24:48,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 491/ 1625], loss: 1.066, per_step_time: 1473ms, lr: 6.970814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:48,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.42836 samples/s/p 1:47:40 } +2024-07-25 23:24:51,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 493/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 6.965778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:51,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43440 samples/s/p 1:47:30 } +2024-07-25 23:24:54,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 495/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 6.9607454e-06, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 23:24:54,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.42972 samples/s/p 1:47:33 } +2024-07-25 23:24:57,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 497/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 6.955708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:57,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43320 samples/s/p 1:47:26 } +2024-07-25 23:25:00,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 499/ 1625], loss: 1.284, per_step_time: 1470ms, lr: 6.950678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:00,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43910 samples/s/p 1:47:16 } +2024-07-25 23:25:03,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 501/ 1625], loss: 0.971, per_step_time: 1472ms, lr: 6.9456473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:03,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43202 samples/s/p 1:47:21 } +2024-07-25 23:25:06,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 503/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 6.9406155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:06,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.42961 samples/s/p 1:47:21 } +2024-07-25 23:25:09,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 505/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 6.9355906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:09,175 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43936 samples/s/p 1:47:07 } +2024-07-25 23:25:12,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 507/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 6.9305643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:12,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43300 samples/s/p 1:47:11 } +2024-07-25 23:25:15,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 509/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 6.9255375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:15,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43939 samples/s/p 1:47:01 } +2024-07-25 23:25:18,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 511/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 6.920517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:18,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43517 samples/s/p 1:47:03 } +2024-07-25 23:25:20,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 513/ 1625], loss: 1.141, per_step_time: 1477ms, lr: 6.9154958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:20,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.41596 samples/s/p 1:47:23 } +2024-07-25 23:25:23,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 515/ 1625], loss: 1.279, per_step_time: 1473ms, lr: 6.910476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:23,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 73.2% |████████████████████████████████████ | 5.43027 samples/s/p 1:47:03 } +2024-07-25 23:25:26,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 517/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 6.905458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:26,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43187 samples/s/p 1:46:58 } +2024-07-25 23:25:29,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 519/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 6.900441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:29,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43753 samples/s/p 1:46:48 } +2024-07-25 23:25:32,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 521/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 6.8954255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:32,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43996 samples/s/p 1:46:42 } +2024-07-25 23:25:35,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 523/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 6.890413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:35,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43008 samples/s/p 1:46:51 } +2024-07-25 23:25:38,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 525/ 1625], loss: 1.388, per_step_time: 1472ms, lr: 6.885401e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:38,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43306 
samples/s/p 1:46:45 } +2024-07-25 23:25:41,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 527/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 6.880391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:41,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43130 samples/s/p 1:46:44 } +2024-07-25 23:25:44,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 529/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 6.8753825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:44,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43672 samples/s/p 1:46:35 } +2024-07-25 23:25:47,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 531/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 6.870375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:47,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43136 samples/s/p 1:46:38 } +2024-07-25 23:25:50,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 533/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 6.8653726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:50,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43360 samples/s/p 1:46:32 } +2024-07-25 23:25:53,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 535/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 6.860366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:53,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43607 samples/s/p 1:46:26 } +2024-07-25 23:25:56,406 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 537/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 6.8553636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:56,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43608 samples/s/p 1:46:24 } +2024-07-25 23:25:59,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 539/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 6.8503664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:59,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43267 samples/s/p 1:46:25 } +2024-07-25 23:26:02,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 541/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 6.8453637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:02,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43940 samples/s/p 1:46:14 } +2024-07-25 23:26:05,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 543/ 1625], loss: 1.019, per_step_time: 1470ms, lr: 6.840369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:05,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43884 samples/s/p 1:46:11 } +2024-07-25 23:26:08,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 545/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 6.835374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:08,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43625 samples/s/p 1:46:12 } +2024-07-25 23:26:11,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 8/ 10], step:[ 547/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 6.8303757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:11,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43169 samples/s/p 1:46:14 } +2024-07-25 23:26:14,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 549/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 6.825386e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:14,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43664 samples/s/p 1:46:05 } +2024-07-25 23:26:17,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 551/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 6.8203954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:17,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43474 samples/s/p 1:46:04 } +2024-07-25 23:26:20,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 553/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 6.815403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:20,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43532 samples/s/p 1:46:01 } +2024-07-25 23:26:22,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 555/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 6.810418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:22,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43699 samples/s/p 1:45:56 } +2024-07-25 23:26:25,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 557/ 1625], loss: 1.147, 
per_step_time: 1471ms, lr: 6.8054314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:25,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43825 samples/s/p 1:45:52 } +2024-07-25 23:26:28,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 559/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 6.800447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:28,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43216 samples/s/p 1:45:56 } +2024-07-25 23:26:31,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 561/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 6.795464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:31,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43039 samples/s/p 1:45:55 } +2024-07-25 23:26:34,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 563/ 1625], loss: 1.001, per_step_time: 1471ms, lr: 6.790483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:34,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43531 samples/s/p 1:45:46 } +2024-07-25 23:26:37,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 565/ 1625], loss: 1.010, per_step_time: 1472ms, lr: 6.785503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:37,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43399 samples/s/p 1:45:45 } +2024-07-25 23:26:40,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 567/ 1625], loss: 1.275, per_step_time: 1473ms, lr: 6.780525e-06, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 23:26:40,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43053 samples/s/p 1:45:46 } +2024-07-25 23:26:43,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 569/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 6.7755473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:43,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43314 samples/s/p 1:45:40 } +2024-07-25 23:26:46,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 571/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 6.770573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:46,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43350 samples/s/p 1:45:36 } +2024-07-25 23:26:49,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 573/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 6.7655997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:49,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43566 samples/s/p 1:45:31 } +2024-07-25 23:26:52,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 575/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 6.7606275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:52,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43548 samples/s/p 1:45:28 } +2024-07-25 23:26:55,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 577/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 6.755657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:55,430 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43532 samples/s/p 1:45:26 } +2024-07-25 23:26:58,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 579/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 6.7506894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:58,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43491 samples/s/p 1:45:23 } +2024-07-25 23:27:01,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 581/ 1625], loss: 1.042, per_step_time: 1472ms, lr: 6.7457217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:01,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43146 samples/s/p 1:45:24 } +2024-07-25 23:27:04,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 583/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 6.74076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:04,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.42925 samples/s/p 1:45:24 } +2024-07-25 23:27:07,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 585/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 6.735793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:07,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43508 samples/s/p 1:45:14 } +2024-07-25 23:27:10,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 587/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 6.730834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:10,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
73.6% |████████████████████████████████████ | 5.43513 samples/s/p 1:45:11 } +2024-07-25 23:27:13,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 589/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 6.725873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:13,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43235 samples/s/p 1:45:11 } +2024-07-25 23:27:16,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 591/ 1625], loss: 1.129, per_step_time: 1482ms, lr: 6.720911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:16,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.39664 samples/s/p 1:45:50 } +2024-07-25 23:27:19,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 593/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 6.715957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:19,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43569 samples/s/p 1:45:02 } +2024-07-25 23:27:22,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 595/ 1625], loss: 0.980, per_step_time: 1471ms, lr: 6.7110013e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:22,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43498 samples/s/p 1:44:59 } +2024-07-25 23:27:24,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 597/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 6.7060473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:24,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43408 
samples/s/p 1:44:58 } +2024-07-25 23:27:27,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 599/ 1625], loss: 1.117, per_step_time: 1470ms, lr: 6.701095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:27,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43957 samples/s/p 1:44:48 } +2024-07-25 23:27:30,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 601/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 6.6961447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:30,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43847 samples/s/p 1:44:47 } +2024-07-25 23:27:33,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 603/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 6.691195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:33,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43815 samples/s/p 1:44:44 } +2024-07-25 23:27:36,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 605/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 6.686248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:36,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43720 samples/s/p 1:44:42 } +2024-07-25 23:27:39,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 607/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 6.681302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:39,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43684 samples/s/p 1:44:40 } +2024-07-25 23:27:42,669 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 609/ 1625], loss: 1.108, per_step_time: 1474ms, lr: 6.6763573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:42,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.42627 samples/s/p 1:44:49 } +2024-07-25 23:27:45,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 611/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 6.6714156e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:45,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.44064 samples/s/p 1:44:29 } +2024-07-25 23:27:48,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 613/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 6.6664743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:48,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43613 samples/s/p 1:44:32 } +2024-07-25 23:27:51,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 615/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 6.661535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:51,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43690 samples/s/p 1:44:28 } +2024-07-25 23:27:54,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 617/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 6.6565976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:54,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43670 samples/s/p 1:44:25 } +2024-07-25 23:27:57,420 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 8/ 10], step:[ 619/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 6.651661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:57,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43274 samples/s/p 1:44:27 } +2024-07-25 23:28:00,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 621/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 6.646727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:00,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43381 samples/s/p 1:44:23 } +2024-07-25 23:28:03,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 623/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 6.6417933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:03,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43451 samples/s/p 1:44:19 } +2024-07-25 23:28:06,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 625/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 6.6368652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:06,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43821 samples/s/p 1:44:12 } +2024-07-25 23:28:09,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 627/ 1625], loss: 1.269, per_step_time: 1475ms, lr: 6.631933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:09,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.42302 samples/s/p 1:44:26 } +2024-07-25 23:28:12,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 629/ 1625], loss: 1.024, 
per_step_time: 1471ms, lr: 6.627005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:12,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43803 samples/s/p 1:44:06 } +2024-07-25 23:28:15,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 631/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 6.6220814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:15,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43584 samples/s/p 1:44:05 } +2024-07-25 23:28:18,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 633/ 1625], loss: 1.245, per_step_time: 1473ms, lr: 6.6171565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:18,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43077 samples/s/p 1:44:08 } +2024-07-25 23:28:21,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 635/ 1625], loss: 1.020, per_step_time: 1472ms, lr: 6.612231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:21,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43350 samples/s/p 1:44:02 } +2024-07-25 23:28:23,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 637/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 6.6073126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:23,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43517 samples/s/p 1:43:57 } +2024-07-25 23:28:26,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 639/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 6.602392e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 23:28:26,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43587 samples/s/p 1:43:54 } +2024-07-25 23:28:29,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 641/ 1625], loss: 1.117, per_step_time: 1473ms, lr: 6.5974746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:29,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.42995 samples/s/p 1:43:57 } +2024-07-25 23:28:32,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 643/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 6.592558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:32,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.42943 samples/s/p 1:43:55 } +2024-07-25 23:28:35,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 645/ 1625], loss: 0.951, per_step_time: 1472ms, lr: 6.587644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:35,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.43131 samples/s/p 1:43:50 } +2024-07-25 23:28:38,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 647/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 6.5827303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:38,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.43515 samples/s/p 1:43:43 } +2024-07-25 23:28:41,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 649/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 6.5778186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:41,699 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.43502 samples/s/p 1:43:40 } +2024-07-25 23:28:44,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 651/ 1625], loss: 1.034, per_step_time: 1473ms, lr: 6.5729087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:44,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.43022 samples/s/p 1:43:42 } +2024-07-25 23:28:47,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 653/ 1625], loss: 1.045, per_step_time: 1471ms, lr: 6.5680006e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:47,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.43708 samples/s/p 1:43:32 } +2024-07-25 23:28:50,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 655/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 6.5630943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:50,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.43979 samples/s/p 1:43:26 } +2024-07-25 23:28:53,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 657/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 6.5581894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:53,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.43709 samples/s/p 1:43:26 } +2024-07-25 23:28:56,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 659/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 6.5532854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:56,451 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 74.1% |█████████████████████████████████████ | 5.43637 samples/s/p 1:43:24 } +2024-07-25 23:28:59,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 661/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 6.548384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:59,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43224 samples/s/p 1:43:25 } +2024-07-25 23:29:02,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 663/ 1625], loss: 1.387, per_step_time: 1473ms, lr: 6.543484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:02,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43040 samples/s/p 1:43:25 } +2024-07-25 23:29:05,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 665/ 1625], loss: 1.244, per_step_time: 1471ms, lr: 6.538586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:05,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43511 samples/s/p 1:43:16 } +2024-07-25 23:29:08,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 667/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 6.533689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:08,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43217 samples/s/p 1:43:17 } +2024-07-25 23:29:11,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 669/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 6.5287973e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:11,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 
5.43643 samples/s/p 1:43:09 } +2024-07-25 23:29:14,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 671/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 6.5239014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:14,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43456 samples/s/p 1:43:08 } +2024-07-25 23:29:17,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 673/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 6.5190097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:17,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43136 samples/s/p 1:43:09 } +2024-07-25 23:29:20,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 675/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 6.514122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:20,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43543 samples/s/p 1:43:01 } +2024-07-25 23:29:23,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 677/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 6.5092313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:23,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43677 samples/s/p 1:42:57 } +2024-07-25 23:29:25,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 679/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 6.5043446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:25,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43665 samples/s/p 1:42:54 } +2024-07-25 23:29:28,918 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 681/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 6.4994624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:28,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43204 samples/s/p 1:42:56 } +2024-07-25 23:29:31,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 683/ 1625], loss: 1.231, per_step_time: 1469ms, lr: 6.4945793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:31,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.44238 samples/s/p 1:42:42 } +2024-07-25 23:29:34,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 685/ 1625], loss: 1.049, per_step_time: 1472ms, lr: 6.489697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:34,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43128 samples/s/p 1:42:51 } +2024-07-25 23:29:37,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 687/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 6.4848173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:37,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43310 samples/s/p 1:42:46 } +2024-07-25 23:29:40,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 689/ 1625], loss: 1.051, per_step_time: 1470ms, lr: 6.4799387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:40,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.44084 samples/s/p 1:42:34 } +2024-07-25 23:29:43,665 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 691/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 6.4750616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:43,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.44062 samples/s/p 1:42:32 } +2024-07-25 23:29:46,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 693/ 1625], loss: 1.130, per_step_time: 1469ms, lr: 6.470187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:46,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.44240 samples/s/p 1:42:27 } +2024-07-25 23:29:49,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 695/ 1625], loss: 1.346, per_step_time: 1472ms, lr: 6.4653136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:49,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.43419 samples/s/p 1:42:33 } +2024-07-25 23:29:52,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 697/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 6.4604415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:52,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.42763 samples/s/p 1:42:38 } +2024-07-25 23:29:55,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 699/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 6.4555716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:55,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.43424 samples/s/p 1:42:27 } +2024-07-25 23:29:58,421 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 8/ 10], step:[ 701/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 6.450704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:58,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.43554 samples/s/p 1:42:23 } +2024-07-25 23:30:01,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 703/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 6.4458363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:01,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.42876 samples/s/p 1:42:28 } +2024-07-25 23:30:04,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 705/ 1625], loss: 1.295, per_step_time: 1473ms, lr: 6.4409714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:04,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.42821 samples/s/p 1:42:25 } +2024-07-25 23:30:07,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 707/ 1625], loss: 1.114, per_step_time: 1473ms, lr: 6.4361084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:07,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.42864 samples/s/p 1:42:22 } +2024-07-25 23:30:10,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 709/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 6.4312467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:10,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43724 samples/s/p 1:42:09 } +2024-07-25 23:30:13,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 711/ 1625], loss: 
1.177, per_step_time: 1470ms, lr: 6.426387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:13,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.44101 samples/s/p 1:42:02 } +2024-07-25 23:30:16,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 713/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 6.4215315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:16,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43516 samples/s/p 1:42:06 } +2024-07-25 23:30:19,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 715/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 6.4166716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:19,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43395 samples/s/p 1:42:04 } +2024-07-25 23:30:22,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 717/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 6.4118162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:22,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43477 samples/s/p 1:42:00 } +2024-07-25 23:30:24,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 719/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 6.406966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:24,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43591 samples/s/p 1:41:56 } +2024-07-25 23:30:27,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 721/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 6.4021115e-06, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:27,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.42977 samples/s/p 1:42:00 } +2024-07-25 23:30:30,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 723/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 6.397261e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:30,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43507 samples/s/p 1:41:51 } +2024-07-25 23:30:33,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 725/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 6.3924163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:33,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43504 samples/s/p 1:41:48 } +2024-07-25 23:30:36,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 727/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 6.387567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:36,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43155 samples/s/p 1:41:49 } +2024-07-25 23:30:39,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 729/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 6.382725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:39,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43323 samples/s/p 1:41:44 } +2024-07-25 23:30:42,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 731/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 6.3778816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:30:42,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43250 samples/s/p 1:41:42 } +2024-07-25 23:30:45,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 733/ 1625], loss: 1.059, per_step_time: 1469ms, lr: 6.373039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:45,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.44363 samples/s/p 1:41:27 } +2024-07-25 23:30:48,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 735/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 6.3682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:48,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43628 samples/s/p 1:41:32 } +2024-07-25 23:30:51,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 737/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 6.363362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:51,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43777 samples/s/p 1:41:27 } +2024-07-25 23:30:54,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 739/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 6.358525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:54,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43720 samples/s/p 1:41:25 } +2024-07-25 23:30:57,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 741/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 6.353691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:57,446 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43771 samples/s/p 1:41:21 } +2024-07-25 23:31:00,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 743/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 6.348857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:00,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43531 samples/s/p 1:41:21 } +2024-07-25 23:31:03,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 745/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 6.3440257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:03,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43686 samples/s/p 1:41:17 } +2024-07-25 23:31:06,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 747/ 1625], loss: 1.055, per_step_time: 1470ms, lr: 6.3391963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:06,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43881 samples/s/p 1:41:11 } +2024-07-25 23:31:09,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 749/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 6.334368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:09,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43788 samples/s/p 1:41:10 } +2024-07-25 23:31:12,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 751/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 6.3295415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:12,194 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 74.6% |█████████████████████████████████████ | 5.43728 samples/s/p 1:41:07 } +2024-07-25 23:31:15,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 753/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 6.324717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:15,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43504 samples/s/p 1:41:07 } +2024-07-25 23:31:18,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 755/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 6.3198936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:18,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43441 samples/s/p 1:41:05 } +2024-07-25 23:31:21,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 757/ 1625], loss: 1.036, per_step_time: 1470ms, lr: 6.3150756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:21,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.44058 samples/s/p 1:40:55 } +2024-07-25 23:31:23,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 759/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 6.3102534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:23,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43625 samples/s/p 1:40:57 } +2024-07-25 23:31:26,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 761/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 6.3054354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:26,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 
5.43893 samples/s/p 1:40:51 } +2024-07-25 23:31:29,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 763/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 6.3006214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:29,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43405 samples/s/p 1:40:53 } +2024-07-25 23:31:32,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 765/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 6.295804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:32,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43301 samples/s/p 1:40:51 } +2024-07-25 23:31:35,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 767/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 6.2909953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:35,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43586 samples/s/p 1:40:45 } +2024-07-25 23:31:38,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 769/ 1625], loss: 1.059, per_step_time: 1475ms, lr: 6.2861827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:38,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.42203 samples/s/p 1:40:58 } +2024-07-25 23:31:41,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 771/ 1625], loss: 1.341, per_step_time: 1471ms, lr: 6.2813715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:41,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43614 samples/s/p 1:40:39 } +2024-07-25 23:31:44,656 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 773/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 6.276566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:44,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43645 samples/s/p 1:40:36 } +2024-07-25 23:31:47,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 775/ 1625], loss: 0.939, per_step_time: 1470ms, lr: 6.27176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:47,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.44057 samples/s/p 1:40:28 } +2024-07-25 23:31:50,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 777/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 6.2669537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:50,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43490 samples/s/p 1:40:32 } +2024-07-25 23:31:53,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 779/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 6.262154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:53,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43165 samples/s/p 1:40:32 } +2024-07-25 23:31:56,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 781/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 6.2573527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:56,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43444 samples/s/p 1:40:26 } +2024-07-25 23:31:59,403 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 8/ 10], step:[ 783/ 1625], loss: 1.039, per_step_time: 1468ms, lr: 6.2525532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:59,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.44658 samples/s/p 1:40:10 } +2024-07-25 23:32:02,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 785/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 6.2477557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:02,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43678 samples/s/p 1:40:18 } +2024-07-25 23:32:05,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 787/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 6.24296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:05,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43449 samples/s/p 1:40:17 } +2024-07-25 23:32:08,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 789/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 6.238167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:08,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43578 samples/s/p 1:40:13 } +2024-07-25 23:32:11,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 791/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 6.2333734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:11,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43675 samples/s/p 1:40:09 } +2024-07-25 23:32:14,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 793/ 1625], loss: 1.232, 
per_step_time: 1472ms, lr: 6.228583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:14,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43331 samples/s/p 1:40:10 } +2024-07-25 23:32:17,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 795/ 1625], loss: 0.987, per_step_time: 1470ms, lr: 6.2237973e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:17,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43938 samples/s/p 1:40:00 } +2024-07-25 23:32:20,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 797/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 6.219008e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:20,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43024 samples/s/p 1:40:07 } +2024-07-25 23:32:23,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 799/ 1625], loss: 1.374, per_step_time: 1471ms, lr: 6.214222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:23,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43677 samples/s/p 1:39:57 } +2024-07-25 23:32:25,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 801/ 1625], loss: 1.252, per_step_time: 1470ms, lr: 6.2094405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:25,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.44165 samples/s/p 1:39:49 } +2024-07-25 23:32:28,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 803/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 6.2046556e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 23:32:28,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.42887 samples/s/p 1:40:00 } +2024-07-25 23:32:31,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 805/ 1625], loss: 1.395, per_step_time: 1471ms, lr: 6.1998753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:31,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43744 samples/s/p 1:39:48 } +2024-07-25 23:32:34,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 807/ 1625], loss: 1.243, per_step_time: 1474ms, lr: 6.1950996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:34,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.42714 samples/s/p 1:39:56 } +2024-07-25 23:32:37,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 809/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 6.19032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:37,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43902 samples/s/p 1:39:40 } +2024-07-25 23:32:40,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 811/ 1625], loss: 0.945, per_step_time: 1472ms, lr: 6.1855476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:40,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43263 samples/s/p 1:39:44 } +2024-07-25 23:32:43,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 813/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 6.180774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:43,667 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43719 samples/s/p 1:39:36 } +2024-07-25 23:32:46,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 815/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 6.1759993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:46,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43305 samples/s/p 1:39:38 } +2024-07-25 23:32:49,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 817/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 6.1712317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:49,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43547 samples/s/p 1:39:32 } +2024-07-25 23:32:52,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 819/ 1625], loss: 1.368, per_step_time: 1471ms, lr: 6.1664637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:52,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43804 samples/s/p 1:39:26 } +2024-07-25 23:32:55,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 821/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 6.1616947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:55,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.43884 samples/s/p 1:39:23 } +2024-07-25 23:32:58,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 823/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 6.1569326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:58,419 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 75.1% |█████████████████████████████████████ | 5.43642 samples/s/p 1:39:22 } +2024-07-25 23:33:01,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 825/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 6.1521696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:01,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.44020 samples/s/p 1:39:15 } +2024-07-25 23:33:04,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 827/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 6.1474075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:04,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.43407 samples/s/p 1:39:19 } +2024-07-25 23:33:07,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 829/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 6.142649e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:07,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.43327 samples/s/p 1:39:17 } +2024-07-25 23:33:10,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 831/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 6.13789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:10,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.43758 samples/s/p 1:39:09 } +2024-07-25 23:33:13,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 833/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 6.1331343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:13,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 
5.43117 samples/s/p 1:39:13 } +2024-07-25 23:33:16,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 835/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 6.128379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:16,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.44103 samples/s/p 1:39:00 } +2024-07-25 23:33:19,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 837/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 6.1236265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:19,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43575 samples/s/p 1:39:02 } +2024-07-25 23:33:22,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 839/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 6.118878e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:22,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43531 samples/s/p 1:39:00 } +2024-07-25 23:33:24,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 841/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 6.1141263e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:24,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43191 samples/s/p 1:39:01 } +2024-07-25 23:33:27,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 843/ 1625], loss: 0.900, per_step_time: 1471ms, lr: 6.109379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:27,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43549 samples/s/p 1:38:54 } +2024-07-25 23:33:30,877 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 845/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 6.1046358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:30,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43463 samples/s/p 1:38:52 } +2024-07-25 23:33:33,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 847/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 6.099888e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:33,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43163 samples/s/p 1:38:52 } +2024-07-25 23:33:36,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 849/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 6.095147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:36,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43183 samples/s/p 1:38:49 } +2024-07-25 23:33:39,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 851/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 6.090408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:39,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43520 samples/s/p 1:38:42 } +2024-07-25 23:33:42,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 853/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 6.085667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:42,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.44180 samples/s/p 1:38:32 } +2024-07-25 23:33:45,629 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 8/ 10], step:[ 855/ 1625], loss: 1.099, per_step_time: 1470ms, lr: 6.0809325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:45,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43942 samples/s/p 1:38:32 } +2024-07-25 23:33:48,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 857/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 6.076197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:48,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43581 samples/s/p 1:38:33 } +2024-07-25 23:33:51,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 859/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 6.071461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:51,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43892 samples/s/p 1:38:27 } +2024-07-25 23:33:54,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 861/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 6.0667317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:54,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43381 samples/s/p 1:38:29 } +2024-07-25 23:33:57,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 863/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 6.0620005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:57,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43416 samples/s/p 1:38:26 } +2024-07-25 23:34:00,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 865/ 1625], loss: 1.108, 
per_step_time: 1471ms, lr: 6.0572706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:00,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43646 samples/s/p 1:38:20 } +2024-07-25 23:34:03,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 867/ 1625], loss: 1.016, per_step_time: 1469ms, lr: 6.0525454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:03,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.44218 samples/s/p 1:38:11 } +2024-07-25 23:34:06,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 869/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 6.0478205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:06,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43726 samples/s/p 1:38:14 } +2024-07-25 23:34:09,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 871/ 1625], loss: 1.103, per_step_time: 1470ms, lr: 6.0430975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:09,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43940 samples/s/p 1:38:08 } +2024-07-25 23:34:12,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 873/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 6.038376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:12,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43637 samples/s/p 1:38:09 } +2024-07-25 23:34:15,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 875/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 6.033657e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 23:34:15,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43387 samples/s/p 1:38:08 } +2024-07-25 23:34:18,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 877/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 6.028938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:18,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43478 samples/s/p 1:38:05 } +2024-07-25 23:34:21,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 879/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 6.024223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:21,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43371 samples/s/p 1:38:03 } +2024-07-25 23:34:23,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 881/ 1625], loss: 0.951, per_step_time: 1471ms, lr: 6.019508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:23,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43602 samples/s/p 1:37:57 } +2024-07-25 23:34:26,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 883/ 1625], loss: 0.990, per_step_time: 1469ms, lr: 6.0147977e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:26,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.44252 samples/s/p 1:37:47 } +2024-07-25 23:34:29,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 885/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 6.0100842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:29,882 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.42821 samples/s/p 1:38:00 } +2024-07-25 23:34:32,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 887/ 1625], loss: 1.263, per_step_time: 1473ms, lr: 6.005375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:32,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.42805 samples/s/p 1:37:57 } +2024-07-25 23:34:35,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 889/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 6.0006705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:35,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43752 samples/s/p 1:37:44 } +2024-07-25 23:34:38,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 891/ 1625], loss: 1.047, per_step_time: 1473ms, lr: 5.995962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:38,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43045 samples/s/p 1:37:49 } +2024-07-25 23:34:41,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 893/ 1625], loss: 1.084, per_step_time: 1473ms, lr: 5.9912577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:41,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43000 samples/s/p 1:37:46 } +2024-07-25 23:34:44,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 895/ 1625], loss: 1.151, per_step_time: 1473ms, lr: 5.986558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:44,647 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 75.5% |█████████████████████████████████████ | 5.43033 samples/s/p 1:37:43 } +2024-07-25 23:34:47,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 897/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 5.9818544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:47,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43574 samples/s/p 1:37:34 } +2024-07-25 23:34:50,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 899/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 5.9771587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:50,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43324 samples/s/p 1:37:34 } +2024-07-25 23:34:53,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 901/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 5.9724625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:53,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43125 samples/s/p 1:37:33 } +2024-07-25 23:34:56,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 903/ 1625], loss: 1.016, per_step_time: 1471ms, lr: 5.9677636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:56,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43669 samples/s/p 1:37:24 } +2024-07-25 23:34:59,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 905/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 5.963073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:59,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 
5.43429 samples/s/p 1:37:24 } +2024-07-25 23:35:02,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 907/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 5.958381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:02,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43366 samples/s/p 1:37:22 } +2024-07-25 23:35:05,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 909/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 5.9536887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:05,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43537 samples/s/p 1:37:17 } +2024-07-25 23:35:08,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 911/ 1625], loss: 0.999, per_step_time: 1473ms, lr: 5.9490035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:08,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43045 samples/s/p 1:37:19 } +2024-07-25 23:35:11,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 913/ 1625], loss: 1.011, per_step_time: 1474ms, lr: 5.944317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:11,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.42681 samples/s/p 1:37:20 } +2024-07-25 23:35:14,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 915/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 5.9396325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:14,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43440 samples/s/p 1:37:09 } +2024-07-25 23:35:17,113 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 917/ 1625], loss: 1.195, per_step_time: 1469ms, lr: 5.93495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:17,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.44444 samples/s/p 1:36:55 } +2024-07-25 23:35:20,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 919/ 1625], loss: 1.008, per_step_time: 1470ms, lr: 5.930269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:20,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43931 samples/s/p 1:36:58 } +2024-07-25 23:35:23,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 921/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 5.92559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:23,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43555 samples/s/p 1:36:59 } +2024-07-25 23:35:25,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 923/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 5.9209115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:25,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43178 samples/s/p 1:37:00 } +2024-07-25 23:35:28,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 925/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 5.9162358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:28,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43475 samples/s/p 1:36:54 } +2024-07-25 23:35:31,866 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 8/ 10], step:[ 927/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 5.911562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:31,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43695 samples/s/p 1:36:49 } +2024-07-25 23:35:34,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 929/ 1625], loss: 1.176, per_step_time: 1472ms, lr: 5.90689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:34,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43327 samples/s/p 1:36:50 } +2024-07-25 23:35:37,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 931/ 1625], loss: 0.982, per_step_time: 1472ms, lr: 5.902219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:37,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43125 samples/s/p 1:36:49 } +2024-07-25 23:35:40,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 933/ 1625], loss: 1.223, per_step_time: 1474ms, lr: 5.897553e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:40,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.42718 samples/s/p 1:36:50 } +2024-07-25 23:35:43,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 935/ 1625], loss: 1.269, per_step_time: 1470ms, lr: 5.8928836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:43,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43964 samples/s/p 1:36:34 } +2024-07-25 23:35:46,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 937/ 1625], loss: 1.066, 
per_step_time: 1471ms, lr: 5.8882206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:46,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43738 samples/s/p 1:36:33 } +2024-07-25 23:35:49,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 939/ 1625], loss: 1.164, per_step_time: 1473ms, lr: 5.883558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:49,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.42994 samples/s/p 1:36:38 } +2024-07-25 23:35:52,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 941/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 5.8788933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:52,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43212 samples/s/p 1:36:33 } +2024-07-25 23:35:55,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 943/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 5.8742357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:55,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43683 samples/s/p 1:36:25 } +2024-07-25 23:35:58,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 945/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 5.8695773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:58,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43266 samples/s/p 1:36:27 } +2024-07-25 23:36:01,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 947/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 5.8649184e-06, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 23:36:01,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43674 samples/s/p 1:36:19 } +2024-07-25 23:36:04,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 949/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 5.8602677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:04,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43371 samples/s/p 1:36:20 } +2024-07-25 23:36:07,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 951/ 1625], loss: 1.111, per_step_time: 1471ms, lr: 5.8556143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:07,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43514 samples/s/p 1:36:15 } +2024-07-25 23:36:10,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 953/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 5.8509636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:10,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43670 samples/s/p 1:36:11 } +2024-07-25 23:36:13,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 955/ 1625], loss: 1.033, per_step_time: 1470ms, lr: 5.8463143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:13,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43972 samples/s/p 1:36:05 } +2024-07-25 23:36:16,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 957/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 5.8416667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:16,137 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43225 samples/s/p 1:36:09 } +2024-07-25 23:36:19,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 959/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 5.8370215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:19,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43284 samples/s/p 1:36:06 } +2024-07-25 23:36:22,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 961/ 1625], loss: 1.304, per_step_time: 1472ms, lr: 5.8323767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:22,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43129 samples/s/p 1:36:05 } +2024-07-25 23:36:24,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 963/ 1625], loss: 1.170, per_step_time: 1473ms, lr: 5.8277355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:24,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.42752 samples/s/p 1:36:06 } +2024-07-25 23:36:27,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 965/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 5.8230953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:27,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.42985 samples/s/p 1:36:00 } +2024-07-25 23:36:30,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 967/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 5.818457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:30,903 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.43272 samples/s/p 1:35:54 } +2024-07-25 23:36:33,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 969/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 5.8138203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:33,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.43958 samples/s/p 1:35:44 } +2024-07-25 23:36:36,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 971/ 1625], loss: 1.117, per_step_time: 1470ms, lr: 5.809185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:36,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.44045 samples/s/p 1:35:40 } +2024-07-25 23:36:39,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 973/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 5.8045516e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:39,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.43758 samples/s/p 1:35:40 } +2024-07-25 23:36:42,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 975/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 5.799921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:42,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.43312 samples/s/p 1:35:42 } +2024-07-25 23:36:45,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 977/ 1625], loss: 1.011, per_step_time: 1472ms, lr: 5.795291e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:45,653 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 76.0% |██████████████████████████████████████ | 5.43401 samples/s/p 1:35:38 } +2024-07-25 23:36:48,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 979/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 5.790663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:48,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.43566 samples/s/p 1:35:33 } +2024-07-25 23:36:51,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 981/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 5.78604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:51,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.43414 samples/s/p 1:35:32 } +2024-07-25 23:36:54,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 983/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 5.7814163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:54,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.43627 samples/s/p 1:35:27 } +2024-07-25 23:36:57,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 985/ 1625], loss: 1.071, per_step_time: 1470ms, lr: 5.7767907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:57,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.44181 samples/s/p 1:35:18 } +2024-07-25 23:37:00,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 987/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 5.7721727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:00,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ 
| 5.43657 samples/s/p 1:35:21 } +2024-07-25 23:37:03,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 989/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 5.7675543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:03,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.43631 samples/s/p 1:35:18 } +2024-07-25 23:37:06,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 991/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 5.7629345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:06,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.43696 samples/s/p 1:35:14 } +2024-07-25 23:37:09,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 993/ 1625], loss: 1.059, per_step_time: 1472ms, lr: 5.758322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:09,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.43290 samples/s/p 1:35:16 } +2024-07-25 23:37:12,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 995/ 1625], loss: 1.058, per_step_time: 1469ms, lr: 5.7537086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:12,200 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.44365 samples/s/p 1:35:02 } +2024-07-25 23:37:15,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 997/ 1625], loss: 1.046, per_step_time: 1473ms, lr: 5.749097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:15,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.42745 samples/s/p 1:35:16 } +2024-07-25 
23:37:18,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 999/ 1625], loss: 1.326, per_step_time: 1472ms, lr: 5.7444868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:18,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.43446 samples/s/p 1:35:05 } +2024-07-25 23:37:21,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1001/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 5.7398797e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:21,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.44172 samples/s/p 1:34:55 } +2024-07-25 23:37:24,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1003/ 1625], loss: 0.999, per_step_time: 1470ms, lr: 5.735274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:24,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.44125 samples/s/p 1:34:52 } +2024-07-25 23:37:26,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1005/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 5.730669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:26,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.43785 samples/s/p 1:34:53 } +2024-07-25 23:37:29,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1007/ 1625], loss: 1.062, per_step_time: 1472ms, lr: 5.726067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:29,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.43372 samples/s/p 1:34:54 } +2024-07-25 23:37:32,857 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1009/ 1625], loss: 1.149, per_step_time: 1473ms, lr: 5.7214656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:32,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.42960 samples/s/p 1:34:56 } +2024-07-25 23:37:35,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1011/ 1625], loss: 1.017, per_step_time: 1469ms, lr: 5.716867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:35,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.44255 samples/s/p 1:34:39 } +2024-07-25 23:37:38,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1013/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 5.7122697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:38,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.43555 samples/s/p 1:34:44 } +2024-07-25 23:37:41,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1015/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 5.7076745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:41,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.43642 samples/s/p 1:34:40 } +2024-07-25 23:37:44,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1017/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 5.7030807e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:44,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43343 samples/s/p 1:34:40 } +2024-07-25 23:37:47,609 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1019/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 5.698489e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:47,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43210 samples/s/p 1:34:38 } +2024-07-25 23:37:50,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1021/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 5.693899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:50,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43699 samples/s/p 1:34:30 } +2024-07-25 23:37:53,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1023/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 5.6893105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:53,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43626 samples/s/p 1:34:28 } +2024-07-25 23:37:56,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1025/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 5.684727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:56,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43469 samples/s/p 1:34:27 } +2024-07-25 23:37:59,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1027/ 1625], loss: 0.913, per_step_time: 1474ms, lr: 5.6801396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:59,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.42432 samples/s/p 1:34:35 } +2024-07-25 23:38:02,372 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1029/ 1625], loss: 1.008, per_step_time: 1473ms, lr: 5.675557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:02,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.42818 samples/s/p 1:34:28 } +2024-07-25 23:38:05,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1031/ 1625], loss: 1.226, per_step_time: 1474ms, lr: 5.670979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:05,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.42645 samples/s/p 1:34:27 } +2024-07-25 23:38:08,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1033/ 1625], loss: 1.104, per_step_time: 1470ms, lr: 5.6663994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:08,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43858 samples/s/p 1:34:11 } +2024-07-25 23:38:11,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1035/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 5.6618196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:11,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43612 samples/s/p 1:34:11 } +2024-07-25 23:38:14,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1037/ 1625], loss: 1.022, per_step_time: 1470ms, lr: 5.6572476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:14,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.44103 samples/s/p 1:34:03 } +2024-07-25 23:38:17,128 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1039/ 1625], loss: 1.094, per_step_time: 1473ms, lr: 5.652674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:17,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43000 samples/s/p 1:34:11 } +2024-07-25 23:38:20,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1041/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 5.648102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:20,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43797 samples/s/p 1:34:00 } +2024-07-25 23:38:23,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1043/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 5.643532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:23,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43690 samples/s/p 1:33:58 } +2024-07-25 23:38:25,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1045/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 5.6389636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:25,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43614 samples/s/p 1:33:56 } +2024-07-25 23:38:28,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1047/ 1625], loss: 0.976, per_step_time: 1471ms, lr: 5.6343974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:28,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43573 samples/s/p 1:33:53 } +2024-07-25 23:38:31,879 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1049/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 5.629833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:31,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43453 samples/s/p 1:33:52 } +2024-07-25 23:38:34,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1051/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 5.6252698e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:34,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43508 samples/s/p 1:33:48 } +2024-07-25 23:38:37,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1053/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 5.620709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:37,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43578 samples/s/p 1:33:44 } +2024-07-25 23:38:40,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1055/ 1625], loss: 1.000, per_step_time: 1471ms, lr: 5.616151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:40,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43718 samples/s/p 1:33:40 } +2024-07-25 23:38:43,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1057/ 1625], loss: 0.878, per_step_time: 1472ms, lr: 5.6115937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:43,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43202 samples/s/p 1:33:42 } +2024-07-25 23:38:46,635 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1059/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 5.607038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:46,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43477 samples/s/p 1:33:37 } +2024-07-25 23:38:49,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1061/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 5.602484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:49,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43644 samples/s/p 1:33:32 } +2024-07-25 23:38:52,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1063/ 1625], loss: 1.260, per_step_time: 1470ms, lr: 5.597932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:52,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43975 samples/s/p 1:33:26 } +2024-07-25 23:38:55,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1065/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 5.593383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:55,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.44054 samples/s/p 1:33:22 } +2024-07-25 23:38:58,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1067/ 1625], loss: 1.397, per_step_time: 1472ms, lr: 5.588834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:58,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.43313 samples/s/p 1:33:27 } +2024-07-25 23:39:01,395 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1069/ 1625], loss: 1.022, per_step_time: 1476ms, lr: 5.5842916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:01,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.41713 samples/s/p 1:33:40 } +2024-07-25 23:39:04,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1071/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 5.5797436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:04,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.43711 samples/s/p 1:33:17 } +2024-07-25 23:39:07,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1073/ 1625], loss: 1.202, per_step_time: 1473ms, lr: 5.575201e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:07,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.43063 samples/s/p 1:33:20 } +2024-07-25 23:39:10,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1075/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 5.570663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:10,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.43536 samples/s/p 1:33:13 } +2024-07-25 23:39:13,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1077/ 1625], loss: 1.080, per_step_time: 1470ms, lr: 5.566121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:13,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.44015 samples/s/p 1:33:05 } +2024-07-25 23:39:16,150 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1079/ 1625], loss: 1.103, per_step_time: 1473ms, lr: 5.5615847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:16,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.42976 samples/s/p 1:33:12 } +2024-07-25 23:39:19,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1081/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 5.5570517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:19,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.44010 samples/s/p 1:32:59 } +2024-07-25 23:39:22,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1083/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 5.5525184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:22,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43466 samples/s/p 1:33:01 } +2024-07-25 23:39:24,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1085/ 1625], loss: 0.930, per_step_time: 1469ms, lr: 5.5479873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:24,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.44224 samples/s/p 1:32:51 } +2024-07-25 23:39:27,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1087/ 1625], loss: 0.904, per_step_time: 1471ms, lr: 5.5434575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:27,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43692 samples/s/p 1:32:53 } +2024-07-25 23:39:30,896 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1089/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 5.5389296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:30,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43810 samples/s/p 1:32:49 } +2024-07-25 23:39:33,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1091/ 1625], loss: 1.421, per_step_time: 1471ms, lr: 5.5344026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:33,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43589 samples/s/p 1:32:48 } +2024-07-25 23:39:36,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1093/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 5.5298788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:36,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43195 samples/s/p 1:32:50 } +2024-07-25 23:39:39,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1095/ 1625], loss: 1.285, per_step_time: 1471ms, lr: 5.5253563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:39,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43693 samples/s/p 1:32:41 } +2024-07-25 23:39:42,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1097/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 5.520836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:42,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43732 samples/s/p 1:32:38 } +2024-07-25 23:39:45,650 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1099/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 5.516317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:45,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43384 samples/s/p 1:32:39 } +2024-07-25 23:39:48,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1101/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 5.5118003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:48,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43115 samples/s/p 1:32:39 } +2024-07-25 23:39:51,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1103/ 1625], loss: 1.177, per_step_time: 1474ms, lr: 5.507285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:51,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.42621 samples/s/p 1:32:41 } +2024-07-25 23:39:54,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1105/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 5.502772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:54,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43485 samples/s/p 1:32:29 } +2024-07-25 23:39:57,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1107/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 5.4982634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:57,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43253 samples/s/p 1:32:28 } +2024-07-25 23:40:00,413 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1109/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 5.493752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:00,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43356 samples/s/p 1:32:24 } +2024-07-25 23:40:03,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1111/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 5.489244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:03,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43818 samples/s/p 1:32:17 } +2024-07-25 23:40:06,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1113/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 5.484741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:06,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43460 samples/s/p 1:32:17 } +2024-07-25 23:40:09,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1115/ 1625], loss: 1.126, per_step_time: 1470ms, lr: 5.4802344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:09,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.44147 samples/s/p 1:32:07 } +2024-07-25 23:40:12,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1117/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 5.475732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:12,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43840 samples/s/p 1:32:08 } +2024-07-25 23:40:15,162 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1119/ 1625], loss: 1.333, per_step_time: 1471ms, lr: 5.471234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:15,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43493 samples/s/p 1:32:08 } +2024-07-25 23:40:18,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1121/ 1625], loss: 0.987, per_step_time: 1472ms, lr: 5.466733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:18,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43371 samples/s/p 1:32:06 } +2024-07-25 23:40:21,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1123/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 5.4622396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:21,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43507 samples/s/p 1:32:02 } +2024-07-25 23:40:24,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1125/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 5.4577445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:24,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.44028 samples/s/p 1:31:54 } +2024-07-25 23:40:26,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1127/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 5.4532497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:26,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43775 samples/s/p 1:31:54 } +2024-07-25 23:40:29,913 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1129/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 5.4487605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:29,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43324 samples/s/p 1:31:55 } +2024-07-25 23:40:32,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1131/ 1625], loss: 1.124, per_step_time: 1473ms, lr: 5.4442717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:32,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43021 samples/s/p 1:31:55 } +2024-07-25 23:40:35,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1133/ 1625], loss: 1.316, per_step_time: 1471ms, lr: 5.439784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:35,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43482 samples/s/p 1:31:48 } +2024-07-25 23:40:38,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1135/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 5.4352986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:38,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43277 samples/s/p 1:31:47 } +2024-07-25 23:40:41,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1137/ 1625], loss: 1.360, per_step_time: 1470ms, lr: 5.430815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:41,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.44085 samples/s/p 1:31:36 } +2024-07-25 23:40:44,672 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1139/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 5.4263337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:44,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43081 samples/s/p 1:31:43 } +2024-07-25 23:40:47,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1141/ 1625], loss: 1.304, per_step_time: 1470ms, lr: 5.4218544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:47,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.44146 samples/s/p 1:31:29 } +2024-07-25 23:40:50,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1143/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 5.4173765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:50,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43810 samples/s/p 1:31:30 } +2024-07-25 23:40:53,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1145/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 5.4129005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:53,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43627 samples/s/p 1:31:29 } +2024-07-25 23:40:56,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1147/ 1625], loss: 1.098, per_step_time: 1475ms, lr: 5.4084253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:56,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.42039 samples/s/p 1:31:42 } +2024-07-25 23:40:59,429 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1149/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 5.4039533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:59,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43479 samples/s/p 1:31:24 } +2024-07-25 23:41:02,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1151/ 1625], loss: 1.111, per_step_time: 1473ms, lr: 5.3994845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:02,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43090 samples/s/p 1:31:25 } +2024-07-25 23:41:05,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1153/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 5.3950143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:05,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43620 samples/s/p 1:31:17 } +2024-07-25 23:41:08,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1155/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 5.390547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:08,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.42882 samples/s/p 1:31:21 } +2024-07-25 23:41:11,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1157/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 5.386085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:11,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43442 samples/s/p 1:31:13 } +2024-07-25 23:41:14,186 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1159/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 5.3816193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:14,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43963 samples/s/p 1:31:05 } +2024-07-25 23:41:17,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1161/ 1625], loss: 1.161, per_step_time: 1470ms, lr: 5.377158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:17,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43921 samples/s/p 1:31:02 } +2024-07-25 23:41:20,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1163/ 1625], loss: 1.136, per_step_time: 1470ms, lr: 5.372701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:20,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43915 samples/s/p 1:30:59 } +2024-07-25 23:41:23,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1165/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 5.368241e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:23,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43375 samples/s/p 1:31:02 } +2024-07-25 23:41:25,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1167/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 5.363788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:25,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43531 samples/s/p 1:30:57 } +2024-07-25 23:41:28,936 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1169/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 5.359334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:28,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43792 samples/s/p 1:30:52 } +2024-07-25 23:41:31,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1171/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 5.3548797e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:31,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43791 samples/s/p 1:30:49 } +2024-07-25 23:41:34,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1173/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 5.350432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:34,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43228 samples/s/p 1:30:51 } +2024-07-25 23:41:37,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1175/ 1625], loss: 1.012, per_step_time: 1472ms, lr: 5.3459844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:37,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43467 samples/s/p 1:30:46 } +2024-07-25 23:41:40,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1177/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 5.341535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:40,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43147 samples/s/p 1:30:46 } +2024-07-25 23:41:43,691 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1179/ 1625], loss: 1.292, per_step_time: 1471ms, lr: 5.3370936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:43,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43686 samples/s/p 1:30:38 } +2024-07-25 23:41:46,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1181/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 5.3326517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:46,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43079 samples/s/p 1:30:41 } +2024-07-25 23:41:49,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1183/ 1625], loss: 1.112, per_step_time: 1474ms, lr: 5.328211e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:49,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.42466 samples/s/p 1:30:44 } +2024-07-25 23:41:52,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1185/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 5.323772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:52,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43818 samples/s/p 1:30:28 } +2024-07-25 23:41:55,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1187/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 5.319335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:55,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43563 samples/s/p 1:30:27 } +2024-07-25 23:41:58,452 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1189/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 5.3149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:58,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43639 samples/s/p 1:30:24 } +2024-07-25 23:42:01,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1191/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 5.3104673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:01,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43205 samples/s/p 1:30:25 } +2024-07-25 23:42:04,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1193/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 5.306036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:04,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43211 samples/s/p 1:30:22 } +2024-07-25 23:42:07,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1195/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 5.301609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:07,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43543 samples/s/p 1:30:16 } +2024-07-25 23:42:10,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1197/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 5.2971795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:10,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43759 samples/s/p 1:30:11 } +2024-07-25 23:42:13,208 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1199/ 1625], loss: 1.058, per_step_time: 1471ms, lr: 5.2927535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:13,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43712 samples/s/p 1:30:08 } +2024-07-25 23:42:16,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1201/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 5.288333e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:16,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.44071 samples/s/p 1:30:02 } +2024-07-25 23:42:19,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1203/ 1625], loss: 1.358, per_step_time: 1473ms, lr: 5.2839086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:19,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43040 samples/s/p 1:30:09 } +2024-07-25 23:42:22,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1205/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 5.2794885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:22,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43679 samples/s/p 1:30:00 } +2024-07-25 23:42:25,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1207/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 5.275073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:25,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43502 samples/s/p 1:29:59 } +2024-07-25 23:42:27,961 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1209/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 5.270654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:27,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43521 samples/s/p 1:29:55 } +2024-07-25 23:42:30,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1211/ 1625], loss: 0.974, per_step_time: 1474ms, lr: 5.266243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:30,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.42422 samples/s/p 1:30:03 } +2024-07-25 23:42:33,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1213/ 1625], loss: 1.045, per_step_time: 1470ms, lr: 5.2618298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:33,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43853 samples/s/p 1:29:46 } +2024-07-25 23:42:36,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1215/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 5.257417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43545 samples/s/p 1:29:46 } +2024-07-25 23:42:39,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1217/ 1625], loss: 0.947, per_step_time: 1471ms, lr: 5.253011e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:39,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43561 samples/s/p 1:29:43 } +2024-07-25 23:42:42,722 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1219/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 5.248604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:42,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43253 samples/s/p 1:29:43 } +2024-07-25 23:42:45,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1221/ 1625], loss: 1.082, per_step_time: 1473ms, lr: 5.244197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:45,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.42825 samples/s/p 1:29:45 } +2024-07-25 23:42:48,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1223/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 5.2397972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:48,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43066 samples/s/p 1:29:39 } +2024-07-25 23:42:51,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1225/ 1625], loss: 1.260, per_step_time: 1473ms, lr: 5.2353953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:51,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.42971 samples/s/p 1:29:37 } +2024-07-25 23:42:51,585 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 23:43:27,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1227/ 1625], loss: 0.972, per_step_time: 1472ms, lr: 5.230997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:27,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43226 samples/s/p 1:29:32 } +2024-07-25 23:43:30,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1229/ 1625], loss: 1.169, per_step_time: 1473ms, lr: 5.226599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:30,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.42812 samples/s/p 1:29:33 } +2024-07-25 23:43:33,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1231/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 5.222204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:33,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43463 samples/s/p 1:29:24 } +2024-07-25 23:43:36,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1233/ 1625], loss: 1.239, per_step_time: 1473ms, lr: 5.21781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:36,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.42928 samples/s/p 1:29:26 } +2024-07-25 23:43:39,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1235/ 1625], loss: 0.976, per_step_time: 1472ms, lr: 5.2134196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:39,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43292 samples/s/p 1:29:19 } +2024-07-25 23:43:41,997 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1237/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 5.20903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:41,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43137 samples/s/p 1:29:18 } +2024-07-25 23:43:44,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1239/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 5.204644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:44,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43744 samples/s/p 1:29:09 } +2024-07-25 23:43:47,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1241/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 5.200256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:47,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43643 samples/s/p 1:29:07 } +2024-07-25 23:43:50,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1243/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 5.1958723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:50,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.42925 samples/s/p 1:29:11 } +2024-07-25 23:43:53,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1245/ 1625], loss: 0.898, per_step_time: 1471ms, lr: 5.1914926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:53,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43616 samples/s/p 1:29:02 } +2024-07-25 23:43:56,751 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1247/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 5.1871107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:56,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43571 samples/s/p 1:28:59 } +2024-07-25 23:43:59,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1249/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 5.1827324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:59,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43630 samples/s/p 1:28:55 } +2024-07-25 23:44:02,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1251/ 1625], loss: 1.108, per_step_time: 1476ms, lr: 5.178358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:02,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.41861 samples/s/p 1:29:10 } +2024-07-25 23:44:05,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1253/ 1625], loss: 1.395, per_step_time: 1473ms, lr: 5.1739808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:05,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.42997 samples/s/p 1:28:56 } +2024-07-25 23:44:08,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1255/ 1625], loss: 1.357, per_step_time: 1470ms, lr: 5.169611e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:08,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43889 samples/s/p 1:28:44 } +2024-07-25 23:44:11,515 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1257/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 5.1652405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:11,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43517 samples/s/p 1:28:45 } +2024-07-25 23:44:14,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1259/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 5.1608695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:14,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43986 samples/s/p 1:28:37 } +2024-07-25 23:44:17,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1261/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 5.1565053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:17,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43504 samples/s/p 1:28:39 } +2024-07-25 23:44:20,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1263/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 5.1521397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:20,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43601 samples/s/p 1:28:35 } +2024-07-25 23:44:23,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1265/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 5.147777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:23,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.44080 samples/s/p 1:28:28 } +2024-07-25 23:44:26,267 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1267/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 5.143416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:26,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43066 samples/s/p 1:28:35 } +2024-07-25 23:44:29,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1269/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 5.1390575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:29,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.44141 samples/s/p 1:28:21 } +2024-07-25 23:44:32,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1271/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 5.1346997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:32,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43701 samples/s/p 1:28:22 } +2024-07-25 23:44:35,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1273/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 5.1303446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:35,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43592 samples/s/p 1:28:21 } +2024-07-25 23:44:38,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1275/ 1625], loss: 1.031, per_step_time: 1471ms, lr: 5.1259904e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:38,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43825 samples/s/p 1:28:15 } +2024-07-25 23:44:41,019 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1277/ 1625], loss: 1.221, per_step_time: 1473ms, lr: 5.12164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:41,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.42854 samples/s/p 1:28:22 } +2024-07-25 23:44:43,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1279/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 5.1172897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:43,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.43419 samples/s/p 1:28:13 } +2024-07-25 23:44:46,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1281/ 1625], loss: 1.144, per_step_time: 1472ms, lr: 5.1129427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:46,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.43125 samples/s/p 1:28:13 } +2024-07-25 23:44:49,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1283/ 1625], loss: 0.895, per_step_time: 1470ms, lr: 5.108599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:49,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.43909 samples/s/p 1:28:03 } +2024-07-25 23:44:52,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1285/ 1625], loss: 1.070, per_step_time: 1470ms, lr: 5.1042534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:53,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.44006 samples/s/p 1:27:59 } +2024-07-25 23:44:56,468 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1287/ 1625], loss: 1.298, per_step_time: 1474ms, lr: 5.099911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:56,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.42471 samples/s/p 1:28:11 } +2024-07-25 23:44:59,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1289/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 5.095573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:59,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.43323 samples/s/p 1:28:00 } +2024-07-25 23:45:02,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1291/ 1625], loss: 1.193, per_step_time: 1475ms, lr: 5.091233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:02,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.42157 samples/s/p 1:28:08 } +2024-07-25 23:45:05,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1293/ 1625], loss: 1.193, per_step_time: 1473ms, lr: 5.086899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:05,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.43027 samples/s/p 1:27:57 } +2024-07-25 23:45:08,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1295/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 5.082565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:08,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.44146 samples/s/p 1:27:43 } +2024-07-25 23:45:11,232 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1297/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 5.07823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:11,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.43227 samples/s/p 1:27:49 } +2024-07-25 23:45:14,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1299/ 1625], loss: 1.252, per_step_time: 1475ms, lr: 5.073902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:14,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.42343 samples/s/p 1:27:54 } +2024-07-25 23:45:17,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1301/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 5.0695744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:17,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.43418 samples/s/p 1:27:41 } +2024-07-25 23:45:20,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1303/ 1625], loss: 1.122, per_step_time: 1475ms, lr: 5.0652447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:20,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.42174 samples/s/p 1:27:50 } +2024-07-25 23:45:23,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1305/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 5.0609233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:23,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.43843 samples/s/p 1:27:31 } +2024-07-25 23:45:25,997 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1307/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 5.0566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:25,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.43942 samples/s/p 1:27:27 } +2024-07-25 23:45:28,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1309/ 1625], loss: 1.139, per_step_time: 1477ms, lr: 5.05228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:28,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.41375 samples/s/p 1:27:49 } +2024-07-25 23:45:31,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1311/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 5.0479603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:31,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43462 samples/s/p 1:27:26 } +2024-07-25 23:45:34,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1313/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 5.043644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:34,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43146 samples/s/p 1:27:26 } +2024-07-25 23:45:37,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1315/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 5.0393287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:37,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43008 samples/s/p 1:27:24 } +2024-07-25 23:45:40,770 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1317/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 5.035016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:40,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43190 samples/s/p 1:27:20 } +2024-07-25 23:45:43,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1319/ 1625], loss: 1.213, per_step_time: 1473ms, lr: 5.030705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:43,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.42911 samples/s/p 1:27:19 } +2024-07-25 23:45:46,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1321/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 5.0263957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:46,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43080 samples/s/p 1:27:15 } +2024-07-25 23:45:49,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1323/ 1625], loss: 1.191, per_step_time: 1470ms, lr: 5.0220883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:49,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43953 samples/s/p 1:27:03 } +2024-07-25 23:45:52,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1325/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 5.017783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:52,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.43379 samples/s/p 1:27:06 } +2024-07-25 23:45:55,534 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1327/ 1625], loss: 1.387, per_step_time: 1470ms, lr: 5.01348e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:55,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.43891 samples/s/p 1:26:58 } +2024-07-25 23:45:58,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1329/ 1625], loss: 1.257, per_step_time: 1474ms, lr: 5.0091776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:58,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.42572 samples/s/p 1:27:08 } +2024-07-25 23:46:01,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1331/ 1625], loss: 1.132, per_step_time: 1473ms, lr: 5.004879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:01,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.42982 samples/s/p 1:27:01 } +2024-07-25 23:46:04,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1333/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 5.000584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:04,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.43338 samples/s/p 1:26:55 } +2024-07-25 23:46:07,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1335/ 1625], loss: 1.113, per_step_time: 1474ms, lr: 4.9962855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:07,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.42510 samples/s/p 1:27:00 } +2024-07-25 23:46:10,305 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1337/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 4.9919945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:10,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.43508 samples/s/p 1:26:47 } +2024-07-25 23:46:13,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1339/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 4.9877026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:13,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.43425 samples/s/p 1:26:45 } +2024-07-25 23:46:16,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1341/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 4.9834107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:16,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43663 samples/s/p 1:26:40 } +2024-07-25 23:46:19,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1343/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 4.9791247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:19,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.42932 samples/s/p 1:26:44 } +2024-07-25 23:46:22,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1345/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 4.9748396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:22,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43632 samples/s/p 1:26:34 } +2024-07-25 23:46:25,061 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1347/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 4.9705527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:25,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43610 samples/s/p 1:26:31 } +2024-07-25 23:46:28,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1349/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 4.966273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:28,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43301 samples/s/p 1:26:31 } +2024-07-25 23:46:30,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1351/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 4.961993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:30,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43462 samples/s/p 1:26:27 } +2024-07-25 23:46:33,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1353/ 1625], loss: 1.288, per_step_time: 1471ms, lr: 4.957715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:33,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43789 samples/s/p 1:26:21 } +2024-07-25 23:46:36,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1355/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 4.9534397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:36,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43690 samples/s/p 1:26:19 } +2024-07-25 23:46:39,818 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1357/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 4.949165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:39,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43143 samples/s/p 1:26:21 } +2024-07-25 23:46:42,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1359/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 4.9448927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:42,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43906 samples/s/p 1:26:11 } +2024-07-25 23:46:45,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1361/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 4.9406226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:45,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43739 samples/s/p 1:26:10 } +2024-07-25 23:46:48,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1363/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 4.936354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:48,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43603 samples/s/p 1:26:08 } +2024-07-25 23:46:51,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1365/ 1625], loss: 1.171, per_step_time: 1470ms, lr: 4.932088e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:51,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43883 samples/s/p 1:26:02 } +2024-07-25 23:46:54,569 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1367/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 4.9278233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:54,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43244 samples/s/p 1:26:06 } +2024-07-25 23:46:57,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1369/ 1625], loss: 1.018, per_step_time: 1471ms, lr: 4.92356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:57,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43564 samples/s/p 1:26:00 } +2024-07-25 23:47:00,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1371/ 1625], loss: 1.051, per_step_time: 1473ms, lr: 4.919299e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:00,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43009 samples/s/p 1:26:02 } +2024-07-25 23:47:03,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1373/ 1625], loss: 1.125, per_step_time: 1483ms, lr: 4.915041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:03,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.39402 samples/s/p 1:26:33 } +2024-07-25 23:47:06,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1375/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 4.9107844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:06,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43989 samples/s/p 1:25:47 } +2024-07-25 23:47:09,348 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1377/ 1625], loss: 1.025, per_step_time: 1472ms, lr: 4.9065297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:09,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43127 samples/s/p 1:25:52 } +2024-07-25 23:47:12,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1379/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 4.9022765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:12,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43302 samples/s/p 1:25:47 } +2024-07-25 23:47:15,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1381/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 4.8980287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:15,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43773 samples/s/p 1:25:40 } +2024-07-25 23:47:18,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1383/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 4.8937773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:18,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43482 samples/s/p 1:25:40 } +2024-07-25 23:47:21,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1385/ 1625], loss: 1.080, per_step_time: 1472ms, lr: 4.8895304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:21,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43396 samples/s/p 1:25:38 } +2024-07-25 23:47:24,106 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1387/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 4.8852876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:24,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.42993 samples/s/p 1:25:38 } +2024-07-25 23:47:27,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1389/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 4.881045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:27,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43606 samples/s/p 1:25:30 } +2024-07-25 23:47:30,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1391/ 1625], loss: 1.335, per_step_time: 1473ms, lr: 4.8768015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:30,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43093 samples/s/p 1:25:32 } +2024-07-25 23:47:32,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1393/ 1625], loss: 1.173, per_step_time: 1473ms, lr: 4.8725647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:32,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43000 samples/s/p 1:25:30 } +2024-07-25 23:47:35,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1395/ 1625], loss: 1.056, per_step_time: 1470ms, lr: 4.8683273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:35,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.44134 samples/s/p 1:25:16 } +2024-07-25 23:47:38,859 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1397/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 4.8640923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:38,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43995 samples/s/p 1:25:14 } +2024-07-25 23:47:41,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1399/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 4.85986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:41,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43125 samples/s/p 1:25:19 } +2024-07-25 23:47:44,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1401/ 1625], loss: 1.302, per_step_time: 1473ms, lr: 4.8556276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:44,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43083 samples/s/p 1:25:17 } +2024-07-25 23:47:47,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1403/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 4.851399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:47,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43332 samples/s/p 1:25:12 } +2024-07-25 23:47:50,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1405/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 4.8471716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:50,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43393 samples/s/p 1:25:08 } +2024-07-25 23:47:53,621 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1407/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 4.8429465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:53,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43472 samples/s/p 1:25:04 } +2024-07-25 23:47:56,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1409/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 4.8387237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:56,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43769 samples/s/p 1:24:59 } +2024-07-25 23:47:59,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1411/ 1625], loss: 1.067, per_step_time: 1471ms, lr: 4.8345014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:59,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43565 samples/s/p 1:24:58 } +2024-07-25 23:48:02,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1413/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 4.8302823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:02,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43648 samples/s/p 1:24:54 } +2024-07-25 23:48:05,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1415/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 4.8260645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:05,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43762 samples/s/p 1:24:50 } +2024-07-25 23:48:08,373 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1417/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 4.8218494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:08,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43338 samples/s/p 1:24:51 } +2024-07-25 23:48:11,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1419/ 1625], loss: 1.362, per_step_time: 1471ms, lr: 4.817638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:11,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43618 samples/s/p 1:24:45 } +2024-07-25 23:48:14,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1421/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 4.8134248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:14,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43727 samples/s/p 1:24:41 } +2024-07-25 23:48:17,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1423/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 4.809215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:17,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43585 samples/s/p 1:24:40 } +2024-07-25 23:48:20,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1425/ 1625], loss: 0.984, per_step_time: 1472ms, lr: 4.8050097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:20,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43442 samples/s/p 1:24:38 } +2024-07-25 23:48:23,125 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1427/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 4.8008023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:23,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43660 samples/s/p 1:24:33 } +2024-07-25 23:48:26,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1429/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 4.796598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:26,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43374 samples/s/p 1:24:33 } +2024-07-25 23:48:29,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1431/ 1625], loss: 0.991, per_step_time: 1470ms, lr: 4.792399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:29,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.44111 samples/s/p 1:24:23 } +2024-07-25 23:48:31,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1433/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 4.7881967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:31,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43470 samples/s/p 1:24:26 } +2024-07-25 23:48:34,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1435/ 1625], loss: 1.359, per_step_time: 1471ms, lr: 4.7840017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:34,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43600 samples/s/p 1:24:22 } +2024-07-25 23:48:37,876 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1437/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 4.7798057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:37,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43560 samples/s/p 1:24:19 } +2024-07-25 23:48:40,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1439/ 1625], loss: 0.954, per_step_time: 1472ms, lr: 4.775612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:40,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43153 samples/s/p 1:24:20 } +2024-07-25 23:48:43,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1441/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 4.7714207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:43,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43172 samples/s/p 1:24:17 } +2024-07-25 23:48:46,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1443/ 1625], loss: 1.316, per_step_time: 1473ms, lr: 4.7672306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:46,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43081 samples/s/p 1:24:15 } +2024-07-25 23:48:49,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1445/ 1625], loss: 1.288, per_step_time: 1473ms, lr: 4.7630424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:49,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.42772 samples/s/p 1:24:15 } +2024-07-25 23:48:52,640 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1447/ 1625], loss: 1.345, per_step_time: 1471ms, lr: 4.758857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:52,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43692 samples/s/p 1:24:04 } +2024-07-25 23:48:55,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1449/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 4.7546737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:55,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43031 samples/s/p 1:24:07 } +2024-07-25 23:48:58,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1451/ 1625], loss: 1.057, per_step_time: 1473ms, lr: 4.7504914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:58,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43064 samples/s/p 1:24:03 } +2024-07-25 23:49:01,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1453/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 4.746311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:01,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.42906 samples/s/p 1:24:02 } +2024-07-25 23:49:04,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1455/ 1625], loss: 0.988, per_step_time: 1470ms, lr: 4.742134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:04,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.43978 samples/s/p 1:23:49 } +2024-07-25 23:49:07,399 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1457/ 1625], loss: 1.376, per_step_time: 1471ms, lr: 4.737958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:07,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.43748 samples/s/p 1:23:48 } +2024-07-25 23:49:10,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1459/ 1625], loss: 1.180, per_step_time: 1475ms, lr: 4.7337835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:10,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.42229 samples/s/p 1:23:59 } +2024-07-25 23:49:13,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1461/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 4.7296116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:13,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.43497 samples/s/p 1:23:45 } +2024-07-25 23:49:16,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1463/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 4.7254443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:16,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.43964 samples/s/p 1:23:37 } +2024-07-25 23:49:19,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1465/ 1625], loss: 1.030, per_step_time: 1470ms, lr: 4.721274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:19,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.44085 samples/s/p 1:23:33 } +2024-07-25 23:49:22,151 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1467/ 1625], loss: 1.141, per_step_time: 1469ms, lr: 4.7171084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:22,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.44280 samples/s/p 1:23:29 } +2024-07-25 23:49:25,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1469/ 1625], loss: 1.019, per_step_time: 1469ms, lr: 4.712947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:25,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.44394 samples/s/p 1:23:25 } +2024-07-25 23:49:28,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1471/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 4.708782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:28,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43622 samples/s/p 1:23:29 } +2024-07-25 23:49:31,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1473/ 1625], loss: 1.039, per_step_time: 1475ms, lr: 4.7046224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:31,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.42330 samples/s/p 1:23:38 } +2024-07-25 23:49:33,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1475/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 4.700467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:33,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.42981 samples/s/p 1:23:29 } +2024-07-25 23:49:36,912 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1477/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 4.6963078e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:36,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43175 samples/s/p 1:23:24 } +2024-07-25 23:49:39,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1479/ 1625], loss: 1.274, per_step_time: 1471ms, lr: 4.692157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:39,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43762 samples/s/p 1:23:16 } +2024-07-25 23:49:42,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1481/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 4.688005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:42,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43201 samples/s/p 1:23:18 } +2024-07-25 23:49:45,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1483/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 4.6838522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:45,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43662 samples/s/p 1:23:11 } +2024-07-25 23:49:48,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1485/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 4.6797063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:48,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43266 samples/s/p 1:23:12 } +2024-07-25 23:49:51,671 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1487/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 4.6755604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:51,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.42971 samples/s/p 1:23:11 } +2024-07-25 23:49:54,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1489/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 4.6714163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:54,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43420 samples/s/p 1:23:04 } +2024-07-25 23:49:57,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1491/ 1625], loss: 1.251, per_step_time: 1473ms, lr: 4.667274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:57,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43096 samples/s/p 1:23:04 } +2024-07-25 23:50:00,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1493/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 4.663134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:00,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43852 samples/s/p 1:22:54 } +2024-07-25 23:50:03,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1495/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 4.6589967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:03,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43482 samples/s/p 1:22:55 } +2024-07-25 23:50:06,426 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1497/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 4.6548603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:06,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43560 samples/s/p 1:22:51 } +2024-07-25 23:50:09,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1499/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 4.6507257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:09,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43687 samples/s/p 1:22:47 } +2024-07-25 23:50:12,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1501/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 4.6465934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:12,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43233 samples/s/p 1:22:48 } +2024-07-25 23:50:15,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1503/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 4.6424643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:15,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43463 samples/s/p 1:22:43 } +2024-07-25 23:50:18,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1505/ 1625], loss: 1.027, per_step_time: 1472ms, lr: 4.6383366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:18,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43312 samples/s/p 1:22:42 } +2024-07-25 23:50:21,185 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1507/ 1625], loss: 1.265, per_step_time: 1473ms, lr: 4.634212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:21,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43067 samples/s/p 1:22:41 } +2024-07-25 23:50:24,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1509/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 4.630086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:24,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43681 samples/s/p 1:22:32 } +2024-07-25 23:50:27,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1511/ 1625], loss: 1.060, per_step_time: 1471ms, lr: 4.6259643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:27,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43561 samples/s/p 1:22:31 } +2024-07-25 23:50:30,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1513/ 1625], loss: 1.123, per_step_time: 1482ms, lr: 4.621846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:30,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.39672 samples/s/p 1:23:03 } +2024-07-25 23:50:33,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1515/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 4.617726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:33,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.44164 samples/s/p 1:22:19 } +2024-07-25 23:50:35,959 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1517/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 4.6136106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:35,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43029 samples/s/p 1:22:27 } +2024-07-25 23:50:38,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1519/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 4.6094983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:38,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43793 samples/s/p 1:22:17 } +2024-07-25 23:50:41,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1521/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 4.6053838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:41,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.44177 samples/s/p 1:22:10 } +2024-07-25 23:50:44,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1523/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 4.6012765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:44,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43040 samples/s/p 1:22:18 } +2024-07-25 23:50:47,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1525/ 1625], loss: 1.379, per_step_time: 1472ms, lr: 4.5971688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:47,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43240 samples/s/p 1:22:13 } +2024-07-25 23:50:50,714 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1527/ 1625], loss: 1.326, per_step_time: 1472ms, lr: 4.593061e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:50,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43317 samples/s/p 1:22:09 } +2024-07-25 23:50:53,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1529/ 1625], loss: 1.167, per_step_time: 1470ms, lr: 4.588959e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:53,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43923 samples/s/p 1:22:01 } +2024-07-25 23:50:56,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1531/ 1625], loss: 1.281, per_step_time: 1474ms, lr: 4.5848574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:56,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.42481 samples/s/p 1:22:11 } +2024-07-25 23:50:59,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1533/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 4.5807546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:59,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43922 samples/s/p 1:21:55 } +2024-07-25 23:51:02,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1535/ 1625], loss: 1.014, per_step_time: 1471ms, lr: 4.5766587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:02,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43604 samples/s/p 1:21:55 } +2024-07-25 23:51:05,469 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1537/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 4.5725637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:05,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43493 samples/s/p 1:21:53 } +2024-07-25 23:51:08,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1539/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 4.568469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:08,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43686 samples/s/p 1:21:48 } +2024-07-25 23:51:11,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1541/ 1625], loss: 1.297, per_step_time: 1470ms, lr: 4.5643774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:11,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43997 samples/s/p 1:21:42 } +2024-07-25 23:51:14,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1543/ 1625], loss: 0.955, per_step_time: 1471ms, lr: 4.560288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:14,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43743 samples/s/p 1:21:42 } +2024-07-25 23:51:17,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1545/ 1625], loss: 1.237, per_step_time: 1473ms, lr: 4.5561997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:17,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.42862 samples/s/p 1:21:47 } +2024-07-25 23:51:20,223 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1547/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 4.5521147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:20,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43419 samples/s/p 1:21:39 } +2024-07-25 23:51:23,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1549/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 4.548031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:23,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43757 samples/s/p 1:21:33 } +2024-07-25 23:51:26,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1551/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 4.5439515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:26,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43546 samples/s/p 1:21:32 } +2024-07-25 23:51:29,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1553/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 4.5398697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:29,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43437 samples/s/p 1:21:30 } +2024-07-25 23:51:32,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1555/ 1625], loss: 0.990, per_step_time: 1471ms, lr: 4.535792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:32,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43612 samples/s/p 1:21:25 } +2024-07-25 23:51:34,977 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1557/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 4.531719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:34,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43283 samples/s/p 1:21:25 } +2024-07-25 23:51:37,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1559/ 1625], loss: 1.250, per_step_time: 1469ms, lr: 4.527643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:37,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.44370 samples/s/p 1:21:13 } +2024-07-25 23:51:40,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1561/ 1625], loss: 1.327, per_step_time: 1470ms, lr: 4.523571e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:40,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43873 samples/s/p 1:21:14 } +2024-07-25 23:51:43,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1563/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 4.519503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:43,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43197 samples/s/p 1:21:17 } +2024-07-25 23:51:46,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1565/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 4.5154343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:46,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43030 samples/s/p 1:21:16 } +2024-07-25 23:51:49,728 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1567/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 4.51137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:49,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43674 samples/s/p 1:21:07 } +2024-07-25 23:51:52,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1569/ 1625], loss: 1.290, per_step_time: 1469ms, lr: 4.5073075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:52,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.44318 samples/s/p 1:20:58 } +2024-07-25 23:51:55,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1571/ 1625], loss: 0.994, per_step_time: 1470ms, lr: 4.503243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:55,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.44159 samples/s/p 1:20:57 } +2024-07-25 23:51:58,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1573/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 4.4991866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:58,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.43329 samples/s/p 1:21:01 } +2024-07-25 23:52:01,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1575/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 4.495129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:01,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.44040 samples/s/p 1:20:52 } +2024-07-25 23:52:04,474 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1577/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 4.491073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:04,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.43525 samples/s/p 1:20:54 } +2024-07-25 23:52:07,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1579/ 1625], loss: 1.230, per_step_time: 1470ms, lr: 4.4870203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:07,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.43919 samples/s/p 1:20:47 } +2024-07-25 23:52:10,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1581/ 1625], loss: 1.312, per_step_time: 1471ms, lr: 4.482969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:10,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.43586 samples/s/p 1:20:47 } +2024-07-25 23:52:13,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1583/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 4.47892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:13,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.42951 samples/s/p 1:20:50 } +2024-07-25 23:52:16,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1585/ 1625], loss: 1.316, per_step_time: 1471ms, lr: 4.474872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:16,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43608 samples/s/p 1:20:41 } +2024-07-25 23:52:19,229 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1587/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 4.4708277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:19,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43321 samples/s/p 1:20:41 } +2024-07-25 23:52:22,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1589/ 1625], loss: 1.270, per_step_time: 1474ms, lr: 4.4667863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:22,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.42576 samples/s/p 1:20:45 } +2024-07-25 23:52:25,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1591/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 4.4627423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:25,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43291 samples/s/p 1:20:35 } +2024-07-25 23:52:28,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1593/ 1625], loss: 1.184, per_step_time: 1473ms, lr: 4.4587036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:28,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43079 samples/s/p 1:20:34 } +2024-07-25 23:52:31,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1595/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 4.454668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:31,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43266 samples/s/p 1:20:30 } +2024-07-25 23:52:33,992 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1597/ 1625], loss: 1.201, per_step_time: 1471ms, lr: 4.4506323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:33,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43782 samples/s/p 1:20:22 } +2024-07-25 23:52:36,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1599/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 4.4465987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:36,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43310 samples/s/p 1:20:23 } +2024-07-25 23:52:39,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1601/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 4.4425697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:39,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43221 samples/s/p 1:20:21 } +2024-07-25 23:52:42,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1603/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 4.4385383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:42,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.42928 samples/s/p 1:20:21 } +2024-07-25 23:52:45,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1605/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 4.4345143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:45,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43461 samples/s/p 1:20:13 } +2024-07-25 23:52:48,751 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1607/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 4.4304898e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:48,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43901 samples/s/p 1:20:06 } +2024-07-25 23:52:51,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1609/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 4.426465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:51,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43597 samples/s/p 1:20:06 } +2024-07-25 23:52:54,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1611/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 4.4224466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:54,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43440 samples/s/p 1:20:04 } +2024-07-25 23:52:57,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1613/ 1625], loss: 1.323, per_step_time: 1471ms, lr: 4.418427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:57,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43750 samples/s/p 1:19:59 } +2024-07-25 23:53:00,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1615/ 1625], loss: 1.067, per_step_time: 1470ms, lr: 4.414409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:00,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43890 samples/s/p 1:19:55 } +2024-07-25 23:53:03,504 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1617/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 4.4103963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:03,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.43167 samples/s/p 1:19:58 } +2024-07-25 23:53:06,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1619/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 4.4063836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:06,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.43873 samples/s/p 1:19:49 } +2024-07-25 23:53:09,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1621/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 4.402373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:09,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.43546 samples/s/p 1:19:49 } +2024-07-25 23:53:12,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1623/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 4.3983646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:12,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.43272 samples/s/p 1:19:48 } +2024-07-25 23:53:15,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1625/ 1625], loss: 1.001, per_step_time: 1472ms, lr: 4.394358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:15,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.43447 samples/s/p 1:19:44 } +2024-07-25 23:53:18,263 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 2/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 4.3903538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:18,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.42857 samples/s/p 1:19:46 } +2024-07-25 23:53:21,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 4/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 4.3863524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:21,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.43307 samples/s/p 1:19:39 } +2024-07-25 23:53:24,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 6/ 1625], loss: 1.149, per_step_time: 1474ms, lr: 4.3823516e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:24,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.42605 samples/s/p 1:19:42 } +2024-07-25 23:53:27,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 8/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 4.3783525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:27,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.43563 samples/s/p 1:19:31 } +2024-07-25 23:53:30,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 10/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 4.374357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:30,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43844 samples/s/p 1:19:26 } +2024-07-25 23:53:33,021 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 12/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 4.3703635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:33,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43434 samples/s/p 1:19:26 } +2024-07-25 23:53:35,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 14/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 4.366374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:35,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43623 samples/s/p 1:19:22 } +2024-07-25 23:53:38,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 16/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 4.362382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:38,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43190 samples/s/p 1:19:22 } +2024-07-25 23:53:41,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 18/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 4.358393e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:41,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43794 samples/s/p 1:19:14 } +2024-07-25 23:53:44,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 20/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 4.35441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:44,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43429 samples/s/p 1:19:14 } +2024-07-25 23:53:47,783 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 22/ 1625], loss: 1.292, per_step_time: 1475ms, lr: 4.350423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:47,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.42284 samples/s/p 1:19:22 } +2024-07-25 23:53:50,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 24/ 1625], loss: 1.074, per_step_time: 1473ms, lr: 4.3464447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:50,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.42781 samples/s/p 1:19:14 } +2024-07-25 23:53:53,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 26/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 4.342464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:53,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43721 samples/s/p 1:19:03 } +2024-07-25 23:53:56,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 28/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 4.338484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:56,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43928 samples/s/p 1:18:58 } +2024-07-25 23:53:59,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 30/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 4.334511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:59,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43762 samples/s/p 1:18:57 } +2024-07-25 23:54:02,533 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 32/ 1625], loss: 1.037, per_step_time: 1469ms, lr: 4.330538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:02,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.44353 samples/s/p 1:18:49 } +2024-07-25 23:54:05,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 34/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 4.326564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:05,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43536 samples/s/p 1:18:53 } +2024-07-25 23:54:08,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 36/ 1625], loss: 1.078, per_step_time: 1474ms, lr: 4.3225964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:08,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.42706 samples/s/p 1:18:57 } +2024-07-25 23:54:11,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 38/ 1625], loss: 1.167, per_step_time: 1474ms, lr: 4.318629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:11,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.42544 samples/s/p 1:18:56 } +2024-07-25 23:54:14,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 40/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 4.3146647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:14,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43651 samples/s/p 1:18:43 } +2024-07-25 23:54:17,294 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 42/ 1625], loss: 1.137, per_step_time: 1470ms, lr: 4.310701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:17,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43852 samples/s/p 1:18:38 } +2024-07-25 23:54:20,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 44/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 4.3067403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:20,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43567 samples/s/p 1:18:38 } +2024-07-25 23:54:23,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 46/ 1625], loss: 1.282, per_step_time: 1474ms, lr: 4.3027812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:23,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.42667 samples/s/p 1:18:43 } +2024-07-25 23:54:26,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 48/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 4.2988236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:26,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43680 samples/s/p 1:18:31 } +2024-07-25 23:54:29,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 50/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 4.2948686e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:29,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43240 samples/s/p 1:18:32 } +2024-07-25 23:54:32,051 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 52/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 4.2909155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:32,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43970 samples/s/p 1:18:23 } +2024-07-25 23:54:34,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 54/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 4.286965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:34,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.44127 samples/s/p 1:18:18 } +2024-07-25 23:54:37,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 56/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 4.283017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:37,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43422 samples/s/p 1:18:22 } +2024-07-25 23:54:40,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 58/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 4.2790707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:40,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43420 samples/s/p 1:18:19 } +2024-07-25 23:54:43,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 60/ 1625], loss: 1.024, per_step_time: 1472ms, lr: 4.2751253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:43,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43373 samples/s/p 1:18:16 } +2024-07-25 23:54:46,802 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 62/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 4.2711836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:46,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43937 samples/s/p 1:18:08 } +2024-07-25 23:54:49,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 64/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 4.267245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:49,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43975 samples/s/p 1:18:05 } +2024-07-25 23:54:52,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 66/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 4.263304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:52,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43313 samples/s/p 1:18:08 } +2024-07-25 23:54:55,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 68/ 1625], loss: 1.264, per_step_time: 1472ms, lr: 4.2593706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:55,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43140 samples/s/p 1:18:06 } +2024-07-25 23:54:58,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 70/ 1625], loss: 1.109, per_step_time: 1473ms, lr: 4.2554357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:58,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43096 samples/s/p 1:18:04 } +2024-07-25 23:55:01,559 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 72/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 4.2515017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:01,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43403 samples/s/p 1:17:58 } +2024-07-25 23:55:04,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 74/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 4.2475735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:04,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43702 samples/s/p 1:17:53 } +2024-07-25 23:55:07,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 76/ 1625], loss: 1.153, per_step_time: 1470ms, lr: 4.2436454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:07,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43986 samples/s/p 1:17:47 } +2024-07-25 23:55:10,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 78/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 4.2397182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:10,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43990 samples/s/p 1:17:44 } +2024-07-25 23:55:13,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 80/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 4.235796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:13,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43516 samples/s/p 1:17:45 } +2024-07-25 23:55:16,307 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 82/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 4.231874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:16,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43785 samples/s/p 1:17:40 } +2024-07-25 23:55:19,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 84/ 1625], loss: 1.051, per_step_time: 1473ms, lr: 4.2279544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:19,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.42850 samples/s/p 1:17:45 } +2024-07-25 23:55:22,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 86/ 1625], loss: 1.093, per_step_time: 1477ms, lr: 4.2240367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:22,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.41360 samples/s/p 1:17:55 } +2024-07-25 23:55:25,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 88/ 1625], loss: 1.113, per_step_time: 1473ms, lr: 4.220122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:25,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.42887 samples/s/p 1:17:39 } +2024-07-25 23:55:28,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 90/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 4.2162083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:28,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43219 samples/s/p 1:17:33 } +2024-07-25 23:55:31,084 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 92/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 4.2122965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:31,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43164 samples/s/p 1:17:31 } +2024-07-25 23:55:34,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 94/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 4.2083875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:34,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43520 samples/s/p 1:17:25 } +2024-07-25 23:55:36,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 96/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 4.2044812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:36,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43600 samples/s/p 1:17:21 } +2024-07-25 23:55:39,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 98/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 4.2005754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:39,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43599 samples/s/p 1:17:18 } +2024-07-25 23:55:42,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 100/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 4.1966723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:42,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43773 samples/s/p 1:17:14 } +2024-07-25 23:55:45,837 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 102/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 4.192771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:45,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43385 samples/s/p 1:17:14 } +2024-07-25 23:55:48,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 104/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 4.1888734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:48,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43226 samples/s/p 1:17:13 } +2024-07-25 23:55:51,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 106/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 4.1849753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:51,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43622 samples/s/p 1:17:06 } +2024-07-25 23:55:54,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 108/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 4.181081e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:54,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43365 samples/s/p 1:17:05 } +2024-07-25 23:55:57,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 110/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 4.177189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:57,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43287 samples/s/p 1:17:03 } +2024-07-25 23:56:00,596 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 112/ 1625], loss: 1.520, per_step_time: 1473ms, lr: 4.1733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:00,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43053 samples/s/p 1:17:02 } +2024-07-25 23:56:03,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 114/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 4.1694116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:03,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43570 samples/s/p 1:16:55 } +2024-07-25 23:56:06,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 116/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 4.1655235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:06,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.44120 samples/s/p 1:16:47 } +2024-07-25 23:56:09,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 118/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 4.1616418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:09,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43759 samples/s/p 1:16:47 } +2024-07-25 23:56:12,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 120/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 4.1577587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:12,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43254 samples/s/p 1:16:49 } +2024-07-25 23:56:15,343 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 122/ 1625], loss: 1.139, per_step_time: 1469ms, lr: 4.15388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:15,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.44508 samples/s/p 1:16:35 } +2024-07-25 23:56:18,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 124/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 4.150001e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:18,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.42812 samples/s/p 1:16:47 } +2024-07-25 23:56:21,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 126/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 4.146126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:21,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.43549 samples/s/p 1:16:37 } +2024-07-25 23:56:24,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 128/ 1625], loss: 0.937, per_step_time: 1474ms, lr: 4.1422522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:24,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.42720 samples/s/p 1:16:42 } +2024-07-25 23:56:27,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 130/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 4.13838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:27,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.44100 samples/s/p 1:16:27 } +2024-07-25 23:56:30,100 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 132/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 4.134511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:30,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.43751 samples/s/p 1:16:27 } +2024-07-25 23:56:33,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 134/ 1625], loss: 1.021, per_step_time: 1470ms, lr: 4.1306434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:33,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.44062 samples/s/p 1:16:21 } +2024-07-25 23:56:35,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 136/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 4.126778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:35,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.43629 samples/s/p 1:16:22 } +2024-07-25 23:56:38,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 138/ 1625], loss: 1.129, per_step_time: 1473ms, lr: 4.122915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:38,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.42900 samples/s/p 1:16:25 } +2024-07-25 23:56:41,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 140/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 4.1190533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:41,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.44029 samples/s/p 1:16:13 } +2024-07-25 23:56:44,865 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 142/ 1625], loss: 1.094, per_step_time: 1478ms, lr: 4.1151943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:44,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.41261 samples/s/p 1:16:33 } +2024-07-25 23:56:47,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 144/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 4.111337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:47,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43771 samples/s/p 1:16:09 } +2024-07-25 23:56:50,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 146/ 1625], loss: 1.277, per_step_time: 1473ms, lr: 4.1074827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:50,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43069 samples/s/p 1:16:12 } +2024-07-25 23:56:53,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 148/ 1625], loss: 1.280, per_step_time: 1476ms, lr: 4.1036305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:53,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.41957 samples/s/p 1:16:18 } +2024-07-25 23:56:56,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 150/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 4.099782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:56,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43491 samples/s/p 1:16:03 } +2024-07-25 23:56:59,627 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 152/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 4.0959317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:59,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43945 samples/s/p 1:15:56 } +2024-07-25 23:57:02,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 154/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 4.092085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:02,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43012 samples/s/p 1:16:01 } +2024-07-25 23:57:05,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 156/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 4.0882423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:05,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43459 samples/s/p 1:15:54 } +2024-07-25 23:57:08,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 158/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 4.084398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:08,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43956 samples/s/p 1:15:47 } +2024-07-25 23:57:11,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 160/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 4.080558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:11,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43128 samples/s/p 1:15:51 } +2024-07-25 23:57:14,383 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 162/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 4.076722e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:14,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43631 samples/s/p 1:15:44 } +2024-07-25 23:57:17,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 164/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 4.072886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:17,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43522 samples/s/p 1:15:42 } +2024-07-25 23:57:20,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 166/ 1625], loss: 0.903, per_step_time: 1471ms, lr: 4.069052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:20,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43802 samples/s/p 1:15:36 } +2024-07-25 23:57:23,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 168/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 4.0652208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:23,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43596 samples/s/p 1:15:35 } +2024-07-25 23:57:26,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 170/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 4.0613913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:26,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43629 samples/s/p 1:15:32 } +2024-07-25 23:57:29,135 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 172/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 4.0575633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:29,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43656 samples/s/p 1:15:29 } +2024-07-25 23:57:32,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 174/ 1625], loss: 1.329, per_step_time: 1482ms, lr: 4.0537384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:32,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.39608 samples/s/p 1:16:00 } +2024-07-25 23:57:35,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 176/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 4.0499153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:35,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.44206 samples/s/p 1:15:18 } +2024-07-25 23:57:38,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 178/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 4.0460936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:38,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43823 samples/s/p 1:15:19 } +2024-07-25 23:57:40,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 180/ 1625], loss: 0.991, per_step_time: 1472ms, lr: 4.0422756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:40,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43373 samples/s/p 1:15:19 } +2024-07-25 23:57:43,905 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 182/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 4.038459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:43,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43627 samples/s/p 1:15:14 } +2024-07-25 23:57:46,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 184/ 1625], loss: 1.053, per_step_time: 1472ms, lr: 4.034644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:46,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43338 samples/s/p 1:15:14 } +2024-07-25 23:57:49,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 186/ 1625], loss: 1.000, per_step_time: 1472ms, lr: 4.030831e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:49,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43401 samples/s/p 1:15:10 } +2024-07-25 23:57:52,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 188/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 4.027021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:52,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43981 samples/s/p 1:15:03 } +2024-07-25 23:57:55,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 190/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 4.023212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:55,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43505 samples/s/p 1:15:04 } +2024-07-25 23:57:58,666 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 192/ 1625], loss: 1.094, per_step_time: 1475ms, lr: 4.019406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:58,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.42150 samples/s/p 1:15:12 } +2024-07-25 23:58:01,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 194/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 4.015604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:01,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43291 samples/s/p 1:14:59 } +2024-07-25 23:58:04,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 196/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 4.0118007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:04,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43807 samples/s/p 1:14:52 } +2024-07-25 23:58:07,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 198/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 4.0080004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:07,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43650 samples/s/p 1:14:51 } +2024-07-25 23:58:10,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 200/ 1625], loss: 1.201, per_step_time: 1471ms, lr: 4.0042046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:10,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43654 samples/s/p 1:14:48 } +2024-07-25 23:58:13,418 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 202/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 4.000406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:13,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43692 samples/s/p 1:14:44 } +2024-07-25 23:58:16,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 204/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 3.9966126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:16,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43447 samples/s/p 1:14:43 } +2024-07-25 23:58:19,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 206/ 1625], loss: 1.207, per_step_time: 1470ms, lr: 3.9928236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:19,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43995 samples/s/p 1:14:36 } +2024-07-25 23:58:22,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 208/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 3.9890315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:22,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43429 samples/s/p 1:14:38 } +2024-07-25 23:58:25,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 210/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 3.9852466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:25,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43444 samples/s/p 1:14:35 } +2024-07-25 23:58:28,171 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 212/ 1625], loss: 1.047, per_step_time: 1472ms, lr: 3.9814613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:28,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43382 samples/s/p 1:14:32 } +2024-07-25 23:58:31,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 214/ 1625], loss: 1.071, per_step_time: 1470ms, lr: 3.977679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:31,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43926 samples/s/p 1:14:25 } +2024-07-25 23:58:34,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 216/ 1625], loss: 1.060, per_step_time: 1470ms, lr: 3.973899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:34,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43892 samples/s/p 1:14:22 } +2024-07-25 23:58:37,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 218/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 3.9701185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:37,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43296 samples/s/p 1:14:24 } +2024-07-25 23:58:39,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 220/ 1625], loss: 1.015, per_step_time: 1472ms, lr: 3.9663437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:39,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.43353 samples/s/p 1:14:21 } +2024-07-25 23:58:42,923 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 222/ 1625], loss: 1.308, per_step_time: 1471ms, lr: 3.9625684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:42,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.43561 samples/s/p 1:14:16 } +2024-07-25 23:58:45,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 224/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 3.958796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:45,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.43767 samples/s/p 1:14:11 } +2024-07-25 23:58:48,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 226/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 3.955026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:48,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.44075 samples/s/p 1:14:06 } +2024-07-25 23:58:51,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 228/ 1625], loss: 1.006, per_step_time: 1471ms, lr: 3.951258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:51,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.43645 samples/s/p 1:14:07 } +2024-07-25 23:58:54,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 230/ 1625], loss: 1.118, per_step_time: 1469ms, lr: 3.947492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:54,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.44224 samples/s/p 1:13:59 } +2024-07-25 23:58:57,666 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 232/ 1625], loss: 1.048, per_step_time: 1470ms, lr: 3.943728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:57,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.44178 samples/s/p 1:13:56 } +2024-07-25 23:59:00,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 234/ 1625], loss: 1.132, per_step_time: 1469ms, lr: 3.939966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:00,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.44365 samples/s/p 1:13:52 } +2024-07-25 23:59:03,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 236/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 3.936207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:03,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.44044 samples/s/p 1:13:51 } +2024-07-25 23:59:06,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 238/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 3.9324523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:06,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43481 samples/s/p 1:13:53 } +2024-07-25 23:59:09,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 240/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 3.928695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:09,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43424 samples/s/p 1:13:51 } +2024-07-25 23:59:12,415 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 242/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 3.9249417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:12,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43352 samples/s/p 1:13:48 } +2024-07-25 23:59:15,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 244/ 1625], loss: 0.906, per_step_time: 1471ms, lr: 3.9211923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:15,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43831 samples/s/p 1:13:41 } +2024-07-25 23:59:18,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 246/ 1625], loss: 1.091, per_step_time: 1473ms, lr: 3.9174415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:18,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43081 samples/s/p 1:13:45 } +2024-07-25 23:59:21,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 248/ 1625], loss: 1.137, per_step_time: 1482ms, lr: 3.913695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:21,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.39803 samples/s/p 1:14:09 } +2024-07-25 23:59:24,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 250/ 1625], loss: 1.101, per_step_time: 1473ms, lr: 3.9099527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:24,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.42819 samples/s/p 1:13:41 } +2024-07-25 23:59:27,185 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 252/ 1625], loss: 1.115, per_step_time: 1467ms, lr: 3.906208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:27,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.44970 samples/s/p 1:13:20 } +2024-07-25 23:59:30,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 254/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 3.90247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:30,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43718 samples/s/p 1:13:28 } +2024-07-25 23:59:33,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 256/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 3.898732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:33,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43735 samples/s/p 1:13:25 } +2024-07-25 23:59:36,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 258/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 3.894994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:36,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43652 samples/s/p 1:13:22 } +2024-07-25 23:59:38,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 260/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 3.891262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:38,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43975 samples/s/p 1:13:17 } +2024-07-25 23:59:41,934 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 262/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 3.88753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:41,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43677 samples/s/p 1:13:16 } +2024-07-25 23:59:44,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 264/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 3.8838007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:44,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43497 samples/s/p 1:13:15 } +2024-07-25 23:59:47,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 266/ 1625], loss: 0.961, per_step_time: 1471ms, lr: 3.880073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:47,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43785 samples/s/p 1:13:09 } +2024-07-25 23:59:50,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 268/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 3.8763483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:50,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43184 samples/s/p 1:13:11 } +2024-07-25 23:59:53,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 270/ 1625], loss: 0.994, per_step_time: 1471ms, lr: 3.872625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:53,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43818 samples/s/p 1:13:03 } +2024-07-25 23:59:56,690 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 272/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 3.868904e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:56,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43107 samples/s/p 1:13:06 } +2024-07-25 23:59:59,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 274/ 1625], loss: 1.012, per_step_time: 1472ms, lr: 3.865185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:59,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43452 samples/s/p 1:13:00 } +2024-07-26 00:00:02,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 276/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 3.861469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:02,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43172 samples/s/p 1:13:00 } +2024-07-26 00:00:05,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 278/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 3.8577537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:05,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.44089 samples/s/p 1:12:49 } +2024-07-26 00:00:08,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 280/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 3.8540416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:08,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43633 samples/s/p 1:12:50 } +2024-07-26 00:00:11,441 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 282/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 3.8503335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:11,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43986 samples/s/p 1:12:44 } +2024-07-26 00:00:14,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 284/ 1625], loss: 1.117, per_step_time: 1473ms, lr: 3.8466233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:14,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43024 samples/s/p 1:12:49 } +2024-07-26 00:00:17,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 286/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 3.8429175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:17,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43207 samples/s/p 1:12:45 } +2024-07-26 00:00:20,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 288/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 3.839216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:20,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43063 samples/s/p 1:12:43 } +2024-07-26 00:00:23,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 290/ 1625], loss: 0.970, per_step_time: 1473ms, lr: 3.8355124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:23,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43057 samples/s/p 1:12:40 } +2024-07-26 00:00:26,201 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 292/ 1625], loss: 1.233, per_step_time: 1469ms, lr: 3.8318144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:26,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.44284 samples/s/p 1:12:27 } +2024-07-26 00:00:29,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 294/ 1625], loss: 1.117, per_step_time: 1473ms, lr: 3.828117e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:29,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43106 samples/s/p 1:12:34 } +2024-07-26 00:00:32,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 296/ 1625], loss: 1.280, per_step_time: 1472ms, lr: 3.8244198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:32,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43221 samples/s/p 1:12:30 } +2024-07-26 00:00:35,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 298/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 3.820728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:35,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43733 samples/s/p 1:12:23 } +2024-07-26 00:00:38,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 300/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 3.817038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:38,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43447 samples/s/p 1:12:22 } +2024-07-26 00:00:40,958 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 302/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 3.8133467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:40,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43626 samples/s/p 1:12:18 } +2024-07-26 00:00:43,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 304/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 3.8096632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:43,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43246 samples/s/p 1:12:18 } +2024-07-26 00:00:46,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 306/ 1625], loss: 1.247, per_step_time: 1475ms, lr: 3.8059788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:46,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.42224 samples/s/p 1:12:23 } +2024-07-26 00:00:49,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 308/ 1625], loss: 1.176, per_step_time: 1472ms, lr: 3.802295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:49,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43409 samples/s/p 1:12:11 } +2024-07-26 00:00:52,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 310/ 1625], loss: 1.249, per_step_time: 1471ms, lr: 3.798616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:52,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43549 samples/s/p 1:12:07 } +2024-07-26 00:00:55,728 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 312/ 1625], loss: 1.136, per_step_time: 1475ms, lr: 3.7949385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:55,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.42224 samples/s/p 1:12:14 } +2024-07-26 00:00:58,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 314/ 1625], loss: 1.327, per_step_time: 1473ms, lr: 3.7912619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:58,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.42920 samples/s/p 1:12:06 } +2024-07-26 00:01:01,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 316/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 3.7875889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:01,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43545 samples/s/p 1:11:58 } +2024-07-26 00:01:04,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 318/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 3.7839172e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:04,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.43115 samples/s/p 1:11:58 } +2024-07-26 00:01:07,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 320/ 1625], loss: 1.129, per_step_time: 1470ms, lr: 3.7802492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:07,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.44028 samples/s/p 1:11:48 } +2024-07-26 00:01:10,483 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 322/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 3.7765808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:10,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.43997 samples/s/p 1:11:45 } +2024-07-26 00:01:13,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 324/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 3.772916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:13,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.43571 samples/s/p 1:11:46 } +2024-07-26 00:01:16,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 326/ 1625], loss: 1.304, per_step_time: 1470ms, lr: 3.7692557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:16,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.44007 samples/s/p 1:11:39 } +2024-07-26 00:01:19,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 328/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 3.7655932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:19,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.43480 samples/s/p 1:11:41 } +2024-07-26 00:01:22,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 330/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 3.7619338e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:22,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.43953 samples/s/p 1:11:34 } +2024-07-26 00:01:25,233 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 332/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 3.75828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:25,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.43385 samples/s/p 1:11:36 } +2024-07-26 00:01:28,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 334/ 1625], loss: 1.120, per_step_time: 1469ms, lr: 3.7546238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:28,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.44273 samples/s/p 1:11:26 } +2024-07-26 00:01:31,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 336/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 3.750974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:31,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43943 samples/s/p 1:11:25 } +2024-07-26 00:01:34,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 338/ 1625], loss: 1.289, per_step_time: 1471ms, lr: 3.7473242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:34,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43574 samples/s/p 1:11:25 } +2024-07-26 00:01:37,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 340/ 1625], loss: 1.269, per_step_time: 1471ms, lr: 3.7436744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:37,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43531 samples/s/p 1:11:23 } +2024-07-26 00:01:39,982 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 342/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 3.740031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:39,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43516 samples/s/p 1:11:20 } +2024-07-26 00:01:42,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 344/ 1625], loss: 1.247, per_step_time: 1473ms, lr: 3.736388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:42,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43013 samples/s/p 1:11:21 } +2024-07-26 00:01:45,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 346/ 1625], loss: 0.863, per_step_time: 1471ms, lr: 3.732745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:45,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43588 samples/s/p 1:11:13 } +2024-07-26 00:01:48,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 348/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 3.7291084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:48,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43751 samples/s/p 1:11:09 } +2024-07-26 00:01:51,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 350/ 1625], loss: 1.044, per_step_time: 1473ms, lr: 3.7254713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:51,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.42965 samples/s/p 1:11:12 } +2024-07-26 00:01:54,740 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 352/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 3.721836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:54,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.43672 samples/s/p 1:11:04 } +2024-07-26 00:01:57,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 354/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 3.7182035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:57,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.43139 samples/s/p 1:11:05 } +2024-07-26 00:02:00,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 356/ 1625], loss: 1.363, per_step_time: 1475ms, lr: 3.7145737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:00,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.42280 samples/s/p 1:11:09 } +2024-07-26 00:02:03,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 358/ 1625], loss: 1.143, per_step_time: 1474ms, lr: 3.7109462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:03,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.42710 samples/s/p 1:11:03 } +2024-07-26 00:02:06,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 360/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 3.70732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:06,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.43854 samples/s/p 1:10:51 } +2024-07-26 00:02:09,505 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 362/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 3.7036962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:09,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.43598 samples/s/p 1:10:50 } +2024-07-26 00:02:12,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 364/ 1625], loss: 1.313, per_step_time: 1474ms, lr: 3.7000773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:12,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.42399 samples/s/p 1:10:56 } +2024-07-26 00:02:15,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 366/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 3.6964552e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:15,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.43823 samples/s/p 1:10:42 } +2024-07-26 00:02:18,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 368/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 3.6928382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:18,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.43408 samples/s/p 1:10:42 } +2024-07-26 00:02:21,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 370/ 1625], loss: 1.399, per_step_time: 1473ms, lr: 3.6892257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:21,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.42746 samples/s/p 1:10:45 } +2024-07-26 00:02:24,273 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 372/ 1625], loss: 1.125, per_step_time: 1473ms, lr: 3.6856104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:24,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.42838 samples/s/p 1:10:41 } +2024-07-26 00:02:27,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 374/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 3.6819997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:27,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.43598 samples/s/p 1:10:32 } +2024-07-26 00:02:30,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 376/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 3.678394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:30,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.43185 samples/s/p 1:10:32 } +2024-07-26 00:02:33,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 378/ 1625], loss: 1.106, per_step_time: 1473ms, lr: 3.6747856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:33,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.42888 samples/s/p 1:10:32 } +2024-07-26 00:02:36,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 380/ 1625], loss: 1.104, per_step_time: 1474ms, lr: 3.671183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:36,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.42644 samples/s/p 1:10:31 } +2024-07-26 00:02:39,038 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 382/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 3.667582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:39,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43311 samples/s/p 1:10:22 } +2024-07-26 00:02:41,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 384/ 1625], loss: 1.105, per_step_time: 1474ms, lr: 3.6639794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:41,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.42482 samples/s/p 1:10:26 } +2024-07-26 00:02:44,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 386/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 3.6603833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:44,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43392 samples/s/p 1:10:16 } +2024-07-26 00:02:47,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 388/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 3.656788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:47,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43373 samples/s/p 1:10:13 } +2024-07-26 00:02:50,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 390/ 1625], loss: 1.160, per_step_time: 1473ms, lr: 3.6531942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:50,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.42994 samples/s/p 1:10:13 } +2024-07-26 00:02:53,801 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 392/ 1625], loss: 1.270, per_step_time: 1470ms, lr: 3.6496049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:53,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43857 samples/s/p 1:10:04 } +2024-07-26 00:02:56,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 394/ 1625], loss: 0.928, per_step_time: 1473ms, lr: 3.6460156e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:56,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.42827 samples/s/p 1:10:09 } +2024-07-26 00:02:59,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 396/ 1625], loss: 1.022, per_step_time: 1471ms, lr: 3.642429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:59,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43645 samples/s/p 1:09:59 } +2024-07-26 00:03:02,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 398/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 3.638845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:02,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43723 samples/s/p 1:09:56 } +2024-07-26 00:03:05,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 400/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 3.6352626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:05,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43764 samples/s/p 1:09:52 } +2024-07-26 00:03:08,559 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 402/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 3.6316828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:08,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43152 samples/s/p 1:09:54 } +2024-07-26 00:03:11,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 404/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 3.6281049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:11,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43470 samples/s/p 1:09:49 } +2024-07-26 00:03:14,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 406/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 3.6245292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:14,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43281 samples/s/p 1:09:47 } +2024-07-26 00:03:17,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 408/ 1625], loss: 1.059, per_step_time: 1472ms, lr: 3.6209553e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:17,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43123 samples/s/p 1:09:46 } +2024-07-26 00:03:20,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 410/ 1625], loss: 1.160, per_step_time: 1473ms, lr: 3.6173842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:20,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.42869 samples/s/p 1:09:45 } +2024-07-26 00:03:23,323 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 412/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 3.613815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:23,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43234 samples/s/p 1:09:39 } +2024-07-26 00:03:26,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 414/ 1625], loss: 1.053, per_step_time: 1473ms, lr: 3.6102506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:26,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43078 samples/s/p 1:09:37 } +2024-07-26 00:03:29,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 416/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 3.606684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:29,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43251 samples/s/p 1:09:33 } +2024-07-26 00:03:32,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 418/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 3.6031215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:32,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43210 samples/s/p 1:09:30 } +2024-07-26 00:03:35,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 420/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 3.5995631e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:35,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43279 samples/s/p 1:09:27 } +2024-07-26 00:03:38,083 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 422/ 1625], loss: 1.059, per_step_time: 1471ms, lr: 3.5960024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:38,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43696 samples/s/p 1:09:21 } +2024-07-26 00:03:41,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 424/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 3.5924495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:41,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43323 samples/s/p 1:09:21 } +2024-07-26 00:03:43,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 426/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 3.5888947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:43,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43147 samples/s/p 1:09:19 } +2024-07-26 00:03:46,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 428/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 3.5853418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:46,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43620 samples/s/p 1:09:12 } +2024-07-26 00:03:49,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 430/ 1625], loss: 1.095, per_step_time: 1473ms, lr: 3.5817948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:49,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43024 samples/s/p 1:09:14 } +2024-07-26 00:03:52,841 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 432/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 3.5782468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:52,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43831 samples/s/p 1:09:05 } +2024-07-26 00:03:55,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 434/ 1625], loss: 1.134, per_step_time: 1473ms, lr: 3.5747025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:55,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.42999 samples/s/p 1:09:08 } +2024-07-26 00:03:58,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 436/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 3.57116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:58,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43455 samples/s/p 1:09:02 } +2024-07-26 00:04:01,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 438/ 1625], loss: 1.138, per_step_time: 1474ms, lr: 3.567619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:01,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.42588 samples/s/p 1:09:06 } +2024-07-26 00:04:04,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 440/ 1625], loss: 0.942, per_step_time: 1470ms, lr: 3.5640805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:04,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43851 samples/s/p 1:08:53 } +2024-07-26 00:04:07,604 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 442/ 1625], loss: 1.173, per_step_time: 1473ms, lr: 3.5605449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:07,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43094 samples/s/p 1:08:56 } +2024-07-26 00:04:10,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 444/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 3.557011e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:10,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43425 samples/s/p 1:08:50 } +2024-07-26 00:04:13,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 446/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 3.5534795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:13,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43148 samples/s/p 1:08:50 } +2024-07-26 00:04:16,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 448/ 1625], loss: 1.162, per_step_time: 1486ms, lr: 3.5499497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:16,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.38354 samples/s/p 1:09:23 } +2024-07-26 00:04:19,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 450/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 3.5464218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:19,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43651 samples/s/p 1:08:40 } +2024-07-26 00:04:22,389 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 452/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 3.5428975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:22,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43485 samples/s/p 1:08:38 } +2024-07-26 00:04:25,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 454/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 3.5393746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:25,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43673 samples/s/p 1:08:34 } +2024-07-26 00:04:28,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 456/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 3.5358544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:28,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43664 samples/s/p 1:08:31 } +2024-07-26 00:04:31,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 458/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 3.532336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:31,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43384 samples/s/p 1:08:30 } +2024-07-26 00:04:34,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 460/ 1625], loss: 1.344, per_step_time: 1476ms, lr: 3.5288194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:34,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.41880 samples/s/p 1:08:38 } +2024-07-26 00:04:37,152 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 462/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 3.525307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:37,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43542 samples/s/p 1:08:23 } +2024-07-26 00:04:40,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 464/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 3.5217954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:40,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43290 samples/s/p 1:08:22 } +2024-07-26 00:04:43,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 466/ 1625], loss: 1.228, per_step_time: 1474ms, lr: 3.5182838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:43,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.42393 samples/s/p 1:08:26 } +2024-07-26 00:04:46,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 468/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 3.5147787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:46,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43811 samples/s/p 1:08:12 } +2024-07-26 00:04:48,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 470/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 3.511273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:48,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43822 samples/s/p 1:08:09 } +2024-07-26 00:04:51,907 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 472/ 1625], loss: 1.018, per_step_time: 1469ms, lr: 3.5077683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:51,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.44318 samples/s/p 1:08:02 } +2024-07-26 00:04:54,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 474/ 1625], loss: 1.285, per_step_time: 1469ms, lr: 3.50427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:54,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.44430 samples/s/p 1:07:59 } +2024-07-26 00:04:57,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 476/ 1625], loss: 1.278, per_step_time: 1470ms, lr: 3.5007715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:57,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43886 samples/s/p 1:08:00 } +2024-07-26 00:05:00,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 478/ 1625], loss: 1.040, per_step_time: 1472ms, lr: 3.4972754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:00,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43110 samples/s/p 1:08:03 } +2024-07-26 00:05:03,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 480/ 1625], loss: 0.944, per_step_time: 1471ms, lr: 3.4937802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:03,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43540 samples/s/p 1:07:56 } +2024-07-26 00:05:06,654 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 482/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 3.4902887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:06,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43998 samples/s/p 1:07:50 } +2024-07-26 00:05:09,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 484/ 1625], loss: 1.196, per_step_time: 1470ms, lr: 3.4867994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:09,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43922 samples/s/p 1:07:48 } +2024-07-26 00:05:12,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 486/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 3.4833124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:12,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43510 samples/s/p 1:07:48 } +2024-07-26 00:05:15,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 488/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 3.4798268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:15,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43329 samples/s/p 1:07:46 } +2024-07-26 00:05:18,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 490/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 3.4763439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:18,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43508 samples/s/p 1:07:42 } +2024-07-26 00:05:21,411 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 492/ 1625], loss: 1.010, per_step_time: 1473ms, lr: 3.4728632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:21,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43059 samples/s/p 1:07:42 } +2024-07-26 00:05:24,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 494/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 3.4693844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:24,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43675 samples/s/p 1:07:35 } +2024-07-26 00:05:27,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 496/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 3.4659074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:27,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43534 samples/s/p 1:07:33 } +2024-07-26 00:05:30,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 498/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 3.4624331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:30,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43135 samples/s/p 1:07:33 } +2024-07-26 00:05:33,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 500/ 1625], loss: 1.072, per_step_time: 1470ms, lr: 3.4589616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:33,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43972 samples/s/p 1:07:24 } +2024-07-26 00:05:36,166 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 502/ 1625], loss: 1.184, per_step_time: 1473ms, lr: 3.4554914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:36,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43056 samples/s/p 1:07:28 } +2024-07-26 00:05:39,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 504/ 1625], loss: 1.095, per_step_time: 1474ms, lr: 3.452024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:39,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.42704 samples/s/p 1:07:27 } +2024-07-26 00:05:42,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 506/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 3.448562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:42,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43550 samples/s/p 1:07:18 } +2024-07-26 00:05:45,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 508/ 1625], loss: 1.050, per_step_time: 1473ms, lr: 3.4450968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:45,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.42889 samples/s/p 1:07:20 } +2024-07-26 00:05:47,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 510/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 3.4416348e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:47,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43279 samples/s/p 1:07:14 } +2024-07-26 00:05:50,934 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 512/ 1625], loss: 1.109, per_step_time: 1473ms, lr: 3.4381792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:50,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.42961 samples/s/p 1:07:14 } +2024-07-26 00:05:53,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 514/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 3.4347222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:53,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43402 samples/s/p 1:07:07 } +2024-07-26 00:05:56,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 516/ 1625], loss: 1.178, per_step_time: 1474ms, lr: 3.431267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:56,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.42578 samples/s/p 1:07:11 } +2024-07-26 00:05:59,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 518/ 1625], loss: 1.259, per_step_time: 1473ms, lr: 3.4278169e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:59,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.42838 samples/s/p 1:07:06 } +2024-07-26 00:06:02,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 520/ 1625], loss: 1.023, per_step_time: 1472ms, lr: 3.4243667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:02,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43363 samples/s/p 1:06:59 } +2024-07-26 00:06:05,698 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 522/ 1625], loss: 1.001, per_step_time: 1471ms, lr: 3.4209197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:05,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43537 samples/s/p 1:06:55 } +2024-07-26 00:06:08,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 524/ 1625], loss: 0.867, per_step_time: 1471ms, lr: 3.417474e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:08,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43542 samples/s/p 1:06:52 } +2024-07-26 00:06:11,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 526/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 3.4140307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:11,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43777 samples/s/p 1:06:47 } +2024-07-26 00:06:14,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 528/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 3.4105901e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:14,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43637 samples/s/p 1:06:45 } +2024-07-26 00:06:17,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 530/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 3.4071522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:17,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43688 samples/s/p 1:06:42 } +2024-07-26 00:06:20,449 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 532/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 3.4037148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:20,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43501 samples/s/p 1:06:40 } +2024-07-26 00:06:23,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 534/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 3.400282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:23,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43797 samples/s/p 1:06:35 } +2024-07-26 00:06:26,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 536/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 3.39685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:26,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43522 samples/s/p 1:06:34 } +2024-07-26 00:06:29,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 538/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 3.3934198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:29,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43785 samples/s/p 1:06:29 } +2024-07-26 00:06:32,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 540/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 3.3899928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:32,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43646 samples/s/p 1:06:27 } +2024-07-26 00:06:35,196 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 542/ 1625], loss: 1.121, per_step_time: 1469ms, lr: 3.386568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:35,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.44234 samples/s/p 1:06:20 } +2024-07-26 00:06:38,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 544/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 3.3831452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:38,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43563 samples/s/p 1:06:22 } +2024-07-26 00:06:41,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 546/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 3.3797246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:41,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43341 samples/s/p 1:06:21 } +2024-07-26 00:06:44,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 548/ 1625], loss: 1.089, per_step_time: 1468ms, lr: 3.3763054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:44,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.44598 samples/s/p 1:06:09 } +2024-07-26 00:06:46,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 550/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 3.3728916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:46,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43363 samples/s/p 1:06:15 } +2024-07-26 00:06:49,948 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 552/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 3.369476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:49,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43243 samples/s/p 1:06:13 } +2024-07-26 00:06:52,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 554/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 3.366064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:52,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43736 samples/s/p 1:06:06 } +2024-07-26 00:06:55,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 556/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 3.3626561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:55,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43565 samples/s/p 1:06:04 } +2024-07-26 00:06:58,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 558/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 3.3592482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:58,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43174 samples/s/p 1:06:04 } +2024-07-26 00:07:01,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 560/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 3.3558422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:01,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43781 samples/s/p 1:05:57 } +2024-07-26 00:07:04,703 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 562/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 3.3524425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:04,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43452 samples/s/p 1:05:56 } +2024-07-26 00:07:07,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 564/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 3.3490414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:07,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43194 samples/s/p 1:05:55 } +2024-07-26 00:07:10,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 566/ 1625], loss: 1.083, per_step_time: 1473ms, lr: 3.345643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:10,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.42900 samples/s/p 1:05:55 } +2024-07-26 00:07:13,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 568/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 3.3422466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:13,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43412 samples/s/p 1:05:48 } +2024-07-26 00:07:16,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 570/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 3.3388533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:16,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.44011 samples/s/p 1:05:41 } +2024-07-26 00:07:19,461 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 572/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 3.3354622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:19,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43412 samples/s/p 1:05:42 } +2024-07-26 00:07:22,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 574/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 3.3320725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:22,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43440 samples/s/p 1:05:39 } +2024-07-26 00:07:25,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 576/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 3.3286851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:25,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43296 samples/s/p 1:05:37 } +2024-07-26 00:07:28,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 578/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 3.325301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:28,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43632 samples/s/p 1:05:32 } +2024-07-26 00:07:31,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 580/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 3.321918e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:31,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43346 samples/s/p 1:05:31 } +2024-07-26 00:07:34,221 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 582/ 1625], loss: 1.174, per_step_time: 1473ms, lr: 3.318538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:34,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.42944 samples/s/p 1:05:31 } +2024-07-26 00:07:37,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 584/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 3.3151605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:37,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43322 samples/s/p 1:05:25 } +2024-07-26 00:07:40,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 586/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 3.3117835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:40,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43366 samples/s/p 1:05:22 } +2024-07-26 00:07:43,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 588/ 1625], loss: 1.052, per_step_time: 1471ms, lr: 3.3084107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:43,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43689 samples/s/p 1:05:16 } +2024-07-26 00:07:46,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 590/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 3.3050396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:46,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43154 samples/s/p 1:05:17 } +2024-07-26 00:07:48,977 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 592/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 3.3016709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:48,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.44002 samples/s/p 1:05:08 } +2024-07-26 00:07:51,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 594/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 3.2983044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:51,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43500 samples/s/p 1:05:09 } +2024-07-26 00:07:54,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 596/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 3.2949383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:54,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43050 samples/s/p 1:05:09 } +2024-07-26 00:07:57,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 598/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 3.2915755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:57,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43551 samples/s/p 1:05:03 } +2024-07-26 00:08:00,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 600/ 1625], loss: 1.328, per_step_time: 1472ms, lr: 3.2882176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:00,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43286 samples/s/p 1:05:02 } +2024-07-26 00:08:03,733 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 602/ 1625], loss: 1.340, per_step_time: 1470ms, lr: 3.2848575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:03,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.44124 samples/s/p 1:04:53 } +2024-07-26 00:08:06,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 604/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 3.281505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:06,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43759 samples/s/p 1:04:52 } +2024-07-26 00:08:09,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 606/ 1625], loss: 1.069, per_step_time: 1473ms, lr: 3.2781509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:09,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.42777 samples/s/p 1:04:56 } +2024-07-26 00:08:12,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 608/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 3.274798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:12,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43201 samples/s/p 1:04:51 } +2024-07-26 00:08:15,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 610/ 1625], loss: 1.189, per_step_time: 1470ms, lr: 3.271452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:15,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43918 samples/s/p 1:04:42 } +2024-07-26 00:08:18,488 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 612/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 3.2681055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:18,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43757 samples/s/p 1:04:41 } +2024-07-26 00:08:21,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 614/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 3.2647613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:21,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43578 samples/s/p 1:04:39 } +2024-07-26 00:08:24,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 616/ 1625], loss: 1.279, per_step_time: 1473ms, lr: 3.2614184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:24,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43021 samples/s/p 1:04:40 } +2024-07-26 00:08:27,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 618/ 1625], loss: 1.291, per_step_time: 1470ms, lr: 3.2580788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:27,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43967 samples/s/p 1:04:30 } +2024-07-26 00:08:30,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 620/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 3.2547418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:30,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43704 samples/s/p 1:04:29 } +2024-07-26 00:08:33,240 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 622/ 1625], loss: 1.304, per_step_time: 1471ms, lr: 3.2514067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:33,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43813 samples/s/p 1:04:26 } +2024-07-26 00:08:36,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 624/ 1625], loss: 1.032, per_step_time: 1471ms, lr: 3.2480734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:36,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43797 samples/s/p 1:04:23 } +2024-07-26 00:08:39,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 626/ 1625], loss: 1.105, per_step_time: 1470ms, lr: 3.2447433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:39,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.44163 samples/s/p 1:04:17 } +2024-07-26 00:08:42,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 628/ 1625], loss: 1.020, per_step_time: 1470ms, lr: 3.241415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:42,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.43910 samples/s/p 1:04:16 } +2024-07-26 00:08:45,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 630/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 3.2380885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:45,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.43556 samples/s/p 1:04:16 } +2024-07-26 00:08:47,991 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 632/ 1625], loss: 1.199, per_step_time: 1473ms, lr: 3.2347662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:47,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.43016 samples/s/p 1:04:16 } +2024-07-26 00:08:50,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 634/ 1625], loss: 1.274, per_step_time: 1473ms, lr: 3.2314433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:50,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.43038 samples/s/p 1:04:13 } +2024-07-26 00:08:53,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 636/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 3.2281246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:53,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.43505 samples/s/p 1:04:07 } +2024-07-26 00:08:56,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 638/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 3.224808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:56,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.43654 samples/s/p 1:04:03 } +2024-07-26 00:08:59,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 640/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 3.221492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:59,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.42954 samples/s/p 1:04:05 } +2024-07-26 00:09:02,754 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 642/ 1625], loss: 1.075, per_step_time: 1473ms, lr: 3.2181792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:02,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.42812 samples/s/p 1:04:03 } +2024-07-26 00:09:05,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 644/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 3.214871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:05,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.43450 samples/s/p 1:03:56 } +2024-07-26 00:09:08,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 646/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 3.2115609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:08,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.43459 samples/s/p 1:03:53 } +2024-07-26 00:09:11,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 648/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 3.2082567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:11,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.43735 samples/s/p 1:03:48 } +2024-07-26 00:09:14,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 650/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 3.2049534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:14,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.43778 samples/s/p 1:03:45 } +2024-07-26 00:09:17,503 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 652/ 1625], loss: 1.200, per_step_time: 1469ms, lr: 3.20165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:17,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.44261 samples/s/p 1:03:38 } +2024-07-26 00:09:20,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 654/ 1625], loss: 1.020, per_step_time: 1471ms, lr: 3.1983536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:20,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.43839 samples/s/p 1:03:38 } +2024-07-26 00:09:23,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 656/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 3.1950567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:23,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.43171 samples/s/p 1:03:40 } +2024-07-26 00:09:26,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 658/ 1625], loss: 1.274, per_step_time: 1471ms, lr: 3.1917602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:26,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.43550 samples/s/p 1:03:34 } +2024-07-26 00:09:29,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 660/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 3.1884701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:29,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43443 samples/s/p 1:03:32 } +2024-07-26 00:09:32,257 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 662/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 3.1851805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:32,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43726 samples/s/p 1:03:27 } +2024-07-26 00:09:35,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 664/ 1625], loss: 0.933, per_step_time: 1478ms, lr: 3.1818931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:35,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.40972 samples/s/p 1:03:44 } +2024-07-26 00:09:38,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 666/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 3.1786071e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:38,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43548 samples/s/p 1:03:23 } +2024-07-26 00:09:41,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 668/ 1625], loss: 1.047, per_step_time: 1473ms, lr: 3.1753243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:41,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43066 samples/s/p 1:03:23 } +2024-07-26 00:09:44,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 670/ 1625], loss: 1.257, per_step_time: 1476ms, lr: 3.1720447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:44,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.41746 samples/s/p 1:03:29 } +2024-07-26 00:09:47,038 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 672/ 1625], loss: 1.009, per_step_time: 1471ms, lr: 3.1687646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:47,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43613 samples/s/p 1:03:13 } +2024-07-26 00:09:49,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 674/ 1625], loss: 1.014, per_step_time: 1472ms, lr: 3.1654881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:49,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43470 samples/s/p 1:03:11 } +2024-07-26 00:09:52,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 676/ 1625], loss: 1.079, per_step_time: 1473ms, lr: 3.1622171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:52,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43055 samples/s/p 1:03:11 } +2024-07-26 00:09:55,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 678/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 3.1589434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:55,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.44007 samples/s/p 1:03:02 } +2024-07-26 00:09:58,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 680/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 3.1556738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:58,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43773 samples/s/p 1:03:00 } +2024-07-26 00:10:01,793 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 682/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 3.1524087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:01,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43250 samples/s/p 1:03:01 } +2024-07-26 00:10:04,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 684/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 3.1491418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:04,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43577 samples/s/p 1:02:56 } +2024-07-26 00:10:07,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 686/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 3.1458799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:07,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43646 samples/s/p 1:02:53 } +2024-07-26 00:10:10,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 688/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 3.1426216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:10,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43391 samples/s/p 1:02:51 } +2024-07-26 00:10:13,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 690/ 1625], loss: 1.115, per_step_time: 1469ms, lr: 3.1393615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:13,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.44350 samples/s/p 1:02:42 } +2024-07-26 00:10:16,542 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 692/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 3.1361074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:16,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43630 samples/s/p 1:02:44 } +2024-07-26 00:10:19,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 694/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 3.1328536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:19,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43944 samples/s/p 1:02:39 } +2024-07-26 00:10:22,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 696/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 3.1296004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:22,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43146 samples/s/p 1:02:41 } +2024-07-26 00:10:25,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 698/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 3.1263544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:25,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43586 samples/s/p 1:02:35 } +2024-07-26 00:10:28,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 700/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 3.123107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:28,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43684 samples/s/p 1:02:32 } +2024-07-26 00:10:31,297 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 702/ 1625], loss: 1.047, per_step_time: 1471ms, lr: 3.119862e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:31,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43590 samples/s/p 1:02:29 } +2024-07-26 00:10:34,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 704/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 3.116621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:34,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43308 samples/s/p 1:02:28 } +2024-07-26 00:10:37,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 706/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 3.1133818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:37,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43183 samples/s/p 1:02:26 } +2024-07-26 00:10:40,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 708/ 1625], loss: 1.261, per_step_time: 1470ms, lr: 3.110144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:40,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43998 samples/s/p 1:02:18 } +2024-07-26 00:10:43,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 710/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 3.106909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:43,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.44107 samples/s/p 1:02:14 } +2024-07-26 00:10:46,050 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 712/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 3.1036766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:46,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43331 samples/s/p 1:02:16 } +2024-07-26 00:10:49,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 714/ 1625], loss: 1.361, per_step_time: 1472ms, lr: 3.100446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:49,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43140 samples/s/p 1:02:15 } +2024-07-26 00:10:51,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 716/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 3.0972174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:51,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43389 samples/s/p 1:02:10 } +2024-07-26 00:10:54,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 718/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 3.093991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:54,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43608 samples/s/p 1:02:06 } +2024-07-26 00:10:57,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 720/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 3.090769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:57,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43609 samples/s/p 1:02:03 } +2024-07-26 00:11:00,813 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 722/ 1625], loss: 1.131, per_step_time: 1474ms, lr: 3.0875462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:00,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.42599 samples/s/p 1:02:07 } +2024-07-26 00:11:03,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 724/ 1625], loss: 1.065, per_step_time: 1472ms, lr: 3.0843275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:03,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43347 samples/s/p 1:01:59 } +2024-07-26 00:11:06,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 726/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 3.0811125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:06,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43765 samples/s/p 1:01:53 } +2024-07-26 00:11:09,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 728/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 3.0778956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:09,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43234 samples/s/p 1:01:54 } +2024-07-26 00:11:12,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 730/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 3.0746833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:12,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43697 samples/s/p 1:01:47 } +2024-07-26 00:11:15,572 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 732/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 3.071475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:15,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.42993 samples/s/p 1:01:49 } +2024-07-26 00:11:18,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 734/ 1625], loss: 1.249, per_step_time: 1474ms, lr: 3.0682659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:18,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.42686 samples/s/p 1:01:48 } +2024-07-26 00:11:21,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 736/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 3.0650622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:21,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43011 samples/s/p 1:01:43 } +2024-07-26 00:11:24,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 738/ 1625], loss: 1.250, per_step_time: 1471ms, lr: 3.0618598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:24,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43694 samples/s/p 1:01:36 } +2024-07-26 00:11:27,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 740/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 3.058657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:27,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43732 samples/s/p 1:01:32 } +2024-07-26 00:11:30,333 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 742/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 3.0554602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:30,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43494 samples/s/p 1:01:31 } +2024-07-26 00:11:33,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 744/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 3.0522642e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:33,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43577 samples/s/p 1:01:28 } +2024-07-26 00:11:36,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 746/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 3.0490683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:36,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.42923 samples/s/p 1:01:29 } +2024-07-26 00:11:39,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 748/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 3.045879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:39,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43530 samples/s/p 1:01:22 } +2024-07-26 00:11:42,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 750/ 1625], loss: 1.126, per_step_time: 1473ms, lr: 3.042689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:42,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.42941 samples/s/p 1:01:23 } +2024-07-26 00:11:45,092 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 752/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 3.0395022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:45,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43852 samples/s/p 1:01:14 } +2024-07-26 00:11:48,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 754/ 1625], loss: 1.324, per_step_time: 1471ms, lr: 3.0363185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:48,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43527 samples/s/p 1:01:13 } +2024-07-26 00:11:50,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 756/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 3.0331362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:50,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.44155 samples/s/p 1:01:06 } +2024-07-26 00:11:53,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 758/ 1625], loss: 1.239, per_step_time: 1472ms, lr: 3.0299557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:53,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.43201 samples/s/p 1:01:10 } +2024-07-26 00:11:56,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 760/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 3.026778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:56,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.42915 samples/s/p 1:01:09 } +2024-07-26 00:11:59,849 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 762/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 3.0236024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:59,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.43322 samples/s/p 1:01:03 } +2024-07-26 00:12:02,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 764/ 1625], loss: 1.068, per_step_time: 1473ms, lr: 3.0204305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:02,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.42890 samples/s/p 1:01:03 } +2024-07-26 00:12:05,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 766/ 1625], loss: 1.281, per_step_time: 1470ms, lr: 3.0172578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:05,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.44076 samples/s/p 1:00:52 } +2024-07-26 00:12:08,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 768/ 1625], loss: 1.183, per_step_time: 1468ms, lr: 3.0140895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:08,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.44654 samples/s/p 1:00:45 } +2024-07-26 00:12:11,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 770/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 3.0109254e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:11,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.43350 samples/s/p 1:00:51 } +2024-07-26 00:12:14,597 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 772/ 1625], loss: 1.137, per_step_time: 1470ms, lr: 3.0077595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:14,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.44052 samples/s/p 1:00:43 } +2024-07-26 00:12:17,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 774/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 3.004599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:17,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43645 samples/s/p 1:00:43 } +2024-07-26 00:12:20,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 776/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 3.0014398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:20,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43967 samples/s/p 1:00:38 } +2024-07-26 00:12:23,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 778/ 1625], loss: 1.340, per_step_time: 1472ms, lr: 2.9982812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:23,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43426 samples/s/p 1:00:39 } +2024-07-26 00:12:26,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 780/ 1625], loss: 1.123, per_step_time: 1470ms, lr: 2.9951293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:26,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.44074 samples/s/p 1:00:31 } +2024-07-26 00:12:29,345 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 782/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 2.9919756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:29,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43561 samples/s/p 1:00:32 } +2024-07-26 00:12:32,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 784/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 2.9888242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:32,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43347 samples/s/p 1:00:30 } +2024-07-26 00:12:35,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 786/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 2.9856783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:35,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43799 samples/s/p 1:00:24 } +2024-07-26 00:12:38,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 788/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 2.9825324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:38,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43400 samples/s/p 1:00:24 } +2024-07-26 00:12:41,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 790/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 2.9793891e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:41,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43297 samples/s/p 1:00:22 } +2024-07-26 00:12:44,099 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 792/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 2.9762482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:44,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43863 samples/s/p 1:00:15 } +2024-07-26 00:12:47,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 794/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.97311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:47,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43220 samples/s/p 1:00:16 } +2024-07-26 00:12:50,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 796/ 1625], loss: 1.261, per_step_time: 1473ms, lr: 2.9699736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:50,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43084 samples/s/p 1:00:14 } +2024-07-26 00:12:52,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 798/ 1625], loss: 1.240, per_step_time: 1469ms, lr: 2.96684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:52,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.44260 samples/s/p 1:00:04 } +2024-07-26 00:12:55,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 800/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 2.9637085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:55,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43424 samples/s/p 1:00:06 } +2024-07-26 00:12:58,855 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 802/ 1625], loss: 1.042, per_step_time: 1472ms, lr: 2.960579e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:58,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43445 samples/s/p 1:00:03 } +2024-07-26 00:13:01,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 804/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.9574521e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:01,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43375 samples/s/p 1:00:01 } +2024-07-26 00:13:04,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 806/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 2.954328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:04,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.42823 samples/s/p 1:00:01 } +2024-07-26 00:13:07,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 808/ 1625], loss: 1.087, per_step_time: 1473ms, lr: 2.9512053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:07,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43058 samples/s/p 0:59:57 } +2024-07-26 00:13:10,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 810/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 2.9480843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:10,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.44169 samples/s/p 0:59:47 } +2024-07-26 00:13:13,613 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 812/ 1625], loss: 1.103, per_step_time: 1471ms, lr: 2.944967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:13,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43535 samples/s/p 0:59:48 } +2024-07-26 00:13:16,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 814/ 1625], loss: 1.246, per_step_time: 1473ms, lr: 2.941853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:16,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.42769 samples/s/p 0:59:50 } +2024-07-26 00:13:19,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 816/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.9387393e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:19,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43310 samples/s/p 0:59:43 } +2024-07-26 00:13:22,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 818/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 2.9356302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:22,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43332 samples/s/p 0:59:40 } +2024-07-26 00:13:25,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 820/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.9325206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:25,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43313 samples/s/p 0:59:38 } +2024-07-26 00:13:28,376 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 822/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.9294138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:28,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43325 samples/s/p 0:59:35 } +2024-07-26 00:13:31,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 824/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 2.926312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:31,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43218 samples/s/p 0:59:32 } +2024-07-26 00:13:34,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 826/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.9232092e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:34,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43393 samples/s/p 0:59:28 } +2024-07-26 00:13:37,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 828/ 1625], loss: 1.355, per_step_time: 1472ms, lr: 2.9201092e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:37,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43178 samples/s/p 0:59:27 } +2024-07-26 00:13:40,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 830/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 2.9170133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:40,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43374 samples/s/p 0:59:22 } +2024-07-26 00:13:43,137 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 832/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 2.91392e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:43,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43315 samples/s/p 0:59:20 } +2024-07-26 00:13:46,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 834/ 1625], loss: 1.292, per_step_time: 1470ms, lr: 2.9108269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:46,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43874 samples/s/p 0:59:13 } +2024-07-26 00:13:49,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 836/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 2.9077378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:49,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43988 samples/s/p 0:59:10 } +2024-07-26 00:13:51,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 838/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 2.9046491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:51,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43875 samples/s/p 0:59:07 } +2024-07-26 00:13:54,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 840/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.9015653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:54,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43570 samples/s/p 0:59:06 } +2024-07-26 00:13:57,883 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 842/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.8984814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:57,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43759 samples/s/p 0:59:02 } +2024-07-26 00:14:00,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 844/ 1625], loss: 1.302, per_step_time: 1473ms, lr: 2.8954005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:00,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43099 samples/s/p 0:59:04 } +2024-07-26 00:14:03,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 846/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 2.8923228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:03,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43673 samples/s/p 0:58:57 } +2024-07-26 00:14:06,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 848/ 1625], loss: 1.067, per_step_time: 1471ms, lr: 2.8892468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:06,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43804 samples/s/p 0:58:53 } +2024-07-26 00:14:09,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 850/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 2.8861737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:09,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43745 samples/s/p 0:58:51 } +2024-07-26 00:14:12,639 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 852/ 1625], loss: 1.092, per_step_time: 1473ms, lr: 2.8831018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:12,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.42991 samples/s/p 0:58:53 } +2024-07-26 00:14:15,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 854/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 2.8800328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:15,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43204 samples/s/p 0:58:48 } +2024-07-26 00:14:18,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 856/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 2.8769664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:18,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43112 samples/s/p 0:58:46 } +2024-07-26 00:14:21,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 858/ 1625], loss: 1.232, per_step_time: 1470ms, lr: 2.8739028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:21,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43862 samples/s/p 0:58:38 } +2024-07-26 00:14:24,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 860/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 2.8708405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:24,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43802 samples/s/p 0:58:35 } +2024-07-26 00:14:27,394 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 862/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 2.8677819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:27,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43504 samples/s/p 0:58:34 } +2024-07-26 00:14:30,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 864/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 2.864725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:30,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43589 samples/s/p 0:58:31 } +2024-07-26 00:14:33,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 866/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 2.861669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:33,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43557 samples/s/p 0:58:28 } +2024-07-26 00:14:36,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 868/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.8586173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:36,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43299 samples/s/p 0:58:27 } +2024-07-26 00:14:39,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 870/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 2.8555673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:39,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43726 samples/s/p 0:58:21 } +2024-07-26 00:14:42,149 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 872/ 1625], loss: 1.303, per_step_time: 1472ms, lr: 2.8525174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:42,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43441 samples/s/p 0:58:20 } +2024-07-26 00:14:45,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 874/ 1625], loss: 1.195, per_step_time: 1469ms, lr: 2.8494742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:45,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.44408 samples/s/p 0:58:11 } +2024-07-26 00:14:48,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 876/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 2.846431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:48,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43532 samples/s/p 0:58:14 } +2024-07-26 00:14:50,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 878/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.8433897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:50,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43631 samples/s/p 0:58:10 } +2024-07-26 00:14:53,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 880/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 2.840351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:53,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43241 samples/s/p 0:58:10 } +2024-07-26 00:14:56,897 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 882/ 1625], loss: 1.040, per_step_time: 1471ms, lr: 2.8373138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:56,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43829 samples/s/p 0:58:03 } +2024-07-26 00:14:59,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 884/ 1625], loss: 1.003, per_step_time: 1471ms, lr: 2.834281e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:59,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43619 samples/s/p 0:58:01 } +2024-07-26 00:15:02,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 886/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 2.8312493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:02,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43667 samples/s/p 0:57:58 } +2024-07-26 00:15:05,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 888/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 2.8282202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:05,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43965 samples/s/p 0:57:53 } +2024-07-26 00:15:08,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 890/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 2.8251925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:08,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43191 samples/s/p 0:57:55 } +2024-07-26 00:15:11,649 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 892/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.8221684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:11,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43709 samples/s/p 0:57:49 } +2024-07-26 00:15:14,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 894/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 2.8191462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:14,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.44031 samples/s/p 0:57:44 } +2024-07-26 00:15:17,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 896/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.8161264e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:17,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43823 samples/s/p 0:57:42 } +2024-07-26 00:15:20,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 898/ 1625], loss: 1.000, per_step_time: 1470ms, lr: 2.8131085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:20,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.44214 samples/s/p 0:57:37 } +2024-07-26 00:15:23,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 900/ 1625], loss: 1.073, per_step_time: 1473ms, lr: 2.810094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:23,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43108 samples/s/p 0:57:41 } +2024-07-26 00:15:26,400 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 902/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.8070801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:26,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43145 samples/s/p 0:57:38 } +2024-07-26 00:15:29,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 904/ 1625], loss: 0.917, per_step_time: 1471ms, lr: 2.8040708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:29,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43660 samples/s/p 0:57:32 } +2024-07-26 00:15:32,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 906/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 2.801064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:32,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43640 samples/s/p 0:57:29 } +2024-07-26 00:15:35,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 908/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 2.7980554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:35,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43779 samples/s/p 0:57:25 } +2024-07-26 00:15:38,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 910/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 2.795052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:38,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43459 samples/s/p 0:57:24 } +2024-07-26 00:15:41,155 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 912/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 2.7920532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:41,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.42869 samples/s/p 0:57:25 } +2024-07-26 00:15:44,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 914/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.7890542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:44,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43252 samples/s/p 0:57:20 } +2024-07-26 00:15:47,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 916/ 1625], loss: 0.870, per_step_time: 1472ms, lr: 2.7860576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:47,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43250 samples/s/p 0:57:17 } +2024-07-26 00:15:50,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 918/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.7830638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:50,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43637 samples/s/p 0:57:11 } +2024-07-26 00:15:52,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 920/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.7800718e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:52,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43577 samples/s/p 0:57:09 } +2024-07-26 00:15:55,911 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 922/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 2.7770823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:55,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43540 samples/s/p 0:57:06 } +2024-07-26 00:15:58,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 924/ 1625], loss: 1.066, per_step_time: 1472ms, lr: 2.7740953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:58,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43251 samples/s/p 0:57:05 } +2024-07-26 00:16:01,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 926/ 1625], loss: 1.031, per_step_time: 1472ms, lr: 2.771111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:01,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43429 samples/s/p 0:57:01 } +2024-07-26 00:16:04,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 928/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.7681276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:04,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43327 samples/s/p 0:56:58 } +2024-07-26 00:16:07,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 930/ 1625], loss: 0.997, per_step_time: 1472ms, lr: 2.7651486e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:07,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43459 samples/s/p 0:56:55 } +2024-07-26 00:16:10,667 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 932/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.7621702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:10,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43827 samples/s/p 0:56:49 } +2024-07-26 00:16:13,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 934/ 1625], loss: 1.073, per_step_time: 1473ms, lr: 2.7591964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:13,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.42995 samples/s/p 0:56:52 } +2024-07-26 00:16:16,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 936/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.7562223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:16,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43252 samples/s/p 0:56:47 } +2024-07-26 00:16:19,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 938/ 1625], loss: 1.038, per_step_time: 1470ms, lr: 2.7532528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:19,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43881 samples/s/p 0:56:40 } +2024-07-26 00:16:22,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 940/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 2.750283e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:22,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43479 samples/s/p 0:56:40 } +2024-07-26 00:16:25,431 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 942/ 1625], loss: 1.108, per_step_time: 1475ms, lr: 2.747317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:25,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.42160 samples/s/p 0:56:45 } +2024-07-26 00:16:28,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 944/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.744356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:28,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43305 samples/s/p 0:56:35 } +2024-07-26 00:16:31,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 946/ 1625], loss: 0.959, per_step_time: 1470ms, lr: 2.7413932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:31,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.44003 samples/s/p 0:56:28 } +2024-07-26 00:16:34,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 948/ 1625], loss: 0.966, per_step_time: 1471ms, lr: 2.738434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:34,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43739 samples/s/p 0:56:26 } +2024-07-26 00:16:37,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 950/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 2.735479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:37,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.44147 samples/s/p 0:56:21 } +2024-07-26 00:16:40,181 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 952/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 2.732524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:40,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43346 samples/s/p 0:56:23 } +2024-07-26 00:16:43,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 954/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.7295719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:43,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43386 samples/s/p 0:56:20 } +2024-07-26 00:16:46,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 956/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.7266237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:46,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43440 samples/s/p 0:56:17 } +2024-07-26 00:16:49,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 958/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 2.7236756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:49,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43188 samples/s/p 0:56:15 } +2024-07-26 00:16:51,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 960/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.720732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:51,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43118 samples/s/p 0:56:13 } +2024-07-26 00:16:54,939 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 962/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 2.7177894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:54,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43806 samples/s/p 0:56:05 } +2024-07-26 00:16:57,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 964/ 1625], loss: 1.026, per_step_time: 1471ms, lr: 2.714848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:57,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43634 samples/s/p 0:56:04 } +2024-07-26 00:17:00,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 966/ 1625], loss: 1.189, per_step_time: 1469ms, lr: 2.7119122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:00,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.44235 samples/s/p 0:55:57 } +2024-07-26 00:17:03,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 968/ 1625], loss: 0.983, per_step_time: 1472ms, lr: 2.7089773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:03,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.43273 samples/s/p 0:56:00 } +2024-07-26 00:17:06,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 970/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 2.7060437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:06,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.43525 samples/s/p 0:55:55 } +2024-07-26 00:17:09,693 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 972/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.703113e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:09,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.43092 samples/s/p 0:55:55 } +2024-07-26 00:17:12,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 974/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 2.700185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:12,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.43776 samples/s/p 0:55:48 } +2024-07-26 00:17:15,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 976/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.6972593e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:15,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.43359 samples/s/p 0:55:48 } +2024-07-26 00:17:18,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 978/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 2.6943355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:18,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.43274 samples/s/p 0:55:45 } +2024-07-26 00:17:21,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 980/ 1625], loss: 1.079, per_step_time: 1473ms, lr: 2.6914145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:21,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.42901 samples/s/p 0:55:44 } +2024-07-26 00:17:24,450 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 982/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 2.6884966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:24,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.43874 samples/s/p 0:55:36 } +2024-07-26 00:17:27,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 984/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 2.6855796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:27,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43596 samples/s/p 0:55:34 } +2024-07-26 00:17:30,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 986/ 1625], loss: 1.115, per_step_time: 1474ms, lr: 2.6826654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:30,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.42694 samples/s/p 0:55:37 } +2024-07-26 00:17:33,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 988/ 1625], loss: 1.194, per_step_time: 1474ms, lr: 2.679756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:33,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.42706 samples/s/p 0:55:34 } +2024-07-26 00:17:36,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 990/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 2.6768446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:36,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43357 samples/s/p 0:55:27 } +2024-07-26 00:17:39,212 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 992/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 2.673938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:39,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43757 samples/s/p 0:55:22 } +2024-07-26 00:17:42,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 994/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 2.671035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:42,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43670 samples/s/p 0:55:19 } +2024-07-26 00:17:45,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 996/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 2.668131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:45,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.42760 samples/s/p 0:55:22 } +2024-07-26 00:17:48,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 998/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 2.6652315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:48,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43787 samples/s/p 0:55:13 } +2024-07-26 00:17:51,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1000/ 1625], loss: 1.319, per_step_time: 1469ms, lr: 2.662336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:51,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.44291 samples/s/p 0:55:07 } +2024-07-26 00:17:51,015 - 
mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-26 00:18:27,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1002/ 1625], loss: 1.150, per_step_time: 1472ms, lr: 2.659439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:27,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.43311 samples/s/p 0:55:10 } +2024-07-26 00:18:29,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1004/ 1625], loss: 1.076, per_step_time: 1474ms, lr: 2.656548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:29,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.42591 samples/s/p 0:55:11 } +2024-07-26 00:18:32,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1006/ 1625], loss: 1.134, per_step_time: 1469ms, lr: 2.653658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:32,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.44485 samples/s/p 0:54:57 } +2024-07-26 00:18:35,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1008/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.6507678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:35,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.43765 samples/s/p 0:54:58 } +2024-07-26 00:18:38,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1010/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.6478838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:38,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% 
|███████████████████████████████████████████ | 5.43282 samples/s/p 0:54:58 } +2024-07-26 00:18:41,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1012/ 1625], loss: 0.992, per_step_time: 1471ms, lr: 2.6450007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:41,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.43609 samples/s/p 0:54:53 } +2024-07-26 00:18:44,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1014/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.6421183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:44,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.43770 samples/s/p 0:54:49 } +2024-07-26 00:18:47,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1016/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.639241e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:47,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.43393 samples/s/p 0:54:48 } +2024-07-26 00:18:50,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1018/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 2.6363648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:50,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.44067 samples/s/p 0:54:41 } +2024-07-26 00:18:53,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1020/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 2.633492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:53,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% 
|███████████████████████████████████████████ | 5.43612 samples/s/p 0:54:41 } +2024-07-26 00:18:56,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1022/ 1625], loss: 1.070, per_step_time: 1470ms, lr: 2.6306209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:56,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.44000 samples/s/p 0:54:36 } +2024-07-26 00:18:59,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1024/ 1625], loss: 1.351, per_step_time: 1472ms, lr: 2.6277507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:59,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.43281 samples/s/p 0:54:37 } +2024-07-26 00:19:02,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1026/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 2.6248856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:02,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.43644 samples/s/p 0:54:32 } +2024-07-26 00:19:05,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1028/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.6220205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:05,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.43382 samples/s/p 0:54:31 } +2024-07-26 00:19:08,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1030/ 1625], loss: 1.269, per_step_time: 1471ms, lr: 2.619159e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:08,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% 
|███████████████████████████████████████████ | 5.43599 samples/s/p 0:54:27 } +2024-07-26 00:19:11,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1032/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 2.616301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:11,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43199 samples/s/p 0:54:26 } +2024-07-26 00:19:14,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1034/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 2.613442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:14,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43160 samples/s/p 0:54:23 } +2024-07-26 00:19:17,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1036/ 1625], loss: 1.320, per_step_time: 1472ms, lr: 2.6105872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:17,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43336 samples/s/p 0:54:19 } +2024-07-26 00:19:20,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1038/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 2.6077369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:20,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43460 samples/s/p 0:54:16 } +2024-07-26 00:19:23,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1040/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.6048856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:23,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% 
|███████████████████████████████████████████ | 5.43147 samples/s/p 0:54:15 } +2024-07-26 00:19:26,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1042/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 2.6020389e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:26,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43285 samples/s/p 0:54:11 } +2024-07-26 00:19:29,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1044/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.5991944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:29,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43708 samples/s/p 0:54:05 } +2024-07-26 00:19:31,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1046/ 1625], loss: 1.062, per_step_time: 1470ms, lr: 2.5963493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:31,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.44071 samples/s/p 0:54:00 } +2024-07-26 00:19:34,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1048/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 2.593511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:34,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43268 samples/s/p 0:54:02 } +2024-07-26 00:19:37,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1050/ 1625], loss: 1.452, per_step_time: 1471ms, lr: 2.590673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:37,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% 
|███████████████████████████████████████████ | 5.43752 samples/s/p 0:53:56 } +2024-07-26 00:19:40,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1052/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 2.5878362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:40,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.42936 samples/s/p 0:53:58 } +2024-07-26 00:19:43,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1054/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 2.585004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:43,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.43150 samples/s/p 0:53:54 } +2024-07-26 00:19:46,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1056/ 1625], loss: 1.037, per_step_time: 1471ms, lr: 2.5821737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:46,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.43484 samples/s/p 0:53:49 } +2024-07-26 00:19:49,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1058/ 1625], loss: 1.155, per_step_time: 1478ms, lr: 2.5793431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:49,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.41132 samples/s/p 0:54:00 } +2024-07-26 00:19:52,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1060/ 1625], loss: 1.268, per_step_time: 1472ms, lr: 2.5765178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:52,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% 
|███████████████████████████████████████████ | 5.43212 samples/s/p 0:53:45 } +2024-07-26 00:19:55,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1062/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 2.573695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:55,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.43968 samples/s/p 0:53:37 } +2024-07-26 00:19:58,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1064/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.5708741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:58,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.43463 samples/s/p 0:53:37 } +2024-07-26 00:20:01,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1066/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 2.568054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:01,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.43372 samples/s/p 0:53:35 } +2024-07-26 00:20:04,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1068/ 1625], loss: 1.254, per_step_time: 1474ms, lr: 2.5652375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:04,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.42706 samples/s/p 0:53:36 } +2024-07-26 00:20:07,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1070/ 1625], loss: 1.088, per_step_time: 1472ms, lr: 2.5624233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:07,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% 
|███████████████████████████████████████████ | 5.43365 samples/s/p 0:53:29 } +2024-07-26 00:20:10,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1072/ 1625], loss: 1.112, per_step_time: 1477ms, lr: 2.5596119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:10,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.41489 samples/s/p 0:53:37 } +2024-07-26 00:20:13,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1074/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 2.556802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:13,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.43650 samples/s/p 0:53:22 } +2024-07-26 00:20:16,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1076/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 2.5539966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:16,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.43251 samples/s/p 0:53:21 } +2024-07-26 00:20:19,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1078/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 2.5511913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:19,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.43884 samples/s/p 0:53:14 } +2024-07-26 00:20:22,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1080/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.5483885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:22,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% 
|███████████████████████████████████████████ | 5.43368 samples/s/p 0:53:14 } +2024-07-26 00:20:25,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1082/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 2.54559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:25,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.42980 samples/s/p 0:53:14 } +2024-07-26 00:20:28,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1084/ 1625], loss: 1.008, per_step_time: 1469ms, lr: 2.5427914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:28,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.44271 samples/s/p 0:53:03 } +2024-07-26 00:20:31,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1086/ 1625], loss: 1.048, per_step_time: 1473ms, lr: 2.5399972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:31,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.43074 samples/s/p 0:53:07 } +2024-07-26 00:20:33,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1088/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.5372049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:33,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.43208 samples/s/p 0:53:04 } +2024-07-26 00:20:36,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1090/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 2.5344134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:36,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% 
|███████████████████████████████████████████ | 5.44149 samples/s/p 0:52:55 } +2024-07-26 00:20:39,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1092/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 2.5316276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:39,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.43806 samples/s/p 0:52:54 } +2024-07-26 00:20:42,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1094/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 2.5288423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:42,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.43422 samples/s/p 0:52:53 } +2024-07-26 00:20:45,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1096/ 1625], loss: 1.088, per_step_time: 1476ms, lr: 2.5260574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:45,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.41851 samples/s/p 0:53:00 } +2024-07-26 00:20:48,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1098/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 2.523278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:48,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.43238 samples/s/p 0:52:49 } +2024-07-26 00:20:51,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1100/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 2.5204995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:51,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% 
|███████████████████████████████████████████ | 5.43059 samples/s/p 0:52:47 } +2024-07-26 00:20:54,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1102/ 1625], loss: 1.340, per_step_time: 1473ms, lr: 2.5177233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:54,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.42850 samples/s/p 0:52:45 } +2024-07-26 00:20:57,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1104/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 2.514951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:57,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.43513 samples/s/p 0:52:38 } +2024-07-26 00:21:00,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1106/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 2.512179e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:00,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.43412 samples/s/p 0:52:36 } +2024-07-26 00:21:03,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1108/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 2.50941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:03,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.43022 samples/s/p 0:52:35 } +2024-07-26 00:21:06,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1110/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.5066433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:06,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% 
|███████████████████████████████████████████ | 5.43157 samples/s/p 0:52:31 } +2024-07-26 00:21:09,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1112/ 1625], loss: 1.253, per_step_time: 1469ms, lr: 2.5038803e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:09,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.44385 samples/s/p 0:52:21 } +2024-07-26 00:21:12,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1114/ 1625], loss: 1.314, per_step_time: 1471ms, lr: 2.501119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:12,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43535 samples/s/p 0:52:23 } +2024-07-26 00:21:15,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1116/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 2.4983597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:15,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43437 samples/s/p 0:52:21 } +2024-07-26 00:21:18,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1118/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 2.4956034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:18,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.42909 samples/s/p 0:52:21 } +2024-07-26 00:21:21,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1120/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 2.49285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:21,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% 
|███████████████████████████████████████████ | 5.43176 samples/s/p 0:52:17 } +2024-07-26 00:21:24,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1122/ 1625], loss: 1.030, per_step_time: 1473ms, lr: 2.4900962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:24,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.42778 samples/s/p 0:52:16 } +2024-07-26 00:21:27,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1124/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 2.487347e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:27,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43162 samples/s/p 0:52:11 } +2024-07-26 00:21:30,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1126/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.4846013e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:30,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43152 samples/s/p 0:52:08 } +2024-07-26 00:21:33,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1128/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 2.4818555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:33,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43883 samples/s/p 0:52:01 } +2024-07-26 00:21:35,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1130/ 1625], loss: 1.253, per_step_time: 1474ms, lr: 2.4791148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:35,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% 
|███████████████████████████████████████████ | 5.42730 samples/s/p 0:52:04 } +2024-07-26 00:21:38,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1132/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 2.4763742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:38,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43787 samples/s/p 0:51:55 } +2024-07-26 00:21:41,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1134/ 1625], loss: 1.130, per_step_time: 1473ms, lr: 2.4736355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:41,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43061 samples/s/p 0:51:57 } +2024-07-26 00:21:44,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1136/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 2.4709016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:44,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43137 samples/s/p 0:51:53 } +2024-07-26 00:21:47,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1138/ 1625], loss: 1.050, per_step_time: 1472ms, lr: 2.468169e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:47,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43318 samples/s/p 0:51:49 } +2024-07-26 00:21:50,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1140/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 2.4654378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:50,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% 
|███████████████████████████████████████████ | 5.43168 samples/s/p 0:51:47 } +2024-07-26 00:21:53,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1142/ 1625], loss: 1.329, per_step_time: 1472ms, lr: 2.462711e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:53,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43226 samples/s/p 0:51:44 } +2024-07-26 00:21:56,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1144/ 1625], loss: 0.891, per_step_time: 1471ms, lr: 2.4599851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:56,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43761 samples/s/p 0:51:38 } +2024-07-26 00:21:59,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1146/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 2.4572619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:59,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.43416 samples/s/p 0:51:37 } +2024-07-26 00:22:02,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1148/ 1625], loss: 1.045, per_step_time: 1473ms, lr: 2.454542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:02,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.43107 samples/s/p 0:51:36 } +2024-07-26 00:22:05,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1150/ 1625], loss: 1.039, per_step_time: 1470ms, lr: 2.451823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:05,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% 
|███████████████████████████████████████████ | 5.43945 samples/s/p 0:51:28 } +2024-07-26 00:22:08,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1152/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.4491073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:08,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.43803 samples/s/p 0:51:26 } +2024-07-26 00:22:11,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1154/ 1625], loss: 1.103, per_step_time: 1474ms, lr: 2.4463939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:11,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.42606 samples/s/p 0:51:30 } +2024-07-26 00:22:14,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1156/ 1625], loss: 0.980, per_step_time: 1470ms, lr: 2.4436843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:14,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.43988 samples/s/p 0:51:19 } +2024-07-26 00:22:17,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1158/ 1625], loss: 1.250, per_step_time: 1471ms, lr: 2.4409746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:17,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.43573 samples/s/p 0:51:18 } +2024-07-26 00:22:20,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1160/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 2.438269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:20,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% 
|███████████████████████████████████████████ | 5.43338 samples/s/p 0:51:17 } +2024-07-26 00:22:23,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1162/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 2.4355654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:23,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43504 samples/s/p 0:51:13 } +2024-07-26 00:22:26,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1164/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 2.4328629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:26,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43445 samples/s/p 0:51:10 } +2024-07-26 00:22:29,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1166/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.4301635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:29,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43425 samples/s/p 0:51:07 } +2024-07-26 00:22:32,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1168/ 1625], loss: 1.249, per_step_time: 1474ms, lr: 2.427468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:32,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.42510 samples/s/p 0:51:10 } +2024-07-26 00:22:34,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1170/ 1625], loss: 1.032, per_step_time: 1470ms, lr: 2.424775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:34,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% 
|███████████████████████████████████████████ | 5.43918 samples/s/p 0:50:59 } +2024-07-26 00:22:37,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1172/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.4220817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:37,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43360 samples/s/p 0:50:59 } +2024-07-26 00:22:40,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1174/ 1625], loss: 1.028, per_step_time: 1470ms, lr: 2.4193941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:40,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43933 samples/s/p 0:50:53 } +2024-07-26 00:22:43,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1176/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 2.416707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:43,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.44120 samples/s/p 0:50:49 } +2024-07-26 00:22:46,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1178/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 2.4140209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:46,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43333 samples/s/p 0:50:50 } +2024-07-26 00:22:49,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1180/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 2.41134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:49,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% 
|███████████████████████████████████████████ | 5.43721 samples/s/p 0:50:45 } +2024-07-26 00:22:52,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1182/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 2.4086607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:52,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.44078 samples/s/p 0:50:40 } +2024-07-26 00:22:55,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1184/ 1625], loss: 1.029, per_step_time: 1472ms, lr: 2.4059823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:55,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.43474 samples/s/p 0:50:41 } +2024-07-26 00:22:58,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1186/ 1625], loss: 1.133, per_step_time: 1475ms, lr: 2.4033093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:58,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.42305 samples/s/p 0:50:44 } +2024-07-26 00:23:01,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1188/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 2.4006358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:01,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.43650 samples/s/p 0:50:34 } +2024-07-26 00:23:04,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1190/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 2.3979662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:04,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% 
|███████████████████████████████████████████ | 5.43051 samples/s/p 0:50:34 } +2024-07-26 00:23:07,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1192/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 2.3952991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:07,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.43651 samples/s/p 0:50:28 } +2024-07-26 00:23:10,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1194/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 2.3926336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:10,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.43761 samples/s/p 0:50:24 } +2024-07-26 00:23:13,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1196/ 1625], loss: 1.041, per_step_time: 1472ms, lr: 2.3899709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:13,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43414 samples/s/p 0:50:23 } +2024-07-26 00:23:16,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1198/ 1625], loss: 0.980, per_step_time: 1472ms, lr: 2.38731e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:16,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43451 samples/s/p 0:50:20 } +2024-07-26 00:23:19,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1200/ 1625], loss: 1.066, per_step_time: 1484ms, lr: 2.3846521e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:19,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% 
|███████████████████████████████████████████ | 5.38824 samples/s/p 0:50:43 } +2024-07-26 00:23:22,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1202/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 2.3819962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:22,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43295 samples/s/p 0:50:15 } +2024-07-26 00:23:25,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1204/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 2.3793439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:25,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.44004 samples/s/p 0:50:08 } +2024-07-26 00:23:28,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1206/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 2.3766931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:28,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43697 samples/s/p 0:50:07 } +2024-07-26 00:23:31,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1208/ 1625], loss: 1.045, per_step_time: 1471ms, lr: 2.374045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:31,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43584 samples/s/p 0:50:05 } +2024-07-26 00:23:34,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1210/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.3713997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:34,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% 
|███████████████████████████████████████████ | 5.43221 samples/s/p 0:50:04 } +2024-07-26 00:23:36,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1212/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 2.3687567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:36,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43822 samples/s/p 0:49:58 } +2024-07-26 00:23:39,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1214/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 2.3661146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:39,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43101 samples/s/p 0:49:59 } +2024-07-26 00:23:42,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1216/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 2.363476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:42,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43428 samples/s/p 0:49:54 } +2024-07-26 00:23:45,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1218/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.3608425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:45,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43285 samples/s/p 0:49:52 } +2024-07-26 00:23:48,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1220/ 1625], loss: 1.270, per_step_time: 1473ms, lr: 2.3582083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:48,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% 
|███████████████████████████████████████████ | 5.43031 samples/s/p 0:49:50 } +2024-07-26 00:23:51,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1222/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 2.3555756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:51,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43837 samples/s/p 0:49:43 } +2024-07-26 00:23:54,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1224/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 2.3529483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:54,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43341 samples/s/p 0:49:43 } +2024-07-26 00:23:57,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1226/ 1625], loss: 1.151, per_step_time: 1473ms, lr: 2.3503226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:57,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.42843 samples/s/p 0:49:42 } +2024-07-26 00:24:00,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1228/ 1625], loss: 1.219, per_step_time: 1473ms, lr: 2.3476969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:00,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.42970 samples/s/p 0:49:39 } +2024-07-26 00:24:03,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1230/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 2.3450757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:03,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% 
|███████████████████████████████████████████ | 5.43083 samples/s/p 0:49:35 } +2024-07-26 00:24:06,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1232/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 2.3424568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:06,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.43480 samples/s/p 0:49:30 } +2024-07-26 00:24:09,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1234/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 2.3398406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:09,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.44157 samples/s/p 0:49:23 } +2024-07-26 00:24:12,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1236/ 1625], loss: 0.972, per_step_time: 1470ms, lr: 2.3372272e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:12,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.44033 samples/s/p 0:49:21 } +2024-07-26 00:24:15,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1238/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.3346147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:15,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.43822 samples/s/p 0:49:19 } +2024-07-26 00:24:18,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1240/ 1625], loss: 1.348, per_step_time: 1472ms, lr: 2.3320054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:18,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% 
|███████████████████████████████████████████ | 5.43383 samples/s/p 0:49:19 } +2024-07-26 00:24:21,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1242/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 2.3293978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:21,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.42993 samples/s/p 0:49:18 } +2024-07-26 00:24:24,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1244/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.326794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:24,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43304 samples/s/p 0:49:13 } +2024-07-26 00:24:27,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1246/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 2.3241914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:27,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43623 samples/s/p 0:49:09 } +2024-07-26 00:24:30,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1248/ 1625], loss: 1.277, per_step_time: 1474ms, lr: 2.3215916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:30,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.42610 samples/s/p 0:49:11 } +2024-07-26 00:24:33,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1250/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.3189946e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:33,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% 
|███████████████████████████████████████████ | 5.43162 samples/s/p 0:49:05 } +2024-07-26 00:24:36,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1252/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 2.3164002e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:36,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43251 samples/s/p 0:49:02 } +2024-07-26 00:24:38,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1254/ 1625], loss: 1.057, per_step_time: 1472ms, lr: 2.3138073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:38,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43458 samples/s/p 0:48:58 } +2024-07-26 00:24:41,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1256/ 1625], loss: 1.316, per_step_time: 1473ms, lr: 2.3112189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:41,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.42773 samples/s/p 0:48:58 } +2024-07-26 00:24:44,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1258/ 1625], loss: 0.945, per_step_time: 1472ms, lr: 2.3086304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:44,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43267 samples/s/p 0:48:53 } +2024-07-26 00:24:47,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1260/ 1625], loss: 1.120, per_step_time: 1470ms, lr: 2.3060452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:47,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% 
|███████████████████████████████████████████ | 5.44060 samples/s/p 0:48:46 } +2024-07-26 00:24:50,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1262/ 1625], loss: 1.269, per_step_time: 1473ms, lr: 2.3034638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:50,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.42764 samples/s/p 0:48:50 } +2024-07-26 00:24:53,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1264/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 2.3008822e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:53,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.43361 samples/s/p 0:48:44 } +2024-07-26 00:24:56,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1266/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.298304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:56,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.43774 samples/s/p 0:48:38 } +2024-07-26 00:24:59,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1268/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.295731e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:59,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.43523 samples/s/p 0:48:37 } +2024-07-26 00:25:02,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1270/ 1625], loss: 0.994, per_step_time: 1470ms, lr: 2.2931574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:02,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% 
|███████████████████████████████████████████ | 5.43868 samples/s/p 0:48:32 } +2024-07-26 00:25:05,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1272/ 1625], loss: 1.139, per_step_time: 1469ms, lr: 2.290587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:05,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.44435 samples/s/p 0:48:26 } +2024-07-26 00:25:08,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1274/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 2.2880185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:08,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.43780 samples/s/p 0:48:27 } +2024-07-26 00:25:11,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1276/ 1625], loss: 1.382, per_step_time: 1473ms, lr: 2.2854533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:11,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.42980 samples/s/p 0:48:28 } +2024-07-26 00:25:14,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1278/ 1625], loss: 1.060, per_step_time: 1472ms, lr: 2.2828908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:14,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.43441 samples/s/p 0:48:22 } +2024-07-26 00:25:17,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1280/ 1625], loss: 1.104, per_step_time: 1469ms, lr: 2.28033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:17,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% 
|███████████████████████████████████████████ | 5.44458 samples/s/p 0:48:14 } +2024-07-26 00:25:20,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1282/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 2.2777717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:20,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.43916 samples/s/p 0:48:14 } +2024-07-26 00:25:23,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1284/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.275216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:23,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.43770 samples/s/p 0:48:12 } +2024-07-26 00:25:26,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1286/ 1625], loss: 1.319, per_step_time: 1473ms, lr: 2.2726622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:26,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.42757 samples/s/p 0:48:14 } +2024-07-26 00:25:29,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1288/ 1625], loss: 1.039, per_step_time: 1471ms, lr: 2.2701108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:29,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.43632 samples/s/p 0:48:07 } +2024-07-26 00:25:32,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1290/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 2.267563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:32,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% 
|███████████████████████████████████████████ | 5.43787 samples/s/p 0:48:03 } +2024-07-26 00:25:35,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1292/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 2.265017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:35,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.43714 samples/s/p 0:48:00 } +2024-07-26 00:25:37,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1294/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 2.2624724e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:37,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.43482 samples/s/p 0:47:59 } +2024-07-26 00:25:40,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1296/ 1625], loss: 1.243, per_step_time: 1474ms, lr: 2.2599315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:40,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.42578 samples/s/p 0:48:01 } +2024-07-26 00:25:43,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1298/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 2.2573931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:43,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.43654 samples/s/p 0:47:52 } +2024-07-26 00:25:46,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1300/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.254859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:46,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% 
|████████████████████████████████████████████ | 5.43439 samples/s/p 0:47:50 } +2024-07-26 00:25:49,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1302/ 1625], loss: 1.332, per_step_time: 1472ms, lr: 2.2523225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:49,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.43118 samples/s/p 0:47:49 } +2024-07-26 00:25:52,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1304/ 1625], loss: 0.976, per_step_time: 1471ms, lr: 2.2497911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:52,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.43590 samples/s/p 0:47:43 } +2024-07-26 00:25:55,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1306/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.2472648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:55,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.43290 samples/s/p 0:47:42 } +2024-07-26 00:25:58,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1308/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 2.244736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:58,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.43963 samples/s/p 0:47:36 } +2024-07-26 00:26:01,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1310/ 1625], loss: 1.267, per_step_time: 1475ms, lr: 2.2422114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:01,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% 
|████████████████████████████████████████████ | 5.42179 samples/s/p 0:47:42 } +2024-07-26 00:26:04,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1312/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 2.239692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:04,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.43104 samples/s/p 0:47:34 } +2024-07-26 00:26:07,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1314/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 2.237171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:07,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.43383 samples/s/p 0:47:30 } +2024-07-26 00:26:10,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1316/ 1625], loss: 1.257, per_step_time: 1474ms, lr: 2.234656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:10,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.42433 samples/s/p 0:47:32 } +2024-07-26 00:26:13,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1318/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.2321428e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:13,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.43336 samples/s/p 0:47:24 } +2024-07-26 00:26:16,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1320/ 1625], loss: 1.291, per_step_time: 1472ms, lr: 2.2296304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:16,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% 
|████████████████████████████████████████████ | 5.43264 samples/s/p 0:47:22 } +2024-07-26 00:26:19,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1322/ 1625], loss: 1.075, per_step_time: 1474ms, lr: 2.2271213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:19,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.42398 samples/s/p 0:47:23 } +2024-07-26 00:26:22,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1324/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.224614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:22,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.43166 samples/s/p 0:47:16 } +2024-07-26 00:26:25,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1326/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 2.2221093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:25,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.42952 samples/s/p 0:47:14 } +2024-07-26 00:26:28,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1328/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 2.2196073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:28,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43168 samples/s/p 0:47:10 } +2024-07-26 00:26:31,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1330/ 1625], loss: 1.076, per_step_time: 1474ms, lr: 2.217108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:31,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% 
|████████████████████████████████████████████ | 5.42616 samples/s/p 0:47:10 } +2024-07-26 00:26:34,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1332/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 2.21461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:34,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43497 samples/s/p 0:47:03 } +2024-07-26 00:26:37,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1334/ 1625], loss: 1.391, per_step_time: 1471ms, lr: 2.2121158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:37,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43736 samples/s/p 0:46:59 } +2024-07-26 00:26:39,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1336/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.2096242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:39,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43521 samples/s/p 0:46:57 } +2024-07-26 00:26:42,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1338/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 2.2071342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:42,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43455 samples/s/p 0:46:54 } +2024-07-26 00:26:45,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1340/ 1625], loss: 1.295, per_step_time: 1472ms, lr: 2.204648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:45,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% 
|████████████████████████████████████████████ | 5.43386 samples/s/p 0:46:51 } +2024-07-26 00:26:48,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1342/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 2.2021622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:48,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43887 samples/s/p 0:46:46 } +2024-07-26 00:26:51,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1344/ 1625], loss: 1.084, per_step_time: 1473ms, lr: 2.1996816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:51,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43034 samples/s/p 0:46:47 } +2024-07-26 00:26:54,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1346/ 1625], loss: 1.029, per_step_time: 1472ms, lr: 2.1971996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:54,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43477 samples/s/p 0:46:42 } +2024-07-26 00:26:57,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1348/ 1625], loss: 1.028, per_step_time: 1472ms, lr: 2.1947226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:57,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43388 samples/s/p 0:46:40 } +2024-07-26 00:27:00,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1350/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 2.192249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:00,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% 
|████████████████████████████████████████████ | 5.43405 samples/s/p 0:46:37 } +2024-07-26 00:27:03,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1352/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 2.1897754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:03,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43690 samples/s/p 0:46:32 } +2024-07-26 00:27:06,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1354/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.1873045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:06,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43594 samples/s/p 0:46:30 } +2024-07-26 00:27:09,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1356/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.1848386e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:09,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43506 samples/s/p 0:46:27 } +2024-07-26 00:27:12,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1358/ 1625], loss: 1.043, per_step_time: 1470ms, lr: 2.182372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:12,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43937 samples/s/p 0:46:22 } +2024-07-26 00:27:15,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1360/ 1625], loss: 1.318, per_step_time: 1469ms, lr: 2.1799106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:15,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% 
|████████████████████████████████████████████ | 5.44247 samples/s/p 0:46:18 } +2024-07-26 00:27:18,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1362/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 2.1774501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:18,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43402 samples/s/p 0:46:19 } +2024-07-26 00:27:21,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1364/ 1625], loss: 1.409, per_step_time: 1472ms, lr: 2.1749913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:21,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43404 samples/s/p 0:46:16 } +2024-07-26 00:27:24,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1366/ 1625], loss: 1.025, per_step_time: 1472ms, lr: 2.1725377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:24,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43437 samples/s/p 0:46:13 } +2024-07-26 00:27:27,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1368/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 2.1700848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:27,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43043 samples/s/p 0:46:12 } +2024-07-26 00:27:30,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1370/ 1625], loss: 1.246, per_step_time: 1473ms, lr: 2.1676337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:30,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% 
|████████████████████████████████████████████ | 5.43076 samples/s/p 0:46:09 } +2024-07-26 00:27:33,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1372/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 2.1651854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:33,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43845 samples/s/p 0:46:02 } +2024-07-26 00:27:36,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1374/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.1627402e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:36,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43830 samples/s/p 0:45:59 } +2024-07-26 00:27:39,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1376/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.160297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:39,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43447 samples/s/p 0:45:58 } +2024-07-26 00:27:41,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1378/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 2.1578562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:41,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43397 samples/s/p 0:45:55 } +2024-07-26 00:27:44,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1380/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 2.1554192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:44,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% 
|████████████████████████████████████████████ | 5.43255 samples/s/p 0:45:53 } +2024-07-26 00:27:47,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1382/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.1529827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:47,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43511 samples/s/p 0:45:49 } +2024-07-26 00:27:50,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1384/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.1505498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:50,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43231 samples/s/p 0:45:48 } +2024-07-26 00:27:53,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1386/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 2.1481196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:53,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.42982 samples/s/p 0:45:46 } +2024-07-26 00:27:56,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1388/ 1625], loss: 1.000, per_step_time: 1471ms, lr: 2.1456926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:56,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43488 samples/s/p 0:45:40 } +2024-07-26 00:27:59,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1390/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 2.1432647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:59,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% 
|████████████████████████████████████████████ | 5.44217 samples/s/p 0:45:34 } +2024-07-26 00:28:02,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1392/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.1408423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:02,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.43232 samples/s/p 0:45:36 } +2024-07-26 00:28:05,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1394/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.1384217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:05,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.43691 samples/s/p 0:45:30 } +2024-07-26 00:28:08,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1396/ 1625], loss: 1.053, per_step_time: 1473ms, lr: 2.1360033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:08,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.43040 samples/s/p 0:45:31 } +2024-07-26 00:28:11,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1398/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 2.1335868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:11,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.43764 samples/s/p 0:45:24 } +2024-07-26 00:28:14,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1400/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.1311748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:14,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% 
|████████████████████████████████████████████ | 5.43632 samples/s/p 0:45:22 } +2024-07-26 00:28:17,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1402/ 1625], loss: 0.976, per_step_time: 1471ms, lr: 2.1287624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:17,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.43767 samples/s/p 0:45:18 } +2024-07-26 00:28:20,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1404/ 1625], loss: 1.053, per_step_time: 1473ms, lr: 2.1263554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:20,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.42915 samples/s/p 0:45:20 } +2024-07-26 00:28:23,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1406/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 2.1239493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:23,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43622 samples/s/p 0:45:13 } +2024-07-26 00:28:26,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1408/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 2.1215442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:26,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43494 samples/s/p 0:45:11 } +2024-07-26 00:28:29,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1410/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 2.119145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:29,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% 
|████████████████████████████████████████████ | 5.43758 samples/s/p 0:45:07 } +2024-07-26 00:28:32,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1412/ 1625], loss: 0.981, per_step_time: 1472ms, lr: 2.1167457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:32,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43407 samples/s/p 0:45:05 } +2024-07-26 00:28:35,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1414/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.1143492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:35,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43484 samples/s/p 0:45:02 } +2024-07-26 00:28:38,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1416/ 1625], loss: 1.008, per_step_time: 1471ms, lr: 2.111955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:38,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43626 samples/s/p 0:44:58 } +2024-07-26 00:28:40,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1418/ 1625], loss: 0.921, per_step_time: 1471ms, lr: 2.1095645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:40,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43693 samples/s/p 0:44:55 } +2024-07-26 00:28:43,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1420/ 1625], loss: 1.351, per_step_time: 1470ms, lr: 2.1071755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:43,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% 
|████████████████████████████████████████████ | 5.43957 samples/s/p 0:44:51 } +2024-07-26 00:28:46,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1422/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.1047895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:46,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43590 samples/s/p 0:44:50 } +2024-07-26 00:28:49,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1424/ 1625], loss: 0.926, per_step_time: 1470ms, lr: 2.1024048e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:49,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43854 samples/s/p 0:44:46 } +2024-07-26 00:28:52,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1426/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 2.1000246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:52,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43676 samples/s/p 0:44:43 } +2024-07-26 00:28:55,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1428/ 1625], loss: 1.217, per_step_time: 1473ms, lr: 2.0976454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:55,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.42806 samples/s/p 0:44:45 } +2024-07-26 00:28:58,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1430/ 1625], loss: 1.302, per_step_time: 1470ms, lr: 2.0952687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:58,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% 
|████████████████████████████████████████████ | 5.44058 samples/s/p 0:44:36 } +2024-07-26 00:29:01,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1432/ 1625], loss: 0.986, per_step_time: 1472ms, lr: 2.0928962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:01,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43272 samples/s/p 0:44:37 } +2024-07-26 00:29:04,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1434/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.0905238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:04,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43685 samples/s/p 0:44:32 } +2024-07-26 00:29:07,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1436/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 2.088154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:07,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43397 samples/s/p 0:44:30 } +2024-07-26 00:29:10,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1438/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.0857894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:10,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43493 samples/s/p 0:44:27 } +2024-07-26 00:29:13,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1440/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.0834239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:13,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% 
|████████████████████████████████████████████ | 5.43367 samples/s/p 0:44:24 } +2024-07-26 00:29:16,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1442/ 1625], loss: 0.973, per_step_time: 1471ms, lr: 2.0810635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:16,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43762 samples/s/p 0:44:19 } +2024-07-26 00:29:19,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1444/ 1625], loss: 1.023, per_step_time: 1472ms, lr: 2.0787043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:19,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43302 samples/s/p 0:44:19 } +2024-07-26 00:29:22,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1446/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 2.0763464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:22,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43547 samples/s/p 0:44:15 } +2024-07-26 00:29:25,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1448/ 1625], loss: 0.923, per_step_time: 1472ms, lr: 2.073995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:25,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43132 samples/s/p 0:44:14 } +2024-07-26 00:29:28,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1450/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.0716423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:28,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% 
|████████████████████████████████████████████ | 5.43186 samples/s/p 0:44:11 } +2024-07-26 00:29:31,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1452/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 2.0692923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:31,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43746 samples/s/p 0:44:05 } +2024-07-26 00:29:34,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1454/ 1625], loss: 1.408, per_step_time: 1472ms, lr: 2.0669459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:34,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43288 samples/s/p 0:44:04 } +2024-07-26 00:29:37,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1456/ 1625], loss: 1.039, per_step_time: 1472ms, lr: 2.0646019e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:37,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43215 samples/s/p 0:44:02 } +2024-07-26 00:29:40,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1458/ 1625], loss: 1.205, per_step_time: 1473ms, lr: 2.0622606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:40,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43063 samples/s/p 0:43:59 } +2024-07-26 00:29:42,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1460/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.059921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:42,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% 
|████████████████████████████████████████████ | 5.43614 samples/s/p 0:43:54 } +2024-07-26 00:29:45,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1462/ 1625], loss: 1.218, per_step_time: 1470ms, lr: 2.0575849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:45,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43920 samples/s/p 0:43:49 } +2024-07-26 00:29:48,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1464/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 2.0552507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:48,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43424 samples/s/p 0:43:49 } +2024-07-26 00:29:51,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1466/ 1625], loss: 1.090, per_step_time: 1473ms, lr: 2.0529178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:51,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.42825 samples/s/p 0:43:49 } +2024-07-26 00:29:54,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1468/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 2.0505895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:54,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43179 samples/s/p 0:43:44 } +2024-07-26 00:29:57,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1470/ 1625], loss: 1.185, per_step_time: 1473ms, lr: 2.048264e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:57,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% 
|████████████████████████████████████████████ | 5.43095 samples/s/p 0:43:42 } +2024-07-26 00:30:00,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1472/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 2.045938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:00,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.42987 samples/s/p 0:43:39 } +2024-07-26 00:30:03,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1474/ 1625], loss: 1.049, per_step_time: 1473ms, lr: 2.0436166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:03,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.42982 samples/s/p 0:43:36 } +2024-07-26 00:30:06,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1476/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 2.0412986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:06,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.43037 samples/s/p 0:43:33 } +2024-07-26 00:30:09,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1478/ 1625], loss: 1.079, per_step_time: 1470ms, lr: 2.0389798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:09,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.44107 samples/s/p 0:43:25 } +2024-07-26 00:30:12,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1480/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 2.0366654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:12,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% 
|████████████████████████████████████████████ | 5.43792 samples/s/p 0:43:23 } +2024-07-26 00:30:15,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1482/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 2.034355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:15,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.44144 samples/s/p 0:43:19 } +2024-07-26 00:30:18,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1484/ 1625], loss: 1.056, per_step_time: 1470ms, lr: 2.032044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:18,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.43948 samples/s/p 0:43:17 } +2024-07-26 00:30:21,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1486/ 1625], loss: 1.227, per_step_time: 1470ms, lr: 2.0297382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:21,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.44161 samples/s/p 0:43:13 } +2024-07-26 00:30:24,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1488/ 1625], loss: 1.273, per_step_time: 1472ms, lr: 2.0274342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:24,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43463 samples/s/p 0:43:13 } +2024-07-26 00:30:27,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1490/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 2.025131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:27,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% 
|████████████████████████████████████████████ | 5.43986 samples/s/p 0:43:08 } +2024-07-26 00:30:30,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1492/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.0228326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:30,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43610 samples/s/p 0:43:07 } +2024-07-26 00:30:33,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1494/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 2.0205355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:33,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43608 samples/s/p 0:43:04 } +2024-07-26 00:30:36,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1496/ 1625], loss: 1.193, per_step_time: 1469ms, lr: 2.0182401e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:36,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.44404 samples/s/p 0:42:57 } +2024-07-26 00:30:39,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1498/ 1625], loss: 1.111, per_step_time: 1471ms, lr: 2.0159487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:39,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43716 samples/s/p 0:42:57 } +2024-07-26 00:30:41,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1500/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.0136595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:41,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% 
|████████████████████████████████████████████ | 5.43711 samples/s/p 0:42:54 } +2024-07-26 00:30:44,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1502/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.0113716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:44,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43434 samples/s/p 0:42:53 } +2024-07-26 00:30:47,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1504/ 1625], loss: 1.056, per_step_time: 1470ms, lr: 2.0090874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:47,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43982 samples/s/p 0:42:47 } +2024-07-26 00:30:50,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1506/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.0068057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:50,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43899 samples/s/p 0:42:45 } +2024-07-26 00:30:53,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1508/ 1625], loss: 1.013, per_step_time: 1471ms, lr: 2.0045259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:53,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43806 samples/s/p 0:42:42 } +2024-07-26 00:30:56,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1510/ 1625], loss: 1.035, per_step_time: 1470ms, lr: 2.0022485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:56,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% 
|████████████████████████████████████████████ | 5.43942 samples/s/p 0:42:39 } +2024-07-26 00:30:59,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1512/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 1.9999738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:59,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43592 samples/s/p 0:42:37 } +2024-07-26 00:31:02,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1514/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 1.9977024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:02,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43751 samples/s/p 0:42:34 } +2024-07-26 00:31:05,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1516/ 1625], loss: 1.226, per_step_time: 1470ms, lr: 1.9954318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:05,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43890 samples/s/p 0:42:30 } +2024-07-26 00:31:08,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1518/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 1.9931658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:08,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43176 samples/s/p 0:42:30 } +2024-07-26 00:31:11,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1520/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.9909023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:11,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% 
|████████████████████████████████████████████ | 5.44020 samples/s/p 0:42:24 } +2024-07-26 00:31:14,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1522/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 1.988638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:14,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.43609 samples/s/p 0:42:23 } +2024-07-26 00:31:17,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1524/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 1.9863796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:17,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.44140 samples/s/p 0:42:17 } +2024-07-26 00:31:20,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1526/ 1625], loss: 1.031, per_step_time: 1470ms, lr: 1.9841232e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:20,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.44106 samples/s/p 0:42:14 } +2024-07-26 00:31:23,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1528/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 1.9818672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:23,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.43546 samples/s/p 0:42:14 } +2024-07-26 00:31:26,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1530/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.9796166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:26,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% 
|████████████████████████████████████████████ | 5.43822 samples/s/p 0:42:10 } +2024-07-26 00:31:29,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1532/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.977366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:29,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.43410 samples/s/p 0:42:09 } +2024-07-26 00:31:32,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1534/ 1625], loss: 1.170, per_step_time: 1473ms, lr: 1.9751183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:32,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.42809 samples/s/p 0:42:09 } +2024-07-26 00:31:35,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1536/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.9728745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:35,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.43666 samples/s/p 0:42:02 } +2024-07-26 00:31:38,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1538/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 1.9706317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:38,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.43319 samples/s/p 0:42:00 } +2024-07-26 00:31:40,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1540/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 1.9683916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:40,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% 
|████████████████████████████████████████████ | 5.43310 samples/s/p 0:41:57 } +2024-07-26 00:31:43,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1542/ 1625], loss: 1.079, per_step_time: 1472ms, lr: 1.9661557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:43,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.43197 samples/s/p 0:41:55 } +2024-07-26 00:31:46,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1544/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 1.9639208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:46,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.42927 samples/s/p 0:41:53 } +2024-07-26 00:31:49,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1546/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 1.9616884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:49,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.43206 samples/s/p 0:41:49 } +2024-07-26 00:31:52,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1548/ 1625], loss: 1.151, per_step_time: 1470ms, lr: 1.9594595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:52,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.44189 samples/s/p 0:41:42 } +2024-07-26 00:31:55,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1550/ 1625], loss: 1.286, per_step_time: 1471ms, lr: 1.9572321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:55,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% 
|████████████████████████████████████████████ | 5.43624 samples/s/p 0:41:41 } +2024-07-26 00:31:58,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1552/ 1625], loss: 1.164, per_step_time: 1472ms, lr: 1.9550075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:58,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43160 samples/s/p 0:41:40 } +2024-07-26 00:32:01,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1554/ 1625], loss: 0.970, per_step_time: 1471ms, lr: 1.9527856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:01,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43810 samples/s/p 0:41:34 } +2024-07-26 00:32:04,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1556/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.9505653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:04,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43515 samples/s/p 0:41:33 } +2024-07-26 00:32:07,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1558/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 1.9483475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:07,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43744 samples/s/p 0:41:29 } +2024-07-26 00:32:10,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1560/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 1.9461334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:10,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% 
|████████████████████████████████████████████ | 5.43073 samples/s/p 0:41:29 } +2024-07-26 00:32:13,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1562/ 1625], loss: 1.074, per_step_time: 1470ms, lr: 1.9439217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:13,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.44086 samples/s/p 0:41:21 } +2024-07-26 00:32:16,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1564/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 1.941711e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:16,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43159 samples/s/p 0:41:23 } +2024-07-26 00:32:19,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1566/ 1625], loss: 1.263, per_step_time: 1476ms, lr: 1.9395043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:19,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.41879 samples/s/p 0:41:26 } +2024-07-26 00:32:22,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1568/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 1.9372997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:22,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43488 samples/s/p 0:41:15 } +2024-07-26 00:32:25,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1570/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 1.9350991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:25,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% 
|████████████████████████████████████████████ | 5.43843 samples/s/p 0:41:11 } +2024-07-26 00:32:28,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1572/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 1.932897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:28,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43452 samples/s/p 0:41:10 } +2024-07-26 00:32:31,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1574/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 1.9307017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:31,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43453 samples/s/p 0:41:07 } +2024-07-26 00:32:34,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1576/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.9285076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:34,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43719 samples/s/p 0:41:03 } +2024-07-26 00:32:37,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1578/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 1.926313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:37,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43802 samples/s/p 0:40:59 } +2024-07-26 00:32:39,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1580/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 1.9241247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:39,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% 
|████████████████████████████████████████████ | 5.43474 samples/s/p 0:40:58 } +2024-07-26 00:32:42,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1582/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 1.921938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:42,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43265 samples/s/p 0:40:56 } +2024-07-26 00:32:45,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1584/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 1.9197541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:45,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43731 samples/s/p 0:40:51 } +2024-07-26 00:32:48,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1586/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 1.917571e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:48,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.44023 samples/s/p 0:40:46 } +2024-07-26 00:32:51,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1588/ 1625], loss: 1.420, per_step_time: 1471ms, lr: 1.9153913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:51,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.43782 samples/s/p 0:40:45 } +2024-07-26 00:32:54,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1590/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 1.913215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:54,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% 
|████████████████████████████████████████████ | 5.43630 samples/s/p 0:40:42 } +2024-07-26 00:32:57,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1592/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 1.9110398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:57,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.43744 samples/s/p 0:40:39 } +2024-07-26 00:33:00,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1594/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 1.908868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:00,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.43990 samples/s/p 0:40:35 } +2024-07-26 00:33:03,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1596/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.9066994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:03,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.43462 samples/s/p 0:40:34 } +2024-07-26 00:33:06,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1598/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 1.904531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:06,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.42807 samples/s/p 0:40:34 } +2024-07-26 00:33:09,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1600/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.9023669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:09,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% 
|████████████████████████████████████████████ | 5.43180 samples/s/p 0:40:30 } +2024-07-26 00:33:12,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1602/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 1.9002052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:12,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43585 samples/s/p 0:40:25 } +2024-07-26 00:33:15,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1604/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.8980454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:15,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43503 samples/s/p 0:40:22 } +2024-07-26 00:33:18,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1606/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 1.8958883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:18,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43388 samples/s/p 0:40:20 } +2024-07-26 00:33:21,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1608/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 1.8937328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:21,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43628 samples/s/p 0:40:16 } +2024-07-26 00:33:24,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1610/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 1.8915816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:24,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% 
|████████████████████████████████████████████ | 5.43275 samples/s/p 0:40:14 } +2024-07-26 00:33:27,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1612/ 1625], loss: 1.299, per_step_time: 1472ms, lr: 1.8894331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:27,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43318 samples/s/p 0:40:11 } +2024-07-26 00:33:30,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1614/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 1.8872854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:30,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43437 samples/s/p 0:40:08 } +2024-07-26 00:33:33,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1616/ 1625], loss: 1.144, per_step_time: 1473ms, lr: 1.8851403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:33,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.42761 samples/s/p 0:40:08 } +2024-07-26 00:33:36,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1618/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 1.8829994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:36,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.43059 samples/s/p 0:40:04 } +2024-07-26 00:33:39,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1620/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.8808604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:39,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% 
|████████████████████████████████████████████ | 5.43808 samples/s/p 0:39:57 } +2024-07-26 00:33:41,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1622/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 1.8787222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:41,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.43610 samples/s/p 0:39:55 } +2024-07-26 00:33:44,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1624/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 1.8765884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:44,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.43769 samples/s/p 0:39:52 } +2024-07-26 00:33:47,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 1.874457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:47,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.43654 samples/s/p 0:39:49 } +2024-07-26 00:33:50,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 3/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 1.8723283e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:50,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.43427 samples/s/p 0:39:47 } +2024-07-26 00:33:53,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 5/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 1.8702005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:53,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% 
|█████████████████████████████████████████████ | 5.43274 samples/s/p 0:39:45 } +2024-07-26 00:33:56,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 7/ 1625], loss: 1.157, per_step_time: 1474ms, lr: 1.8680762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:56,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.42387 samples/s/p 0:39:46 } +2024-07-26 00:33:59,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 9/ 1625], loss: 1.079, per_step_time: 1472ms, lr: 1.8659543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:59,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.43333 samples/s/p 0:39:39 } +2024-07-26 00:34:02,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 11/ 1625], loss: 1.025, per_step_time: 1470ms, lr: 1.8638343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:02,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.43946 samples/s/p 0:39:33 } +2024-07-26 00:34:05,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 13/ 1625], loss: 1.202, per_step_time: 1474ms, lr: 1.8617186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:05,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.42582 samples/s/p 0:39:36 } +2024-07-26 00:34:08,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 15/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.8596038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:08,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% 
|█████████████████████████████████████████████ | 5.44049 samples/s/p 0:39:27 } +2024-07-26 00:34:11,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 17/ 1625], loss: 0.964, per_step_time: 1470ms, lr: 1.8574915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:11,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.43943 samples/s/p 0:39:24 } +2024-07-26 00:34:14,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 19/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 1.8553835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:14,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.43355 samples/s/p 0:39:24 } +2024-07-26 00:34:17,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 21/ 1625], loss: 1.285, per_step_time: 1469ms, lr: 1.8532755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:17,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.44293 samples/s/p 0:39:17 } +2024-07-26 00:34:20,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 23/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 1.8511719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:20,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.43407 samples/s/p 0:39:18 } +2024-07-26 00:34:23,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 25/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.84907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:23,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% 
|█████████████████████████████████████████████ | 5.43296 samples/s/p 0:39:15 } +2024-07-26 00:34:26,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 27/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 1.8469707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:26,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43895 samples/s/p 0:39:10 } +2024-07-26 00:34:29,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 29/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 1.8448749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:29,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43110 samples/s/p 0:39:10 } +2024-07-26 00:34:32,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 31/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 1.8427816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:32,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43583 samples/s/p 0:39:05 } +2024-07-26 00:34:35,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 33/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 1.8406874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:35,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43635 samples/s/p 0:39:02 } +2024-07-26 00:34:38,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 35/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 1.8385986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:38,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% 
|█████████████████████████████████████████████ | 5.43674 samples/s/p 0:38:59 } +2024-07-26 00:34:40,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 37/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 1.836514e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:40,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43432 samples/s/p 0:38:57 } +2024-07-26 00:34:43,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 39/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 1.8344285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:43,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43905 samples/s/p 0:38:52 } +2024-07-26 00:34:46,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 41/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 1.8323465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:46,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43479 samples/s/p 0:38:51 } +2024-07-26 00:34:49,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 43/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 1.8302687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:49,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43510 samples/s/p 0:38:48 } +2024-07-26 00:34:52,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 45/ 1625], loss: 1.299, per_step_time: 1471ms, lr: 1.8281928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:52,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% 
|█████████████████████████████████████████████ | 5.43711 samples/s/p 0:38:44 } +2024-07-26 00:34:55,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 47/ 1625], loss: 1.103, per_step_time: 1473ms, lr: 1.8261185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:55,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43031 samples/s/p 0:38:44 } +2024-07-26 00:34:58,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 49/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 1.8240469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:58,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43304 samples/s/p 0:38:40 } +2024-07-26 00:35:01,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 51/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 1.8219787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:01,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43413 samples/s/p 0:38:37 } +2024-07-26 00:35:04,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 53/ 1625], loss: 1.175, per_step_time: 1474ms, lr: 1.8199123e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:04,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.42701 samples/s/p 0:38:37 } +2024-07-26 00:35:07,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 55/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 1.8178475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:07,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% 
|█████████████████████████████████████████████ | 5.43706 samples/s/p 0:38:30 } +2024-07-26 00:35:10,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 57/ 1625], loss: 1.223, per_step_time: 1470ms, lr: 1.8157862e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:10,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.44190 samples/s/p 0:38:25 } +2024-07-26 00:35:13,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 59/ 1625], loss: 0.952, per_step_time: 1471ms, lr: 1.8137284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:13,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.43656 samples/s/p 0:38:24 } +2024-07-26 00:35:16,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 61/ 1625], loss: 1.110, per_step_time: 1473ms, lr: 1.8116714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:16,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.43036 samples/s/p 0:38:24 } +2024-07-26 00:35:19,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 63/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 1.8096171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:19,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.43412 samples/s/p 0:38:19 } +2024-07-26 00:35:22,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 65/ 1625], loss: 0.928, per_step_time: 1472ms, lr: 1.8075671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:22,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% 
|█████████████████████████████████████████████ | 5.43265 samples/s/p 0:38:17 } +2024-07-26 00:35:25,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 67/ 1625], loss: 1.096, per_step_time: 1473ms, lr: 1.8055188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:25,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.42759 samples/s/p 0:38:16 } +2024-07-26 00:35:28,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 69/ 1625], loss: 1.183, per_step_time: 1474ms, lr: 1.8034722e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:28,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.42504 samples/s/p 0:38:14 } +2024-07-26 00:35:31,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 71/ 1625], loss: 1.257, per_step_time: 1473ms, lr: 1.8014273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:31,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.42857 samples/s/p 0:38:10 } +2024-07-26 00:35:34,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 73/ 1625], loss: 1.043, per_step_time: 1471ms, lr: 1.7993868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:34,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.43527 samples/s/p 0:38:04 } +2024-07-26 00:35:37,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 75/ 1625], loss: 0.976, per_step_time: 1474ms, lr: 1.7973497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:37,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% 
|█████████████████████████████████████████████ | 5.42415 samples/s/p 0:38:06 } +2024-07-26 00:35:40,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 77/ 1625], loss: 1.014, per_step_time: 1471ms, lr: 1.7953125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:40,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43707 samples/s/p 0:37:57 } +2024-07-26 00:35:42,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 79/ 1625], loss: 1.228, per_step_time: 1472ms, lr: 1.793279e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:42,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43395 samples/s/p 0:37:56 } +2024-07-26 00:35:45,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 81/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 1.7912497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:45,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43421 samples/s/p 0:37:53 } +2024-07-26 00:35:48,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 83/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 1.7892187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:48,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43239 samples/s/p 0:37:50 } +2024-07-26 00:35:51,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 85/ 1625], loss: 1.025, per_step_time: 1472ms, lr: 1.7871937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:51,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% 
|█████████████████████████████████████████████ | 5.43148 samples/s/p 0:37:48 } +2024-07-26 00:35:54,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 87/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 1.7851713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:54,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43156 samples/s/p 0:37:45 } +2024-07-26 00:35:57,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 89/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 1.783149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:57,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.42808 samples/s/p 0:37:43 } +2024-07-26 00:36:00,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 91/ 1625], loss: 0.966, per_step_time: 1469ms, lr: 1.7811317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:00,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.44319 samples/s/p 0:37:34 } +2024-07-26 00:36:03,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 93/ 1625], loss: 1.217, per_step_time: 1478ms, lr: 1.7791153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:03,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.41226 samples/s/p 0:37:44 } +2024-07-26 00:36:06,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 95/ 1625], loss: 1.083, per_step_time: 1473ms, lr: 1.7771025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:06,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% 
|█████████████████████████████████████████████ | 5.42891 samples/s/p 0:37:34 } +2024-07-26 00:36:09,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 97/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 1.7750922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:09,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.43926 samples/s/p 0:37:27 } +2024-07-26 00:36:12,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 99/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 1.7730837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:12,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.43787 samples/s/p 0:37:24 } +2024-07-26 00:36:15,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 101/ 1625], loss: 0.986, per_step_time: 1471ms, lr: 1.7710777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:15,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.43720 samples/s/p 0:37:22 } +2024-07-26 00:36:18,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 103/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 1.7690743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:18,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.43917 samples/s/p 0:37:18 } +2024-07-26 00:36:21,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 105/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 1.7670752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:21,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% 
|█████████████████████████████████████████████ | 5.43439 samples/s/p 0:37:17 } +2024-07-26 00:36:24,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 107/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 1.7650761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:24,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43562 samples/s/p 0:37:14 } +2024-07-26 00:36:27,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 109/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.7630806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:27,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43552 samples/s/p 0:37:11 } +2024-07-26 00:36:30,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 111/ 1625], loss: 1.137, per_step_time: 1473ms, lr: 1.7610876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:30,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43035 samples/s/p 0:37:10 } +2024-07-26 00:36:33,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 113/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.759098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:33,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43193 samples/s/p 0:37:06 } +2024-07-26 00:36:36,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 115/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 1.7571094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:36,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% 
|█████████████████████████████████████████████ | 5.43281 samples/s/p 0:37:03 } +2024-07-26 00:36:39,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 117/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 1.7551233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:39,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43763 samples/s/p 0:36:58 } +2024-07-26 00:36:42,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 119/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 1.7531424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:42,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43147 samples/s/p 0:36:58 } +2024-07-26 00:36:44,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 121/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 1.7511607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:44,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.44036 samples/s/p 0:36:51 } +2024-07-26 00:36:47,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 123/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.7491832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:47,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43596 samples/s/p 0:36:50 } +2024-07-26 00:36:50,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 125/ 1625], loss: 1.322, per_step_time: 1471ms, lr: 1.7472075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:50,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% 
|█████████████████████████████████████████████ | 5.43720 samples/s/p 0:36:47 } +2024-07-26 00:36:53,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 127/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 1.7452353e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:53,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43665 samples/s/p 0:36:44 } +2024-07-26 00:36:56,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 129/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 1.7432646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:56,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43866 samples/s/p 0:36:40 } +2024-07-26 00:36:59,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 131/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 1.7412976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:59,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43806 samples/s/p 0:36:37 } +2024-07-26 00:37:02,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 133/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 1.7393314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:02,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43739 samples/s/p 0:36:35 } +2024-07-26 00:37:05,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 135/ 1625], loss: 1.207, per_step_time: 1473ms, lr: 1.7373695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:05,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% 
|█████████████████████████████████████████████ | 5.43038 samples/s/p 0:36:35 } +2024-07-26 00:37:08,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 137/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.7354103e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:08,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43137 samples/s/p 0:36:31 } +2024-07-26 00:37:11,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 139/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 1.733451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:11,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43586 samples/s/p 0:36:26 } +2024-07-26 00:37:14,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 141/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 1.7314977e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:14,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43652 samples/s/p 0:36:23 } +2024-07-26 00:37:17,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 143/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.7295454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:17,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43158 samples/s/p 0:36:22 } +2024-07-26 00:37:20,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 145/ 1625], loss: 1.144, per_step_time: 1473ms, lr: 1.7275947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:20,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% 
|█████████████████████████████████████████████ | 5.43007 samples/s/p 0:36:20 } +2024-07-26 00:37:23,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 147/ 1625], loss: 0.965, per_step_time: 1474ms, lr: 1.7256475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:23,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.42502 samples/s/p 0:36:19 } +2024-07-26 00:37:26,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 149/ 1625], loss: 1.017, per_step_time: 1472ms, lr: 1.7237029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:26,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43120 samples/s/p 0:36:14 } +2024-07-26 00:37:29,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 151/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 1.7217609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:29,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.42922 samples/s/p 0:36:11 } +2024-07-26 00:37:32,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 153/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 1.7198215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:32,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43268 samples/s/p 0:36:07 } +2024-07-26 00:37:35,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 155/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 1.7178838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:35,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% 
|█████████████████████████████████████████████ | 5.43283 samples/s/p 0:36:04 } +2024-07-26 00:37:38,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 157/ 1625], loss: 1.014, per_step_time: 1470ms, lr: 1.7159505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:38,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43892 samples/s/p 0:35:59 } +2024-07-26 00:37:41,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 159/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.7140179e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:41,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43377 samples/s/p 0:35:58 } +2024-07-26 00:37:43,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 161/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 1.712088e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:43,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43800 samples/s/p 0:35:53 } +2024-07-26 00:37:46,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 163/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.7101625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:46,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43690 samples/s/p 0:35:51 } +2024-07-26 00:37:49,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 165/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 1.7082368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:49,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% 
|█████████████████████████████████████████████ | 5.43444 samples/s/p 0:35:49 } +2024-07-26 00:37:52,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 167/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 1.7063146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:52,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43616 samples/s/p 0:35:45 } +2024-07-26 00:37:55,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 169/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 1.7043969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:55,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43357 samples/s/p 0:35:43 } +2024-07-26 00:37:58,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 171/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 1.702479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:58,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.43433 samples/s/p 0:35:40 } +2024-07-26 00:38:01,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 173/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 1.7005664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:01,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.43776 samples/s/p 0:35:36 } +2024-07-26 00:38:04,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 175/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.6986538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:04,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% 
|█████████████████████████████████████████████ | 5.43349 samples/s/p 0:35:34 } +2024-07-26 00:38:07,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 177/ 1625], loss: 1.042, per_step_time: 1472ms, lr: 1.6967438e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:07,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.43321 samples/s/p 0:35:32 } +2024-07-26 00:38:10,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 179/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 1.6948381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:10,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.44022 samples/s/p 0:35:26 } +2024-07-26 00:38:13,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 181/ 1625], loss: 1.048, per_step_time: 1469ms, lr: 1.6929341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:13,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.44371 samples/s/p 0:35:22 } +2024-07-26 00:38:16,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 183/ 1625], loss: 1.265, per_step_time: 1470ms, lr: 1.691031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:16,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.43929 samples/s/p 0:35:20 } +2024-07-26 00:38:19,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 185/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 1.6891331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:19,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% 
|█████████████████████████████████████████████ | 5.43493 samples/s/p 0:35:19 } +2024-07-26 00:38:22,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 187/ 1625], loss: 1.160, per_step_time: 1475ms, lr: 1.6872377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:22,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.42318 samples/s/p 0:35:21 } +2024-07-26 00:38:25,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 189/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 1.6853432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:25,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43466 samples/s/p 0:35:13 } +2024-07-26 00:38:28,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 191/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.6834522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:28,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43193 samples/s/p 0:35:11 } +2024-07-26 00:38:31,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 193/ 1625], loss: 1.224, per_step_time: 1474ms, lr: 1.6815638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:31,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.42698 samples/s/p 0:35:10 } +2024-07-26 00:38:34,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 195/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 1.6796771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:34,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% 
|█████████████████████████████████████████████ | 5.43731 samples/s/p 0:35:03 } +2024-07-26 00:38:37,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 197/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 1.6777931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:37,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43415 samples/s/p 0:35:02 } +2024-07-26 00:38:40,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 199/ 1625], loss: 1.009, per_step_time: 1471ms, lr: 1.6759124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:40,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43553 samples/s/p 0:34:58 } +2024-07-26 00:38:43,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 201/ 1625], loss: 1.016, per_step_time: 1470ms, lr: 1.6740352e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:43,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.44155 samples/s/p 0:34:53 } +2024-07-26 00:38:45,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 203/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 1.6721572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:45,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43340 samples/s/p 0:34:53 } +2024-07-26 00:38:48,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 205/ 1625], loss: 1.088, per_step_time: 1472ms, lr: 1.6702834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:48,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% 
|█████████████████████████████████████████████ | 5.43247 samples/s/p 0:34:51 } +2024-07-26 00:38:51,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 207/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.6684139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:51,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.43538 samples/s/p 0:34:47 } +2024-07-26 00:38:54,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 209/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 1.6665446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:54,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.43644 samples/s/p 0:34:43 } +2024-07-26 00:38:57,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 211/ 1625], loss: 1.155, per_step_time: 1473ms, lr: 1.6646795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:57,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.42987 samples/s/p 0:34:43 } +2024-07-26 00:39:00,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 213/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 1.662817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:00,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.43013 samples/s/p 0:34:40 } +2024-07-26 00:39:03,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 215/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.6609554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:03,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% 
|█████████████████████████████████████████████ | 5.43534 samples/s/p 0:34:35 } +2024-07-26 00:39:06,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 217/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 1.659098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:06,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.43997 samples/s/p 0:34:30 } +2024-07-26 00:39:09,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 219/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 1.6572433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:09,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.43521 samples/s/p 0:34:29 } +2024-07-26 00:39:12,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 221/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 1.6553886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:12,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43247 samples/s/p 0:34:27 } +2024-07-26 00:39:15,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 223/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.6535391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:15,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43598 samples/s/p 0:34:23 } +2024-07-26 00:39:18,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 225/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 1.6516913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:18,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% 
|█████████████████████████████████████████████ | 5.44153 samples/s/p 0:34:18 } +2024-07-26 00:39:21,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 227/ 1625], loss: 1.090, per_step_time: 1473ms, lr: 1.6498452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:21,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43029 samples/s/p 0:34:19 } +2024-07-26 00:39:24,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 229/ 1625], loss: 1.369, per_step_time: 1471ms, lr: 1.6480035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:24,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43520 samples/s/p 0:34:14 } +2024-07-26 00:39:27,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 231/ 1625], loss: 1.009, per_step_time: 1472ms, lr: 1.6461626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:27,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43430 samples/s/p 0:34:12 } +2024-07-26 00:39:30,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 233/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.644326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:30,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43419 samples/s/p 0:34:09 } +2024-07-26 00:39:33,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 235/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 1.6424902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:33,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% 
|█████████████████████████████████████████████ | 5.43899 samples/s/p 0:34:04 } +2024-07-26 00:39:36,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 237/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.6406572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:36,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43372 samples/s/p 0:34:03 } +2024-07-26 00:39:39,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 239/ 1625], loss: 1.005, per_step_time: 1471ms, lr: 1.6388275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:39,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43843 samples/s/p 0:33:58 } +2024-07-26 00:39:42,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 241/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.6369995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:42,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43827 samples/s/p 0:33:55 } +2024-07-26 00:39:44,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 243/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 1.6351751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:44,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43550 samples/s/p 0:33:54 } +2024-07-26 00:39:47,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 245/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 1.6333532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:47,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% 
|█████████████████████████████████████████████ | 5.43802 samples/s/p 0:33:50 } +2024-07-26 00:39:50,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 247/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 1.6315331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:50,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43967 samples/s/p 0:33:46 } +2024-07-26 00:39:53,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 249/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 1.6297164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:53,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43231 samples/s/p 0:33:46 } +2024-07-26 00:39:56,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 251/ 1625], loss: 1.268, per_step_time: 1473ms, lr: 1.6279023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:56,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43063 samples/s/p 0:33:44 } +2024-07-26 00:39:59,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 253/ 1625], loss: 0.906, per_step_time: 1472ms, lr: 1.626089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:59,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43180 samples/s/p 0:33:40 } +2024-07-26 00:40:02,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 255/ 1625], loss: 1.126, per_step_time: 1473ms, lr: 1.6242784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:02,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% 
|█████████████████████████████████████████████ | 5.43047 samples/s/p 0:33:38 } +2024-07-26 00:40:05,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 257/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.6224739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:05,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43562 samples/s/p 0:33:33 } +2024-07-26 00:40:08,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 259/ 1625], loss: 1.244, per_step_time: 1470ms, lr: 1.6206675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:08,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43863 samples/s/p 0:33:29 } +2024-07-26 00:40:11,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 261/ 1625], loss: 1.264, per_step_time: 1471ms, lr: 1.618868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:11,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43693 samples/s/p 0:33:27 } +2024-07-26 00:40:14,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 263/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 1.6170687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:14,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43767 samples/s/p 0:33:23 } +2024-07-26 00:40:17,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 265/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.6152701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:17,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% 
|█████████████████████████████████████████████ | 5.43702 samples/s/p 0:33:21 } +2024-07-26 00:40:20,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 267/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 1.6134777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:20,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.44002 samples/s/p 0:33:17 } +2024-07-26 00:40:23,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 269/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 1.611686e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:23,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.43670 samples/s/p 0:33:15 } +2024-07-26 00:40:26,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 271/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.609897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:26,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.43272 samples/s/p 0:33:13 } +2024-07-26 00:40:29,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 273/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.6081106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:29,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.43462 samples/s/p 0:33:10 } +2024-07-26 00:40:32,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 275/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.6063259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:32,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% 
|█████████████████████████████████████████████ | 5.43783 samples/s/p 0:33:06 } +2024-07-26 00:40:35,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 277/ 1625], loss: 1.119, per_step_time: 1470ms, lr: 1.6045447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:35,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.44002 samples/s/p 0:33:02 } +2024-07-26 00:40:38,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 279/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 1.6027659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:38,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.44046 samples/s/p 0:32:59 } +2024-07-26 00:40:41,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 281/ 1625], loss: 1.128, per_step_time: 1469ms, lr: 1.6009908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:41,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.44229 samples/s/p 0:32:55 } +2024-07-26 00:40:43,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 283/ 1625], loss: 1.322, per_step_time: 1471ms, lr: 1.5992164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:43,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.43660 samples/s/p 0:32:54 } +2024-07-26 00:40:46,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 285/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.5974456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:46,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% 
|█████████████████████████████████████████████ | 5.43827 samples/s/p 0:32:51 } +2024-07-26 00:40:49,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 287/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 1.5956773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:49,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43912 samples/s/p 0:32:47 } +2024-07-26 00:40:52,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 289/ 1625], loss: 1.068, per_step_time: 1473ms, lr: 1.5939098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:52,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43084 samples/s/p 0:32:48 } +2024-07-26 00:40:55,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 291/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.5921476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:55,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43394 samples/s/p 0:32:43 } +2024-07-26 00:40:58,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 293/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 1.590387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:58,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43833 samples/s/p 0:32:39 } +2024-07-26 00:41:01,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 295/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 1.5886292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:01,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% 
|█████████████████████████████████████████████ | 5.43919 samples/s/p 0:32:36 } +2024-07-26 00:41:04,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 297/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.5868729e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:04,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43400 samples/s/p 0:32:35 } +2024-07-26 00:41:07,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 299/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 1.5851193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:07,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.42969 samples/s/p 0:32:33 } +2024-07-26 00:41:10,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 301/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 1.58337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:10,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.43517 samples/s/p 0:32:28 } +2024-07-26 00:41:13,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 303/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 1.5816208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:13,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.43762 samples/s/p 0:32:24 } +2024-07-26 00:41:16,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 305/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.5798759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:16,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% 
|█████████████████████████████████████████████ | 5.44122 samples/s/p 0:32:20 } +2024-07-26 00:41:19,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 307/ 1625], loss: 1.111, per_step_time: 1471ms, lr: 1.5781335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:19,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.43555 samples/s/p 0:32:19 } +2024-07-26 00:41:22,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 309/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 1.5763919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:22,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.43113 samples/s/p 0:32:18 } +2024-07-26 00:41:25,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 311/ 1625], loss: 0.902, per_step_time: 1470ms, lr: 1.5746565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:25,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.44141 samples/s/p 0:32:11 } +2024-07-26 00:41:28,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 313/ 1625], loss: 1.126, per_step_time: 1470ms, lr: 1.5729202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:28,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.44214 samples/s/p 0:32:08 } +2024-07-26 00:41:31,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 315/ 1625], loss: 1.332, per_step_time: 1472ms, lr: 1.5711882e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:31,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% 
|█████████████████████████████████████████████ | 5.43445 samples/s/p 0:32:08 } +2024-07-26 00:41:34,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 317/ 1625], loss: 1.299, per_step_time: 1471ms, lr: 1.5694588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:34,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.43618 samples/s/p 0:32:04 } +2024-07-26 00:41:37,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 319/ 1625], loss: 0.963, per_step_time: 1471ms, lr: 1.5677294e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:37,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.43818 samples/s/p 0:32:01 } +2024-07-26 00:41:40,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 321/ 1625], loss: 0.991, per_step_time: 1472ms, lr: 1.5660053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:40,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.43443 samples/s/p 0:31:59 } +2024-07-26 00:41:42,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 323/ 1625], loss: 1.289, per_step_time: 1472ms, lr: 1.5642827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:42,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.43301 samples/s/p 0:31:57 } +2024-07-26 00:41:45,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 325/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 1.5625645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:45,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% 
|██████████████████████████████████████████████ | 5.43936 samples/s/p 0:31:51 } +2024-07-26 00:41:48,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 327/ 1625], loss: 1.026, per_step_time: 1473ms, lr: 1.5608464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:48,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.43104 samples/s/p 0:31:51 } +2024-07-26 00:41:51,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 329/ 1625], loss: 0.977, per_step_time: 1471ms, lr: 1.5591326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:51,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.43539 samples/s/p 0:31:47 } +2024-07-26 00:41:54,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 331/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 1.5574204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:54,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.43792 samples/s/p 0:31:43 } +2024-07-26 00:41:57,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 333/ 1625], loss: 0.999, per_step_time: 1471ms, lr: 1.55571e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:57,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.43779 samples/s/p 0:31:40 } +2024-07-26 00:42:00,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 335/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.554004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:00,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% 
|██████████████████████████████████████████████ | 5.43409 samples/s/p 0:31:39 } +2024-07-26 00:42:03,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 337/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.5523005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:03,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.43682 samples/s/p 0:31:35 } +2024-07-26 00:42:06,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 339/ 1625], loss: 0.954, per_step_time: 1473ms, lr: 1.5505988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:06,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.42788 samples/s/p 0:31:35 } +2024-07-26 00:42:09,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 341/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 1.5488988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:09,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.43833 samples/s/p 0:31:28 } +2024-07-26 00:42:12,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 343/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 1.547204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:12,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.43926 samples/s/p 0:31:25 } +2024-07-26 00:42:15,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 345/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 1.54551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:15,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% 
|██████████████████████████████████████████████ | 5.43228 samples/s/p 0:31:25 } +2024-07-26 00:42:18,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 347/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 1.5438169e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:18,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.43465 samples/s/p 0:31:21 } +2024-07-26 00:42:21,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 349/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.542129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:21,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.43210 samples/s/p 0:31:19 } +2024-07-26 00:42:24,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 351/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.5404419e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:24,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43376 samples/s/p 0:31:15 } +2024-07-26 00:42:27,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 353/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 1.5387584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:27,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43522 samples/s/p 0:31:12 } +2024-07-26 00:42:30,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 355/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 1.5370773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:30,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% 
|██████████████████████████████████████████████ | 5.43017 samples/s/p 0:31:11 } +2024-07-26 00:42:33,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 357/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 1.535399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:33,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.44173 samples/s/p 0:31:04 } +2024-07-26 00:42:36,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 359/ 1625], loss: 1.160, per_step_time: 1470ms, lr: 1.5337239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:36,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43915 samples/s/p 0:31:02 } +2024-07-26 00:42:39,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 361/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 1.5320508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:39,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43511 samples/s/p 0:31:00 } +2024-07-26 00:42:42,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 363/ 1625], loss: 1.280, per_step_time: 1471ms, lr: 1.5303801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:42,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43844 samples/s/p 0:30:56 } +2024-07-26 00:42:44,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 365/ 1625], loss: 1.150, per_step_time: 1474ms, lr: 1.5287121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:44,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% 
|██████████████████████████████████████████████ | 5.42649 samples/s/p 0:30:57 } +2024-07-26 00:42:47,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 367/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.5270457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:47,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43391 samples/s/p 0:30:52 } +2024-07-26 00:42:50,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 369/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 1.5253838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:50,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43601 samples/s/p 0:30:48 } +2024-07-26 00:42:53,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 371/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 1.5237226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:53,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43584 samples/s/p 0:30:45 } +2024-07-26 00:42:56,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 373/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.5220651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:56,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43392 samples/s/p 0:30:43 } +2024-07-26 00:42:59,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 375/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.5204091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:59,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% 
|██████████████████████████████████████████████ | 5.43424 samples/s/p 0:30:40 } +2024-07-26 00:43:02,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 377/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.5187566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:02,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43151 samples/s/p 0:30:38 } +2024-07-26 00:43:05,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 379/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 1.5171067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:05,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43775 samples/s/p 0:30:33 } +2024-07-26 00:43:08,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 381/ 1625], loss: 1.298, per_step_time: 1470ms, lr: 1.5154585e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:08,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.44076 samples/s/p 0:30:29 } +2024-07-26 00:43:11,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 383/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 1.5138147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:11,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.42981 samples/s/p 0:30:29 } +2024-07-26 00:43:14,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 385/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 1.5121725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:14,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% 
|██████████████████████████████████████████████ | 5.44106 samples/s/p 0:30:23 } +2024-07-26 00:43:17,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 387/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.5105331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:17,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.43272 samples/s/p 0:30:23 } +2024-07-26 00:43:20,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 389/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.5088945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:20,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.43252 samples/s/p 0:30:20 } +2024-07-26 00:43:23,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 391/ 1625], loss: 0.913, per_step_time: 1471ms, lr: 1.5072601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:23,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.43552 samples/s/p 0:30:16 } +2024-07-26 00:43:26,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 393/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 1.5056283e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:26,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.43754 samples/s/p 0:30:12 } +2024-07-26 00:43:29,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 395/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 1.5039984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:29,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% 
|██████████████████████████████████████████████ | 5.43785 samples/s/p 0:30:09 } +2024-07-26 00:43:32,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 397/ 1625], loss: 1.083, per_step_time: 1474ms, lr: 1.5023718e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:32,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.42401 samples/s/p 0:30:11 } +2024-07-26 00:43:35,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 399/ 1625], loss: 1.103, per_step_time: 1470ms, lr: 1.5007479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:35,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43959 samples/s/p 0:30:03 } +2024-07-26 00:43:38,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 401/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.4991265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:38,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43544 samples/s/p 0:30:01 } +2024-07-26 00:43:41,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 403/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 1.4975077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:41,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43647 samples/s/p 0:29:58 } +2024-07-26 00:43:43,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 405/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 1.4958907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:43,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% 
|██████████████████████████████████████████████ | 5.43601 samples/s/p 0:29:55 } +2024-07-26 00:43:46,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 407/ 1625], loss: 1.219, per_step_time: 1470ms, lr: 1.4942771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:46,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43849 samples/s/p 0:29:51 } +2024-07-26 00:43:49,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 409/ 1625], loss: 1.046, per_step_time: 1470ms, lr: 1.4926661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:49,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43889 samples/s/p 0:29:48 } +2024-07-26 00:43:52,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 411/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 1.4910568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:52,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43766 samples/s/p 0:29:46 } +2024-07-26 00:43:55,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 413/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 1.489451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:55,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43859 samples/s/p 0:29:42 } +2024-07-26 00:43:58,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 415/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 1.4878469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:58,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% 
|██████████████████████████████████████████████ | 5.43395 samples/s/p 0:29:41 } +2024-07-26 00:44:01,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 417/ 1625], loss: 1.188, per_step_time: 1470ms, lr: 1.4862454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:01,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.44077 samples/s/p 0:29:36 } +2024-07-26 00:44:04,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 419/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 1.4846482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:04,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43667 samples/s/p 0:29:34 } +2024-07-26 00:44:07,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 421/ 1625], loss: 1.137, per_step_time: 1470ms, lr: 1.4830528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:07,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43861 samples/s/p 0:29:31 } +2024-07-26 00:44:10,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 423/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.4814591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:10,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43521 samples/s/p 0:29:29 } +2024-07-26 00:44:13,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 425/ 1625], loss: 1.126, per_step_time: 1469ms, lr: 1.4798671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:13,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% 
|██████████████████████████████████████████████ | 5.44468 samples/s/p 0:29:23 } +2024-07-26 00:44:16,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 427/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 1.4782795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:16,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43591 samples/s/p 0:29:23 } +2024-07-26 00:44:19,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 429/ 1625], loss: 1.321, per_step_time: 1471ms, lr: 1.4766936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:19,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43539 samples/s/p 0:29:20 } +2024-07-26 00:44:22,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 431/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 1.475112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:22,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43397 samples/s/p 0:29:17 } +2024-07-26 00:44:25,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 433/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 1.4735303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:25,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43107 samples/s/p 0:29:15 } +2024-07-26 00:44:28,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 435/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 1.471953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:28,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% 
|██████████████████████████████████████████████ | 5.43627 samples/s/p 0:29:11 } +2024-07-26 00:44:31,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 437/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 1.4703784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:31,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43038 samples/s/p 0:29:10 } +2024-07-26 00:44:34,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 439/ 1625], loss: 1.077, per_step_time: 1473ms, lr: 1.4688054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:34,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.42958 samples/s/p 0:29:07 } +2024-07-26 00:44:37,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 441/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 1.4672358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:37,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43635 samples/s/p 0:29:02 } +2024-07-26 00:44:40,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 443/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.4656689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:40,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43130 samples/s/p 0:29:01 } +2024-07-26 00:44:42,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 445/ 1625], loss: 1.142, per_step_time: 1473ms, lr: 1.4641038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:42,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% 
|██████████████████████████████████████████████ | 5.42990 samples/s/p 0:28:58 } +2024-07-26 00:44:45,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 447/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 1.4625411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:45,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43693 samples/s/p 0:28:53 } +2024-07-26 00:44:48,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 449/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.4609811e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:48,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43757 samples/s/p 0:28:50 } +2024-07-26 00:44:51,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 451/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 1.4594247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:51,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43404 samples/s/p 0:28:48 } +2024-07-26 00:44:54,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 453/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 1.4578698e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:54,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43210 samples/s/p 0:28:46 } +2024-07-26 00:44:57,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 455/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 1.4563193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:57,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% 
|██████████████████████████████████████████████ | 5.43269 samples/s/p 0:28:42 } +2024-07-26 00:45:00,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 457/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.4547705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:00,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43556 samples/s/p 0:28:39 } +2024-07-26 00:45:03,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 459/ 1625], loss: 1.132, per_step_time: 1474ms, lr: 1.4532227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:03,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.42554 samples/s/p 0:28:39 } +2024-07-26 00:45:06,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 461/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 1.451679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:06,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43784 samples/s/p 0:28:32 } +2024-07-26 00:45:09,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 463/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 1.4501372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:09,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43892 samples/s/p 0:28:29 } +2024-07-26 00:45:12,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 465/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 1.4485988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:12,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% 
|██████████████████████████████████████████████ | 5.43849 samples/s/p 0:28:26 } +2024-07-26 00:45:15,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 467/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 1.447063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:15,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.43429 samples/s/p 0:28:24 } +2024-07-26 00:45:18,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 469/ 1625], loss: 0.997, per_step_time: 1469ms, lr: 1.4455297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:18,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.44257 samples/s/p 0:28:19 } +2024-07-26 00:45:21,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 471/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.4439984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:21,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.43164 samples/s/p 0:28:19 } +2024-07-26 00:45:24,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 473/ 1625], loss: 1.298, per_step_time: 1469ms, lr: 1.4424686e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:24,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.44419 samples/s/p 0:28:12 } +2024-07-26 00:45:27,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 475/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 1.4409432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:27,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% 
|██████████████████████████████████████████████ | 5.43260 samples/s/p 0:28:13 } +2024-07-26 00:45:30,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 477/ 1625], loss: 1.009, per_step_time: 1472ms, lr: 1.4394203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:30,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.43467 samples/s/p 0:28:09 } +2024-07-26 00:45:33,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 479/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 1.4378983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:33,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.44145 samples/s/p 0:28:04 } +2024-07-26 00:45:36,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 481/ 1625], loss: 1.021, per_step_time: 1472ms, lr: 1.4363816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:36,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.43442 samples/s/p 0:28:04 } +2024-07-26 00:45:39,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 483/ 1625], loss: 1.265, per_step_time: 1470ms, lr: 1.4348656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:39,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.43869 samples/s/p 0:27:59 } +2024-07-26 00:45:42,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 485/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 1.433354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:42,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% 
|██████████████████████████████████████████████ | 5.42949 samples/s/p 0:27:59 } +2024-07-26 00:45:44,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 487/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 1.4318424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:44,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.44027 samples/s/p 0:27:53 } +2024-07-26 00:45:47,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 489/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 1.4303342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:47,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.43776 samples/s/p 0:27:51 } +2024-07-26 00:45:50,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 491/ 1625], loss: 1.108, per_step_time: 1477ms, lr: 1.4288304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:50,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.41370 samples/s/p 0:27:55 } +2024-07-26 00:45:53,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 493/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 1.4273274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:53,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.43267 samples/s/p 0:27:46 } +2024-07-26 00:45:56,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 495/ 1625], loss: 1.028, per_step_time: 1470ms, lr: 1.4258262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:56,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% 
|██████████████████████████████████████████████ | 5.44186 samples/s/p 0:27:41 } +2024-07-26 00:45:59,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 497/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 1.4243302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:59,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43785 samples/s/p 0:27:39 } +2024-07-26 00:46:02,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 499/ 1625], loss: 1.288, per_step_time: 1471ms, lr: 1.4228359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:02,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43556 samples/s/p 0:27:37 } +2024-07-26 00:46:05,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 501/ 1625], loss: 1.102, per_step_time: 1475ms, lr: 1.4213441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:05,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.42076 samples/s/p 0:27:38 } +2024-07-26 00:46:08,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 503/ 1625], loss: 1.304, per_step_time: 1471ms, lr: 1.4198541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:08,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43775 samples/s/p 0:27:30 } +2024-07-26 00:46:11,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 505/ 1625], loss: 0.921, per_step_time: 1471ms, lr: 1.4183668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:11,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% 
|██████████████████████████████████████████████ | 5.43833 samples/s/p 0:27:27 } +2024-07-26 00:46:14,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 507/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.4168819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:14,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43404 samples/s/p 0:27:25 } +2024-07-26 00:46:17,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 509/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 1.4154006e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:17,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43771 samples/s/p 0:27:21 } +2024-07-26 00:46:20,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 511/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.4139218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:20,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43664 samples/s/p 0:27:19 } +2024-07-26 00:46:23,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 513/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 1.4124456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:23,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.43338 samples/s/p 0:27:17 } +2024-07-26 00:46:26,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 515/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 1.4109712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:26,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% 
|██████████████████████████████████████████████ | 5.43717 samples/s/p 0:27:13 } +2024-07-26 00:46:29,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 517/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.4094985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:29,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.43238 samples/s/p 0:27:11 } +2024-07-26 00:46:32,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 519/ 1625], loss: 1.180, per_step_time: 1474ms, lr: 1.4080318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:32,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.42684 samples/s/p 0:27:10 } +2024-07-26 00:46:35,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 521/ 1625], loss: 1.078, per_step_time: 1473ms, lr: 1.4065643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:35,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.43035 samples/s/p 0:27:06 } +2024-07-26 00:46:38,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 523/ 1625], loss: 1.083, per_step_time: 1474ms, lr: 1.405102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:38,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.42650 samples/s/p 0:27:04 } +2024-07-26 00:46:41,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 525/ 1625], loss: 1.080, per_step_time: 1472ms, lr: 1.4036414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:41,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% 
|██████████████████████████████████████████████ | 5.43417 samples/s/p 0:26:59 } +2024-07-26 00:46:43,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 527/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 1.4021816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:43,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.43840 samples/s/p 0:26:55 } +2024-07-26 00:46:46,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 529/ 1625], loss: 1.156, per_step_time: 1469ms, lr: 1.4007279e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:46,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.44260 samples/s/p 0:26:50 } +2024-07-26 00:46:49,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 531/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.3992742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:49,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43717 samples/s/p 0:26:49 } +2024-07-26 00:46:52,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 533/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 1.3978214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:52,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43307 samples/s/p 0:26:47 } +2024-07-26 00:46:55,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 535/ 1625], loss: 1.363, per_step_time: 1471ms, lr: 1.3963754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:55,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% 
|██████████████████████████████████████████████ | 5.43779 samples/s/p 0:26:43 } +2024-07-26 00:46:58,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 537/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 1.3949305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:58,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43798 samples/s/p 0:26:40 } +2024-07-26 00:47:01,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 539/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 1.3934862e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:01,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43103 samples/s/p 0:26:39 } +2024-07-26 00:47:04,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 541/ 1625], loss: 1.221, per_step_time: 1475ms, lr: 1.3920463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:04,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.42025 samples/s/p 0:26:39 } +2024-07-26 00:47:07,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 543/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 1.3906099e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:07,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43847 samples/s/p 0:26:31 } +2024-07-26 00:47:10,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 545/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 1.3891744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:10,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% 
|██████████████████████████████████████████████ | 5.43466 samples/s/p 0:26:29 } +2024-07-26 00:47:13,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 547/ 1625], loss: 0.980, per_step_time: 1469ms, lr: 1.3877423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:13,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.44288 samples/s/p 0:26:24 } +2024-07-26 00:47:16,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 549/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.3863128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:16,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43654 samples/s/p 0:26:23 } +2024-07-26 00:47:19,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 551/ 1625], loss: 1.289, per_step_time: 1470ms, lr: 1.3848859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:19,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43858 samples/s/p 0:26:19 } +2024-07-26 00:47:22,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 553/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.3834616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:22,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43742 samples/s/p 0:26:17 } +2024-07-26 00:47:25,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 555/ 1625], loss: 1.063, per_step_time: 1472ms, lr: 1.3820398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:25,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% 
|██████████████████████████████████████████████ | 5.43315 samples/s/p 0:26:15 } +2024-07-26 00:47:28,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 557/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.3806199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:28,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43704 samples/s/p 0:26:11 } +2024-07-26 00:47:31,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 559/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 1.3792041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:31,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43342 samples/s/p 0:26:09 } +2024-07-26 00:47:34,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 561/ 1625], loss: 1.045, per_step_time: 1469ms, lr: 1.3777885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:34,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.44503 samples/s/p 0:26:03 } +2024-07-26 00:47:37,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 563/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.3763797e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:37,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.43434 samples/s/p 0:26:03 } +2024-07-26 00:47:40,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 565/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.3749693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:40,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% 
|██████████████████████████████████████████████ | 5.43483 samples/s/p 0:26:00 } +2024-07-26 00:47:43,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 567/ 1625], loss: 1.047, per_step_time: 1472ms, lr: 1.3735623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:43,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.43213 samples/s/p 0:25:58 } +2024-07-26 00:47:45,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 569/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 1.3721605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:45,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.43629 samples/s/p 0:25:54 } +2024-07-26 00:47:48,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 571/ 1625], loss: 1.058, per_step_time: 1471ms, lr: 1.3707577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:48,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.43771 samples/s/p 0:25:50 } +2024-07-26 00:47:51,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 573/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 1.3693602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:51,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.44086 samples/s/p 0:25:46 } +2024-07-26 00:47:54,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 575/ 1625], loss: 1.280, per_step_time: 1473ms, lr: 1.3679644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:54,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% 
|██████████████████████████████████████████████ | 5.42957 samples/s/p 0:25:47 } +2024-07-26 00:47:57,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 577/ 1625], loss: 0.987, per_step_time: 1472ms, lr: 1.3665704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:57,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43420 samples/s/p 0:25:42 } +2024-07-26 00:48:00,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 579/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 1.3651814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:00,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.44060 samples/s/p 0:25:38 } +2024-07-26 00:48:03,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 581/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 1.3637925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:03,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43458 samples/s/p 0:25:36 } +2024-07-26 00:48:06,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 583/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.362408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:06,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43744 samples/s/p 0:25:33 } +2024-07-26 00:48:09,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 585/ 1625], loss: 0.924, per_step_time: 1469ms, lr: 1.3610252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:09,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% 
|██████████████████████████████████████████████ | 5.44321 samples/s/p 0:25:28 } +2024-07-26 00:48:12,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 587/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 1.3596441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:12,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43907 samples/s/p 0:25:26 } +2024-07-26 00:48:15,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 589/ 1625], loss: 1.097, per_step_time: 1473ms, lr: 1.3582674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:15,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.42842 samples/s/p 0:25:26 } +2024-07-26 00:48:18,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 591/ 1625], loss: 1.248, per_step_time: 1474ms, lr: 1.3568914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:18,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.42470 samples/s/p 0:25:24 } +2024-07-26 00:48:21,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 593/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.355519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:21,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43735 samples/s/p 0:25:18 } +2024-07-26 00:48:24,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 595/ 1625], loss: 1.040, per_step_time: 1473ms, lr: 1.35415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:24,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% 
|██████████████████████████████████████████████ | 5.42906 samples/s/p 0:25:17 } +2024-07-26 00:48:27,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 597/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 1.3527826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:27,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.43175 samples/s/p 0:25:14 } +2024-07-26 00:48:30,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 599/ 1625], loss: 1.216, per_step_time: 1474ms, lr: 1.3514189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:30,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.42705 samples/s/p 0:25:12 } +2024-07-26 00:48:33,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 601/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 1.3500568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:33,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.43568 samples/s/p 0:25:07 } +2024-07-26 00:48:36,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 603/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 1.3486964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:36,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.43503 samples/s/p 0:25:04 } +2024-07-26 00:48:39,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 605/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.3473405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:39,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% 
|██████████████████████████████████████████████ | 5.43477 samples/s/p 0:25:01 } +2024-07-26 00:48:42,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 607/ 1625], loss: 1.273, per_step_time: 1470ms, lr: 1.3459869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:42,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.44085 samples/s/p 0:24:56 } +2024-07-26 00:48:44,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 609/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 1.3446352e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:44,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.43635 samples/s/p 0:24:55 } +2024-07-26 00:48:47,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 611/ 1625], loss: 0.983, per_step_time: 1473ms, lr: 1.343287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:47,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43082 samples/s/p 0:24:53 } +2024-07-26 00:48:50,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 613/ 1625], loss: 1.014, per_step_time: 1470ms, lr: 1.3419404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:50,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.44206 samples/s/p 0:24:47 } +2024-07-26 00:48:53,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 615/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 1.3405966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:53,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% 
|██████████████████████████████████████████████ | 5.43798 samples/s/p 0:24:45 } +2024-07-26 00:48:56,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 617/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 1.3392552e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:56,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43768 samples/s/p 0:24:42 } +2024-07-26 00:48:59,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 619/ 1625], loss: 1.299, per_step_time: 1472ms, lr: 1.3379181e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:59,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43277 samples/s/p 0:24:41 } +2024-07-26 00:49:02,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 621/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 1.3365811e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:02,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43307 samples/s/p 0:24:38 } +2024-07-26 00:49:05,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 623/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 1.3352493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:05,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43599 samples/s/p 0:24:34 } +2024-07-26 00:49:08,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 625/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 1.3339184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:08,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% 
|██████████████████████████████████████████████ | 5.43851 samples/s/p 0:24:30 } +2024-07-26 00:49:11,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 627/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.3325899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:11,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43592 samples/s/p 0:24:28 } +2024-07-26 00:49:14,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 629/ 1625], loss: 1.174, per_step_time: 1469ms, lr: 1.331265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:14,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.44281 samples/s/p 0:24:23 } +2024-07-26 00:49:17,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 631/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 1.3299427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:17,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43482 samples/s/p 0:24:23 } +2024-07-26 00:49:20,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 633/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 1.3286221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:20,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43726 samples/s/p 0:24:19 } +2024-07-26 00:49:23,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 635/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 1.3273041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:23,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% 
|██████████████████████████████████████████████ | 5.43578 samples/s/p 0:24:17 } +2024-07-26 00:49:26,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 637/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 1.3259904e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:26,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43891 samples/s/p 0:24:13 } +2024-07-26 00:49:29,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 639/ 1625], loss: 1.079, per_step_time: 1470ms, lr: 1.3246776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:29,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.44065 samples/s/p 0:24:09 } +2024-07-26 00:49:32,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 641/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 1.3233682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:32,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43300 samples/s/p 0:24:08 } +2024-07-26 00:49:35,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 643/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 1.3220614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:35,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.44147 samples/s/p 0:24:03 } +2024-07-26 00:49:38,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 645/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 1.3207564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:38,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% 
|██████████████████████████████████████████████ | 5.43559 samples/s/p 0:24:02 } +2024-07-26 00:49:41,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 647/ 1625], loss: 1.140, per_step_time: 1482ms, lr: 1.319454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:41,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.39574 samples/s/p 0:24:10 } +2024-07-26 00:49:43,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 649/ 1625], loss: 1.101, per_step_time: 1472ms, lr: 1.3181567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:43,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.43277 samples/s/p 0:23:57 } +2024-07-26 00:49:46,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 651/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 1.3168603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:46,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.44147 samples/s/p 0:23:51 } +2024-07-26 00:49:49,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 653/ 1625], loss: 1.219, per_step_time: 1470ms, lr: 1.3155657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:49,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.43891 samples/s/p 0:23:49 } +2024-07-26 00:49:52,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 655/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 1.3142752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:52,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% 
|███████████████████████████████████████████████ | 5.43429 samples/s/p 0:23:47 } +2024-07-26 00:49:55,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 657/ 1625], loss: 1.220, per_step_time: 1473ms, lr: 1.3129866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:55,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.42748 samples/s/p 0:23:46 } +2024-07-26 00:49:58,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 659/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.3116988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:58,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43209 samples/s/p 0:23:42 } +2024-07-26 00:50:01,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 661/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 1.3104171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:01,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.44001 samples/s/p 0:23:37 } +2024-07-26 00:50:04,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 663/ 1625], loss: 1.039, per_step_time: 1471ms, lr: 1.3091354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:04,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43830 samples/s/p 0:23:35 } +2024-07-26 00:50:07,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 665/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 1.3078563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:07,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% 
|███████████████████████████████████████████████ | 5.43388 samples/s/p 0:23:33 } +2024-07-26 00:50:10,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 667/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 1.3065833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:10,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43203 samples/s/p 0:23:30 } +2024-07-26 00:50:13,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 669/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.3053102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:13,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43676 samples/s/p 0:23:26 } +2024-07-26 00:50:16,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 671/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 1.3040398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:16,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43399 samples/s/p 0:23:24 } +2024-07-26 00:50:19,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 673/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 1.302771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:19,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43771 samples/s/p 0:23:20 } +2024-07-26 00:50:22,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 675/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 1.3015066e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:22,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% 
|███████████████████████████████████████████████ | 5.43225 samples/s/p 0:23:19 } +2024-07-26 00:50:25,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 677/ 1625], loss: 1.006, per_step_time: 1473ms, lr: 1.3002439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:25,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.42957 samples/s/p 0:23:16 } +2024-07-26 00:50:28,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 679/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.2989838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:28,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.43189 samples/s/p 0:23:13 } +2024-07-26 00:50:31,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 681/ 1625], loss: 1.322, per_step_time: 1471ms, lr: 1.2977271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:31,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.43645 samples/s/p 0:23:09 } +2024-07-26 00:50:34,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 683/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 1.2964713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:34,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.43529 samples/s/p 0:23:06 } +2024-07-26 00:50:37,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 685/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 1.295219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:37,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% 
|███████████████████████████████████████████████ | 5.43713 samples/s/p 0:23:03 } +2024-07-26 00:50:40,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 687/ 1625], loss: 1.003, per_step_time: 1473ms, lr: 1.2939702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:40,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.42912 samples/s/p 0:23:02 } +2024-07-26 00:50:43,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 689/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 1.2927239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:43,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.43336 samples/s/p 0:22:58 } +2024-07-26 00:50:45,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 691/ 1625], loss: 1.037, per_step_time: 1471ms, lr: 1.2914802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:45,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43614 samples/s/p 0:22:54 } +2024-07-26 00:50:48,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 693/ 1625], loss: 0.969, per_step_time: 1471ms, lr: 1.2902383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:48,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43761 samples/s/p 0:22:51 } +2024-07-26 00:50:51,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 695/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 1.2889989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:51,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% 
|███████████████████████████████████████████████ | 5.44078 samples/s/p 0:22:47 } +2024-07-26 00:50:54,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 697/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.2877638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:54,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43837 samples/s/p 0:22:45 } +2024-07-26 00:50:57,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 699/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 1.2865305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:57,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43347 samples/s/p 0:22:43 } +2024-07-26 00:51:00,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 701/ 1625], loss: 1.247, per_step_time: 1470ms, lr: 1.2852998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:00,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.44105 samples/s/p 0:22:38 } +2024-07-26 00:51:03,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 703/ 1625], loss: 1.164, per_step_time: 1470ms, lr: 1.2840708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:03,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43942 samples/s/p 0:22:36 } +2024-07-26 00:51:06,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 705/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 1.2828461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:06,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% 
|███████████████████████████████████████████████ | 5.43707 samples/s/p 0:22:33 } +2024-07-26 00:51:09,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 707/ 1625], loss: 1.046, per_step_time: 1469ms, lr: 1.2816215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:09,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.44326 samples/s/p 0:22:29 } +2024-07-26 00:51:12,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 709/ 1625], loss: 1.102, per_step_time: 1473ms, lr: 1.2804003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:12,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.42929 samples/s/p 0:22:29 } +2024-07-26 00:51:15,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 711/ 1625], loss: 1.059, per_step_time: 1472ms, lr: 1.2791834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:15,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43447 samples/s/p 0:22:25 } +2024-07-26 00:51:18,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 713/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 1.2779674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:18,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43381 samples/s/p 0:22:22 } +2024-07-26 00:51:21,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 715/ 1625], loss: 1.180, per_step_time: 1470ms, lr: 1.2767548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:21,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% 
|███████████████████████████████████████████████ | 5.44114 samples/s/p 0:22:17 } +2024-07-26 00:51:24,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 717/ 1625], loss: 1.056, per_step_time: 1472ms, lr: 1.2755448e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:24,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43366 samples/s/p 0:22:16 } +2024-07-26 00:51:27,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 719/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 1.2743375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:27,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43320 samples/s/p 0:22:14 } +2024-07-26 00:51:30,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 721/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 1.2731327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:30,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43804 samples/s/p 0:22:09 } +2024-07-26 00:51:33,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 723/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 1.2719313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:33,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43266 samples/s/p 0:22:08 } +2024-07-26 00:51:36,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 725/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 1.2707309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:36,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% 
|███████████████████████████████████████████████ | 5.43966 samples/s/p 0:22:03 } +2024-07-26 00:51:39,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 727/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 1.2695356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:39,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43941 samples/s/p 0:22:00 } +2024-07-26 00:51:42,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 729/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 1.2683403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:42,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43705 samples/s/p 0:21:58 } +2024-07-26 00:51:44,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 731/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 1.2671485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:44,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43249 samples/s/p 0:21:56 } +2024-07-26 00:51:47,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 733/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 1.2659592e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:47,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43344 samples/s/p 0:21:53 } +2024-07-26 00:51:50,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 735/ 1625], loss: 1.027, per_step_time: 1471ms, lr: 1.2647735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:50,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% 
|███████████████████████████████████████████████ | 5.43507 samples/s/p 0:21:50 } +2024-07-26 00:51:53,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 737/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.2635894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:53,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43415 samples/s/p 0:21:47 } +2024-07-26 00:51:56,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 739/ 1625], loss: 1.150, per_step_time: 1472ms, lr: 1.2624089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:56,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43173 samples/s/p 0:21:44 } +2024-07-26 00:51:59,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 741/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 1.26123e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:59,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.43509 samples/s/p 0:21:41 } +2024-07-26 00:52:02,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 743/ 1625], loss: 1.180, per_step_time: 1474ms, lr: 1.2600555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:02,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.42627 samples/s/p 0:21:40 } +2024-07-26 00:52:05,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 745/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.258881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:05,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% 
|███████████████████████████████████████████████ | 5.43770 samples/s/p 0:21:34 } +2024-07-26 00:52:08,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 747/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 1.2577107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:08,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.43282 samples/s/p 0:21:32 } +2024-07-26 00:52:11,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 749/ 1625], loss: 1.090, per_step_time: 1480ms, lr: 1.2565431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:11,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.40518 samples/s/p 0:21:36 } +2024-07-26 00:52:14,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 751/ 1625], loss: 1.059, per_step_time: 1471ms, lr: 1.255378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:14,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.43790 samples/s/p 0:21:25 } +2024-07-26 00:52:17,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 753/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 1.2542147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:17,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.43735 samples/s/p 0:21:22 } +2024-07-26 00:52:20,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 755/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 1.2530548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:20,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% 
|███████████████████████████████████████████████ | 5.43725 samples/s/p 0:21:20 } +2024-07-26 00:52:23,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 757/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 1.2518976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:23,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.44096 samples/s/p 0:21:16 } +2024-07-26 00:52:26,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 759/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 1.250743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:26,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43379 samples/s/p 0:21:14 } +2024-07-26 00:52:29,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 761/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.2495917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:29,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43163 samples/s/p 0:21:12 } +2024-07-26 00:52:32,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 763/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 1.2484405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:32,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43339 samples/s/p 0:21:09 } +2024-07-26 00:52:35,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 765/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 1.2472946e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:35,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% 
|███████████████████████████████████████████████ | 5.43709 samples/s/p 0:21:05 } +2024-07-26 00:52:38,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 767/ 1625], loss: 1.031, per_step_time: 1470ms, lr: 1.2461494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:38,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.44117 samples/s/p 0:21:01 } +2024-07-26 00:52:41,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 769/ 1625], loss: 1.182, per_step_time: 1470ms, lr: 1.2450085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:41,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43877 samples/s/p 0:20:59 } +2024-07-26 00:52:44,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 771/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 1.2438694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:44,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43505 samples/s/p 0:20:57 } +2024-07-26 00:52:46,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 773/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 1.2427329e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:46,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43499 samples/s/p 0:20:54 } +2024-07-26 00:52:49,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 775/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.2415982e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:49,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% 
|███████████████████████████████████████████████ | 5.44134 samples/s/p 0:20:49 } +2024-07-26 00:52:49,908 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-26 00:53:25,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 777/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 1.2404677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:25,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43130 samples/s/p 0:20:49 } +2024-07-26 00:53:28,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 779/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 1.2393398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:28,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43483 samples/s/p 0:20:45 } +2024-07-26 00:53:31,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 781/ 1625], loss: 1.010, per_step_time: 1472ms, lr: 1.2382137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:31,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43243 samples/s/p 0:20:42 } +2024-07-26 00:53:34,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 783/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 1.2370901e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:34,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43584 samples/s/p 0:20:39 } +2024-07-26 00:53:37,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 785/ 1625], loss: 1.023, per_step_time: 1471ms, lr: 1.2359692e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:53:37,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43740 samples/s/p 0:20:35 } +2024-07-26 00:53:40,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 787/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.2348517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:40,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43486 samples/s/p 0:20:33 } +2024-07-26 00:53:43,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 789/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 1.2337359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:43,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43010 samples/s/p 0:20:31 } +2024-07-26 00:53:46,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 791/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.2326236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:46,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43484 samples/s/p 0:20:27 } +2024-07-26 00:53:49,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 793/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 1.2315139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:49,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43765 samples/s/p 0:20:24 } +2024-07-26 00:53:52,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 795/ 1625], loss: 1.404, per_step_time: 1470ms, lr: 1.2304059e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:53:52,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43915 samples/s/p 0:20:20 } +2024-07-26 00:53:55,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 797/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 1.2293013e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:55,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43984 samples/s/p 0:20:17 } +2024-07-26 00:53:58,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 799/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 1.2281994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:58,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43905 samples/s/p 0:20:14 } +2024-07-26 00:54:01,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 801/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 1.2271009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:01,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43630 samples/s/p 0:20:12 } +2024-07-26 00:54:04,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 803/ 1625], loss: 1.184, per_step_time: 1474ms, lr: 1.2260016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:04,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.42408 samples/s/p 0:20:12 } +2024-07-26 00:54:07,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 805/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 1.2249092e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:54:07,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.44160 samples/s/p 0:20:05 } +2024-07-26 00:54:10,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 807/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 1.2238168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:10,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43377 samples/s/p 0:20:04 } +2024-07-26 00:54:13,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 809/ 1625], loss: 1.378, per_step_time: 1470ms, lr: 1.2227285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:13,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.44044 samples/s/p 0:19:59 } +2024-07-26 00:54:16,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 811/ 1625], loss: 1.224, per_step_time: 1471ms, lr: 1.2216414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:16,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43490 samples/s/p 0:19:58 } +2024-07-26 00:54:19,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 813/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.2205584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:19,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43635 samples/s/p 0:19:54 } +2024-07-26 00:54:21,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 815/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 1.2194764e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:54:21,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43737 samples/s/p 0:19:51 } +2024-07-26 00:54:24,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 817/ 1625], loss: 0.958, per_step_time: 1470ms, lr: 1.2183987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:24,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.44070 samples/s/p 0:19:48 } +2024-07-26 00:54:27,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 819/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.2173217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:27,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43565 samples/s/p 0:19:46 } +2024-07-26 00:54:30,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 821/ 1625], loss: 1.135, per_step_time: 1469ms, lr: 1.2162501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:30,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.44490 samples/s/p 0:19:41 } +2024-07-26 00:54:33,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 823/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 1.2151784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:33,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.42999 samples/s/p 0:19:41 } +2024-07-26 00:54:36,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 825/ 1625], loss: 1.055, per_step_time: 1473ms, lr: 1.214111e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:54:36,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.43042 samples/s/p 0:19:38 } +2024-07-26 00:54:39,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 827/ 1625], loss: 1.006, per_step_time: 1474ms, lr: 1.2130454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:39,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.42437 samples/s/p 0:19:36 } +2024-07-26 00:54:42,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 829/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 1.2119832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:42,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.43914 samples/s/p 0:19:30 } +2024-07-26 00:54:45,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 831/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 1.2109227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:45,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.43273 samples/s/p 0:19:29 } +2024-07-26 00:54:48,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 833/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.2098657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:48,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.43228 samples/s/p 0:19:26 } +2024-07-26 00:54:51,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 835/ 1625], loss: 0.949, per_step_time: 1471ms, lr: 1.2088104e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:54:51,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.43639 samples/s/p 0:19:22 } +2024-07-26 00:54:54,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 837/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 1.2077595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:54,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43131 samples/s/p 0:19:20 } +2024-07-26 00:54:57,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 839/ 1625], loss: 1.307, per_step_time: 1472ms, lr: 1.2067094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:57,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43404 samples/s/p 0:19:17 } +2024-07-26 00:55:00,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 841/ 1625], loss: 1.252, per_step_time: 1470ms, lr: 1.2056628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:00,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.44071 samples/s/p 0:19:12 } +2024-07-26 00:55:03,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 843/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.2046196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:03,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43628 samples/s/p 0:19:10 } +2024-07-26 00:55:06,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 845/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 1.2035764e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:55:06,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43213 samples/s/p 0:19:08 } +2024-07-26 00:55:09,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 847/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 1.2025375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:09,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43215 samples/s/p 0:19:05 } +2024-07-26 00:55:12,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 849/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 1.2015031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:12,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43411 samples/s/p 0:19:02 } +2024-07-26 00:55:15,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 851/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 1.2004693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:15,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43753 samples/s/p 0:18:58 } +2024-07-26 00:55:18,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 853/ 1625], loss: 0.971, per_step_time: 1472ms, lr: 1.1994383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:18,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43406 samples/s/p 0:18:56 } +2024-07-26 00:55:20,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 855/ 1625], loss: 1.100, per_step_time: 1470ms, lr: 1.198409e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:55:20,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.43874 samples/s/p 0:18:52 } +2024-07-26 00:55:23,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 857/ 1625], loss: 1.175, per_step_time: 1475ms, lr: 1.1973831e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:23,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.42237 samples/s/p 0:18:53 } +2024-07-26 00:55:26,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 859/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.1963607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:26,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.43209 samples/s/p 0:18:48 } +2024-07-26 00:55:29,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 861/ 1625], loss: 1.147, per_step_time: 1476ms, lr: 1.1953391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:29,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.41923 samples/s/p 0:18:47 } +2024-07-26 00:55:32,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 863/ 1625], loss: 1.289, per_step_time: 1470ms, lr: 1.1943227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:32,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.44014 samples/s/p 0:18:40 } +2024-07-26 00:55:35,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 865/ 1625], loss: 1.402, per_step_time: 1471ms, lr: 1.1933064e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:55:35,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.43730 samples/s/p 0:18:38 } +2024-07-26 00:55:38,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 867/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 1.1922943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:38,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.43258 samples/s/p 0:18:36 } +2024-07-26 00:55:41,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 869/ 1625], loss: 1.012, per_step_time: 1472ms, lr: 1.1912848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:41,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.43270 samples/s/p 0:18:33 } +2024-07-26 00:55:44,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 871/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 1.1902771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:44,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.42947 samples/s/p 0:18:30 } +2024-07-26 00:55:47,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 873/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 1.1892737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:47,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43490 samples/s/p 0:18:26 } +2024-07-26 00:55:50,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 875/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 1.188272e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:55:50,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43150 samples/s/p 0:18:24 } +2024-07-26 00:55:53,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 877/ 1625], loss: 1.128, per_step_time: 1473ms, lr: 1.1872712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:53,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43102 samples/s/p 0:18:21 } +2024-07-26 00:55:56,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 879/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 1.1862755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:56,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43271 samples/s/p 0:18:18 } +2024-07-26 00:55:59,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 881/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 1.1852799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:59,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43380 samples/s/p 0:18:15 } +2024-07-26 00:56:02,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 883/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 1.1842894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:02,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43420 samples/s/p 0:18:12 } +2024-07-26 00:56:05,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 885/ 1625], loss: 1.040, per_step_time: 1472ms, lr: 1.1833007e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:56:05,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43375 samples/s/p 0:18:09 } +2024-07-26 00:56:08,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 887/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 1.1823155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:08,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43748 samples/s/p 0:18:05 } +2024-07-26 00:56:11,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 889/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 1.181332e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:11,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.42757 samples/s/p 0:18:04 } +2024-07-26 00:56:14,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 891/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 1.180351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:14,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43635 samples/s/p 0:18:00 } +2024-07-26 00:56:17,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 893/ 1625], loss: 1.015, per_step_time: 1472ms, lr: 1.1793726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:17,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43383 samples/s/p 0:17:57 } +2024-07-26 00:56:20,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 895/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 1.178396e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:56:20,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.42843 samples/s/p 0:17:55 } +2024-07-26 00:56:23,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 897/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 1.1774246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:23,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43482 samples/s/p 0:17:51 } +2024-07-26 00:56:25,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 899/ 1625], loss: 1.249, per_step_time: 1473ms, lr: 1.1764548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:25,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43070 samples/s/p 0:17:49 } +2024-07-26 00:56:28,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 901/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.1754878e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:28,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43803 samples/s/p 0:17:45 } +2024-07-26 00:56:31,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 903/ 1625], loss: 1.073, per_step_time: 1472ms, lr: 1.1745224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:31,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43323 samples/s/p 0:17:43 } +2024-07-26 00:56:34,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 905/ 1625], loss: 0.961, per_step_time: 1473ms, lr: 1.1735588e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:56:34,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.42834 samples/s/p 0:17:41 } +2024-07-26 00:56:37,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 907/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 1.1726003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:37,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43350 samples/s/p 0:17:37 } +2024-07-26 00:56:40,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 909/ 1625], loss: 0.983, per_step_time: 1473ms, lr: 1.1716427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:40,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.42842 samples/s/p 0:17:35 } +2024-07-26 00:56:43,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 911/ 1625], loss: 1.247, per_step_time: 1473ms, lr: 1.1706876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:43,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.42988 samples/s/p 0:17:31 } +2024-07-26 00:56:46,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 913/ 1625], loss: 1.013, per_step_time: 1472ms, lr: 1.169736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:46,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43340 samples/s/p 0:17:28 } +2024-07-26 00:56:49,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 915/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 1.168788e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:56:49,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.44171 samples/s/p 0:17:23 } +2024-07-26 00:56:52,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 917/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 1.1678408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:52,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43587 samples/s/p 0:17:21 } +2024-07-26 00:56:55,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 919/ 1625], loss: 1.351, per_step_time: 1472ms, lr: 1.1668986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:55,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43234 samples/s/p 0:17:19 } +2024-07-26 00:56:58,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 921/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 1.1659566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:58,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43619 samples/s/p 0:17:16 } +2024-07-26 00:57:01,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 923/ 1625], loss: 1.024, per_step_time: 1471ms, lr: 1.1650188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:01,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43746 samples/s/p 0:17:12 } +2024-07-26 00:57:04,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 925/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 1.1640828e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:57:04,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43396 samples/s/p 0:17:10 } +2024-07-26 00:57:07,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 927/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 1.1631478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:07,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43936 samples/s/p 0:17:06 } +2024-07-26 00:57:10,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 929/ 1625], loss: 1.247, per_step_time: 1473ms, lr: 1.1622195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:10,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43061 samples/s/p 0:17:05 } +2024-07-26 00:57:13,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 931/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 1.1612905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:13,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43323 samples/s/p 0:17:01 } +2024-07-26 00:57:16,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 933/ 1625], loss: 0.981, per_step_time: 1473ms, lr: 1.1603656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:16,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43049 samples/s/p 0:16:59 } +2024-07-26 00:57:19,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 935/ 1625], loss: 1.391, per_step_time: 1475ms, lr: 1.1594426e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:57:19,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.42257 samples/s/p 0:16:57 } +2024-07-26 00:57:22,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 937/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 1.1585222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:22,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43617 samples/s/p 0:16:52 } +2024-07-26 00:57:24,991 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 939/ 1625], loss: 1.020, per_step_time: 1471ms, lr: 1.1576052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:24,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43638 samples/s/p 0:16:49 } +2024-07-26 00:57:27,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 941/ 1625], loss: 1.043, per_step_time: 1471ms, lr: 1.1566899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:27,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43604 samples/s/p 0:16:46 } +2024-07-26 00:57:30,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 943/ 1625], loss: 1.395, per_step_time: 1472ms, lr: 1.1557781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:30,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43290 samples/s/p 0:16:44 } +2024-07-26 00:57:33,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 945/ 1625], loss: 1.187, per_step_time: 1473ms, lr: 1.1548681e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:57:33,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.42976 samples/s/p 0:16:41 } +2024-07-26 00:57:36,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 947/ 1625], loss: 1.033, per_step_time: 1473ms, lr: 1.1539623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:36,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.42873 samples/s/p 0:16:39 } +2024-07-26 00:57:39,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 949/ 1625], loss: 1.067, per_step_time: 1470ms, lr: 1.1530583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:39,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43993 samples/s/p 0:16:34 } +2024-07-26 00:57:42,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 951/ 1625], loss: 1.334, per_step_time: 1473ms, lr: 1.1521586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:42,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.42759 samples/s/p 0:16:33 } +2024-07-26 00:57:45,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 953/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.1512581e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:45,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43381 samples/s/p 0:16:29 } +2024-07-26 00:57:48,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 955/ 1625], loss: 1.356, per_step_time: 1469ms, lr: 1.1503627e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:57:48,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.44296 samples/s/p 0:16:24 } +2024-07-26 00:57:51,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 957/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 1.1494699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:51,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43288 samples/s/p 0:16:23 } +2024-07-26 00:57:54,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 959/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.1485771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:54,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43446 samples/s/p 0:16:20 } +2024-07-26 00:57:57,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 961/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 1.1476903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:57,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43010 samples/s/p 0:16:18 } +2024-07-26 00:58:00,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 963/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.1468053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:00,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43740 samples/s/p 0:16:13 } +2024-07-26 00:58:03,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 965/ 1625], loss: 0.989, per_step_time: 1471ms, lr: 1.1459211e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:58:03,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43499 samples/s/p 0:16:11 } +2024-07-26 00:58:06,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 967/ 1625], loss: 1.185, per_step_time: 1473ms, lr: 1.1450413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:06,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.42921 samples/s/p 0:16:09 } +2024-07-26 00:58:09,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 969/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.1441632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:09,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.43817 samples/s/p 0:16:05 } +2024-07-26 00:58:12,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 971/ 1625], loss: 1.397, per_step_time: 1472ms, lr: 1.1432877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:12,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.43338 samples/s/p 0:16:02 } +2024-07-26 00:58:15,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 973/ 1625], loss: 1.293, per_step_time: 1471ms, lr: 1.1424165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:15,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.43646 samples/s/p 0:15:59 } +2024-07-26 00:58:18,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 975/ 1625], loss: 1.173, per_step_time: 1470ms, lr: 1.1415462e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:58:18,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.44095 samples/s/p 0:15:55 } +2024-07-26 00:58:21,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 977/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 1.1406785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:21,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.43329 samples/s/p 0:15:54 } +2024-07-26 00:58:24,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 979/ 1625], loss: 1.317, per_step_time: 1470ms, lr: 1.1398151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:24,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.44099 samples/s/p 0:15:49 } +2024-07-26 00:58:26,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 981/ 1625], loss: 1.136, per_step_time: 1470ms, lr: 1.1389534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:26,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.43861 samples/s/p 0:15:47 } +2024-07-26 00:58:29,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 983/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.1380953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:29,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.43368 samples/s/p 0:15:45 } +2024-07-26 00:58:32,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 985/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 1.1372379e-06, overflow 
cond: False, loss_scale: 1.0 +2024-07-26 00:58:32,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43790 samples/s/p 0:15:41 } +2024-07-26 00:58:35,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 987/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 1.1363849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:35,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43437 samples/s/p 0:15:39 } +2024-07-26 00:58:38,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 989/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.1355327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:38,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43388 samples/s/p 0:15:36 } +2024-07-26 00:58:41,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 991/ 1625], loss: 1.498, per_step_time: 1470ms, lr: 1.1346857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:41,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.44083 samples/s/p 0:15:32 } +2024-07-26 00:58:44,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 993/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 1.1338395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:44,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.44199 samples/s/p 0:15:29 } +2024-07-26 00:58:47,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 995/ 1625], loss: 1.396, per_step_time: 1470ms, lr: 1.1329969e-06, 
overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:47,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43891 samples/s/p 0:15:26 } +2024-07-26 00:58:50,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 997/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 1.1321551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:50,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43556 samples/s/p 0:15:24 } +2024-07-26 00:58:53,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 999/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 1.1313176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:53,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43649 samples/s/p 0:15:21 } +2024-07-26 00:58:56,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1001/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 1.1304828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:56,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.42822 samples/s/p 0:15:19 } +2024-07-26 00:58:59,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1003/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.1296487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:59,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43538 samples/s/p 0:15:15 } +2024-07-26 00:59:02,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1005/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 
1.1288207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:02,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43422 samples/s/p 0:15:12 } +2024-07-26 00:59:05,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1007/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.1279928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:05,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43601 samples/s/p 0:15:09 } +2024-07-26 00:59:08,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1009/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 1.1271692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:08,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43776 samples/s/p 0:15:06 } +2024-07-26 00:59:11,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1011/ 1625], loss: 1.373, per_step_time: 1474ms, lr: 1.1263472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:11,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.42614 samples/s/p 0:15:05 } +2024-07-26 00:59:14,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1013/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.1255271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:14,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43206 samples/s/p 0:15:01 } +2024-07-26 00:59:17,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1015/ 1625], loss: 1.164, per_step_time: 
1471ms, lr: 1.1247112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:17,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43530 samples/s/p 0:14:57 } +2024-07-26 00:59:20,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1017/ 1625], loss: 1.015, per_step_time: 1470ms, lr: 1.1238961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:20,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.44014 samples/s/p 0:14:54 } +2024-07-26 00:59:23,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1019/ 1625], loss: 0.968, per_step_time: 1470ms, lr: 1.1230854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:23,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.43924 samples/s/p 0:14:51 } +2024-07-26 00:59:25,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1021/ 1625], loss: 1.212, per_step_time: 1473ms, lr: 1.1222766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:25,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.42818 samples/s/p 0:14:50 } +2024-07-26 00:59:28,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1023/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 1.1214719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:28,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.42878 samples/s/p 0:14:47 } +2024-07-26 00:59:31,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1025/ 1625], loss: 1.134, 
per_step_time: 1470ms, lr: 1.1206673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:31,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.44026 samples/s/p 0:14:42 } +2024-07-26 00:59:34,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1027/ 1625], loss: 0.967, per_step_time: 1471ms, lr: 1.119867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:34,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.43630 samples/s/p 0:14:40 } +2024-07-26 00:59:37,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1029/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 1.1190692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:37,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.43483 samples/s/p 0:14:37 } +2024-07-26 00:59:40,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1031/ 1625], loss: 1.034, per_step_time: 1470ms, lr: 1.1182733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:40,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.44040 samples/s/p 0:14:33 } +2024-07-26 00:59:43,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1033/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 1.1174816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:43,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.43482 samples/s/p 0:14:31 } +2024-07-26 00:59:46,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1035/ 1625], 
loss: 1.089, per_step_time: 1469ms, lr: 1.1166908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:46,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.44492 samples/s/p 0:14:26 } +2024-07-26 00:59:49,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1037/ 1625], loss: 0.916, per_step_time: 1469ms, lr: 1.1159034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:49,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.44227 samples/s/p 0:14:24 } +2024-07-26 00:59:52,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1039/ 1625], loss: 0.982, per_step_time: 1470ms, lr: 1.1151195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:52,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.44155 samples/s/p 0:14:21 } +2024-07-26 00:59:55,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1041/ 1625], loss: 0.996, per_step_time: 1470ms, lr: 1.1143366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:55,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.44041 samples/s/p 0:14:18 } +2024-07-26 00:59:58,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1043/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 1.1135578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:58,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.43214 samples/s/p 0:14:17 } +2024-07-26 01:00:01,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 
1045/ 1625], loss: 1.054, per_step_time: 1474ms, lr: 1.11278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:01,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.42659 samples/s/p 0:14:15 } +2024-07-26 01:00:04,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1047/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 1.1120056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:04,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.43373 samples/s/p 0:14:10 } +2024-07-26 01:00:07,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1049/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 1.1112346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:07,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.44078 samples/s/p 0:14:06 } +2024-07-26 01:00:10,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1051/ 1625], loss: 1.026, per_step_time: 1472ms, lr: 1.1104663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:10,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43157 samples/s/p 0:14:05 } +2024-07-26 01:00:13,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1053/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 1.1096997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:13,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43572 samples/s/p 0:14:01 } +2024-07-26 01:00:16,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 
10], step:[ 1055/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.1089375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:16,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43253 samples/s/p 0:13:59 } +2024-07-26 01:00:19,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1057/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.108176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:19,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43625 samples/s/p 0:13:55 } +2024-07-26 01:00:22,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1059/ 1625], loss: 1.398, per_step_time: 1474ms, lr: 1.1074172e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:22,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.42592 samples/s/p 0:13:54 } +2024-07-26 01:00:24,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1061/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.1066627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:24,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43515 samples/s/p 0:13:50 } +2024-07-26 01:00:27,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1063/ 1625], loss: 1.295, per_step_time: 1472ms, lr: 1.1059082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:27,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43263 samples/s/p 0:13:47 } +2024-07-26 01:00:30,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 10/ 10], step:[ 1065/ 1625], loss: 1.138, per_step_time: 1473ms, lr: 1.1051579e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:30,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.43026 samples/s/p 0:13:45 } +2024-07-26 01:00:33,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1067/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 1.1044121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:33,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.42950 samples/s/p 0:13:42 } +2024-07-26 01:00:36,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1069/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 1.1036655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:36,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.43503 samples/s/p 0:13:38 } +2024-07-26 01:00:39,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1071/ 1625], loss: 0.999, per_step_time: 1471ms, lr: 1.1029247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:39,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.43645 samples/s/p 0:13:35 } +2024-07-26 01:00:42,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1073/ 1625], loss: 1.262, per_step_time: 1473ms, lr: 1.1021832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:42,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.42858 samples/s/p 0:13:33 } +2024-07-26 01:00:45,661 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 10/ 10], step:[ 1075/ 1625], loss: 1.200, per_step_time: 1473ms, lr: 1.1014486e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:45,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.43039 samples/s/p 0:13:30 } +2024-07-26 01:00:48,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1077/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 1.1007139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:48,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.43423 samples/s/p 0:13:26 } +2024-07-26 01:00:51,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1079/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.0999811e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:51,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.43571 samples/s/p 0:13:23 } +2024-07-26 01:00:54,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1081/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.0992525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:54,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43790 samples/s/p 0:13:20 } +2024-07-26 01:00:57,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1083/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.0985265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:57,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43206 samples/s/p 0:13:18 } +2024-07-26 01:01:00,414 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1085/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 1.0978031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:00,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43869 samples/s/p 0:13:14 } +2024-07-26 01:01:03,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1087/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 1.0970814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:03,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43725 samples/s/p 0:13:11 } +2024-07-26 01:01:06,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1089/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.0963632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:06,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43338 samples/s/p 0:13:09 } +2024-07-26 01:01:09,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1091/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 1.0956476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:09,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43865 samples/s/p 0:13:05 } +2024-07-26 01:01:12,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1093/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 1.0949345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:12,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43385 samples/s/p 0:13:03 } +2024-07-26 
01:01:15,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1095/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 1.094225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:15,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43159 samples/s/p 0:13:00 } +2024-07-26 01:01:18,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1097/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 1.0935163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:18,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43419 samples/s/p 0:12:57 } +2024-07-26 01:01:21,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1099/ 1625], loss: 1.011, per_step_time: 1471ms, lr: 1.0928111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:21,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43630 samples/s/p 0:12:54 } +2024-07-26 01:01:24,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1101/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 1.0921093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:24,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43428 samples/s/p 0:12:51 } +2024-07-26 01:01:26,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1103/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 1.0914084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:26,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43808 samples/s/p 0:12:47 } 
+2024-07-26 01:01:29,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1105/ 1625], loss: 1.091, per_step_time: 1470ms, lr: 1.0907135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:29,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43890 samples/s/p 0:12:44 } +2024-07-26 01:01:32,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1107/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 1.0900178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:32,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.44093 samples/s/p 0:12:41 } +2024-07-26 01:01:35,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1109/ 1625], loss: 1.027, per_step_time: 1470ms, lr: 1.0893273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:35,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43963 samples/s/p 0:12:38 } +2024-07-26 01:01:38,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1111/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 1.0886375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:38,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43441 samples/s/p 0:12:36 } +2024-07-26 01:01:41,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1113/ 1625], loss: 1.007, per_step_time: 1470ms, lr: 1.0879496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:41,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.44159 samples/s/p 
0:12:32 } +2024-07-26 01:01:44,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1115/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 1.0872668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:44,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43822 samples/s/p 0:12:30 } +2024-07-26 01:01:47,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1117/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.0865875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:47,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43623 samples/s/p 0:12:27 } +2024-07-26 01:01:50,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1119/ 1625], loss: 1.302, per_step_time: 1472ms, lr: 1.0859081e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:50,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43133 samples/s/p 0:12:25 } +2024-07-26 01:01:53,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1121/ 1625], loss: 1.209, per_step_time: 1469ms, lr: 1.0852315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:53,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.44219 samples/s/p 0:12:20 } +2024-07-26 01:01:56,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1123/ 1625], loss: 0.982, per_step_time: 1472ms, lr: 1.084559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:56,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43458 
samples/s/p 0:12:18 } +2024-07-26 01:01:59,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1125/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.0838884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:59,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43121 samples/s/p 0:12:16 } +2024-07-26 01:02:02,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1127/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.0832194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:02,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43644 samples/s/p 0:12:12 } +2024-07-26 01:02:05,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1129/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.0825556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:05,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43479 samples/s/p 0:12:10 } +2024-07-26 01:02:08,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1131/ 1625], loss: 1.022, per_step_time: 1471ms, lr: 1.0818919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:08,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43573 samples/s/p 0:12:07 } +2024-07-26 01:02:11,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1133/ 1625], loss: 1.336, per_step_time: 1472ms, lr: 1.0812325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:11,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ 
| 5.43398 samples/s/p 0:12:04 } +2024-07-26 01:02:14,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1135/ 1625], loss: 1.187, per_step_time: 1470ms, lr: 1.0805747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:14,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.44004 samples/s/p 0:12:00 } +2024-07-26 01:02:17,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1137/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 1.0799223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:17,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43832 samples/s/p 0:11:57 } +2024-07-26 01:02:20,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1139/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 1.0792688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:20,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43629 samples/s/p 0:11:55 } +2024-07-26 01:02:23,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1141/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.0786198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:23,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43712 samples/s/p 0:11:52 } +2024-07-26 01:02:25,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1143/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 1.0779751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:25,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% 
|████████████████████████████████████████████████ | 5.43470 samples/s/p 0:11:49 } +2024-07-26 01:02:28,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1145/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 1.0773304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:28,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43851 samples/s/p 0:11:46 } +2024-07-26 01:02:31,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1147/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.076689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:31,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43714 samples/s/p 0:11:43 } +2024-07-26 01:02:34,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1149/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 1.0760511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:34,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43415 samples/s/p 0:11:40 } +2024-07-26 01:02:37,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1151/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 1.0754143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:37,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43362 samples/s/p 0:11:37 } +2024-07-26 01:02:40,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1153/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 1.0747824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:40,722 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 97.1% |████████████████████████████████████████████████ | 5.44023 samples/s/p 0:11:34 } +2024-07-26 01:02:43,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1155/ 1625], loss: 1.252, per_step_time: 1469ms, lr: 1.0741506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:43,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.44300 samples/s/p 0:11:30 } +2024-07-26 01:02:46,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1157/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 1.0735232e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:46,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43469 samples/s/p 0:11:28 } +2024-07-26 01:02:49,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1159/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.0728984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:49,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43512 samples/s/p 0:11:25 } +2024-07-26 01:02:52,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1161/ 1625], loss: 0.912, per_step_time: 1471ms, lr: 1.0722744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:52,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43564 samples/s/p 0:11:22 } +2024-07-26 01:02:55,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1163/ 1625], loss: 0.951, per_step_time: 1471ms, lr: 1.0716547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:55,471 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43631 samples/s/p 0:11:19 } +2024-07-26 01:02:58,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1165/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 1.0710376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:58,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.42792 samples/s/p 0:11:17 } +2024-07-26 01:03:01,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1167/ 1625], loss: 1.370, per_step_time: 1472ms, lr: 1.070424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:01,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43305 samples/s/p 0:11:14 } +2024-07-26 01:03:04,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1169/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 1.0698112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:04,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43799 samples/s/p 0:11:10 } +2024-07-26 01:03:07,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1171/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 1.0692028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:07,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43765 samples/s/p 0:11:07 } +2024-07-26 01:03:10,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1173/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 1.0685951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 
01:03:10,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43277 samples/s/p 0:11:05 } +2024-07-26 01:03:13,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1175/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.0679919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:13,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43568 samples/s/p 0:11:02 } +2024-07-26 01:03:16,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1177/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 1.0673913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:16,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43658 samples/s/p 0:10:59 } +2024-07-26 01:03:19,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1179/ 1625], loss: 1.011, per_step_time: 1472ms, lr: 1.0667932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:19,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43149 samples/s/p 0:10:56 } +2024-07-26 01:03:22,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1181/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 1.0661968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:22,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43544 samples/s/p 0:10:53 } +2024-07-26 01:03:24,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1183/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 1.0656022e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-26 01:03:24,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43959 samples/s/p 0:10:50 } +2024-07-26 01:03:27,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1185/ 1625], loss: 1.198, per_step_time: 1473ms, lr: 1.0650127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:27,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.42971 samples/s/p 0:10:48 } +2024-07-26 01:03:30,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1187/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 1.0644251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:30,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43152 samples/s/p 0:10:45 } +2024-07-26 01:03:33,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1189/ 1625], loss: 1.031, per_step_time: 1474ms, lr: 1.0638399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:33,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.42724 samples/s/p 0:10:42 } +2024-07-26 01:03:36,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1191/ 1625], loss: 0.941, per_step_time: 1473ms, lr: 1.0632566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:36,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.42946 samples/s/p 0:10:39 } +2024-07-26 01:03:39,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1193/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 1.0626775e-06, overflow cond: False, 
loss_scale: 1.0 +2024-07-26 01:03:39,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43817 samples/s/p 0:10:35 } +2024-07-26 01:03:42,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1195/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 1.0621011e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:42,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43340 samples/s/p 0:10:33 } +2024-07-26 01:03:45,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1197/ 1625], loss: 1.254, per_step_time: 1470ms, lr: 1.0615246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:45,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.44049 samples/s/p 0:10:29 } +2024-07-26 01:03:48,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1199/ 1625], loss: 1.116, per_step_time: 1473ms, lr: 1.0609533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:48,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43070 samples/s/p 0:10:27 } +2024-07-26 01:03:51,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1201/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 1.0603829e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:51,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43159 samples/s/p 0:10:24 } +2024-07-26 01:03:54,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1203/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 1.0598177e-06, overflow 
cond: False, loss_scale: 1.0 +2024-07-26 01:03:54,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43418 samples/s/p 0:10:21 } +2024-07-26 01:03:57,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1205/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 1.0592541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:57,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43647 samples/s/p 0:10:18 } +2024-07-26 01:04:00,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1207/ 1625], loss: 0.954, per_step_time: 1472ms, lr: 1.0586924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:00,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43469 samples/s/p 0:10:15 } +2024-07-26 01:04:03,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1209/ 1625], loss: 0.949, per_step_time: 1470ms, lr: 1.0581332e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:03,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43876 samples/s/p 0:10:11 } +2024-07-26 01:04:06,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1211/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 1.0575784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:06,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43052 samples/s/p 0:10:09 } +2024-07-26 01:04:09,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1213/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 
1.0570244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:09,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43334 samples/s/p 0:10:06 } +2024-07-26 01:04:12,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1215/ 1625], loss: 1.362, per_step_time: 1471ms, lr: 1.0564738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:12,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43805 samples/s/p 0:10:03 } +2024-07-26 01:04:15,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1217/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.0559268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:15,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43180 samples/s/p 0:10:00 } +2024-07-26 01:04:18,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1219/ 1625], loss: 1.181, per_step_time: 1473ms, lr: 1.0553805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:18,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43035 samples/s/p 0:09:58 } +2024-07-26 01:04:21,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1221/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 1.0548387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:21,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43175 samples/s/p 0:09:55 } +2024-07-26 01:04:24,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1223/ 1625], loss: 1.189, per_step_time: 
1470ms, lr: 1.0542967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:24,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.44077 samples/s/p 0:09:51 } +2024-07-26 01:04:26,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1225/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 1.0537617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:26,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43501 samples/s/p 0:09:48 } +2024-07-26 01:04:29,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1227/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.0532268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:29,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43633 samples/s/p 0:09:45 } +2024-07-26 01:04:32,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1229/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 1.0526935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:32,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43658 samples/s/p 0:09:42 } +2024-07-26 01:04:35,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1231/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 1.0521646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:35,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43329 samples/s/p 0:09:40 } +2024-07-26 01:04:38,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1233/ 1625], loss: 1.109, 
per_step_time: 1472ms, lr: 1.0516374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:38,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43173 samples/s/p 0:09:37 } +2024-07-26 01:04:41,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1235/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 1.0511145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:41,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43493 samples/s/p 0:09:34 } +2024-07-26 01:04:44,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1237/ 1625], loss: 1.166, per_step_time: 1470ms, lr: 1.0505934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:44,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.44203 samples/s/p 0:09:30 } +2024-07-26 01:04:47,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1239/ 1625], loss: 1.200, per_step_time: 1475ms, lr: 1.0500747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:47,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.42075 samples/s/p 0:09:29 } +2024-07-26 01:04:50,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1241/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.0495597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:50,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43343 samples/s/p 0:09:25 } +2024-07-26 01:04:53,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1243/ 1625], 
loss: 1.115, per_step_time: 1471ms, lr: 1.0490463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:53,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43738 samples/s/p 0:09:22 } +2024-07-26 01:04:56,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1245/ 1625], loss: 1.024, per_step_time: 1470ms, lr: 1.0485355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:56,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.44157 samples/s/p 0:09:18 } +2024-07-26 01:04:59,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1247/ 1625], loss: 1.284, per_step_time: 1471ms, lr: 1.0480273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:59,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43496 samples/s/p 0:09:16 } +2024-07-26 01:05:02,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1249/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 1.0475218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:02,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43223 samples/s/p 0:09:13 } +2024-07-26 01:05:05,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1251/ 1625], loss: 1.355, per_step_time: 1472ms, lr: 1.0470196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:05,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43456 samples/s/p 0:09:10 } +2024-07-26 01:05:08,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 
1253/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.0465192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:08,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43639 samples/s/p 0:09:07 } +2024-07-26 01:05:11,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1255/ 1625], loss: 1.096, per_step_time: 1474ms, lr: 1.0460213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:11,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.42683 samples/s/p 0:09:05 } +2024-07-26 01:05:14,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1257/ 1625], loss: 1.218, per_step_time: 1470ms, lr: 1.0455278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:14,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.44151 samples/s/p 0:09:01 } +2024-07-26 01:05:17,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1259/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.0450344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:17,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43722 samples/s/p 0:08:58 } +2024-07-26 01:05:20,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1261/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 1.044546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:20,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43767 samples/s/p 0:08:55 } +2024-07-26 01:05:23,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 
10], step:[ 1263/ 1625], loss: 1.073, per_step_time: 1472ms, lr: 1.0440604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:23,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43215 samples/s/p 0:08:53 } +2024-07-26 01:05:25,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1265/ 1625], loss: 0.953, per_step_time: 1471ms, lr: 1.0435755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:25,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43682 samples/s/p 0:08:49 } +2024-07-26 01:05:28,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1267/ 1625], loss: 1.072, per_step_time: 1470ms, lr: 1.0430958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:28,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.44058 samples/s/p 0:08:46 } +2024-07-26 01:05:31,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1269/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 1.0426162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:31,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43825 samples/s/p 0:08:43 } +2024-07-26 01:05:34,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1271/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 1.042139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:34,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43753 samples/s/p 0:08:40 } +2024-07-26 01:05:37,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 10/ 10], step:[ 1273/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 1.0416654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:37,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43200 samples/s/p 0:08:38 } +2024-07-26 01:05:40,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1275/ 1625], loss: 0.948, per_step_time: 1470ms, lr: 1.0411961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:40,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.44016 samples/s/p 0:08:34 } +2024-07-26 01:05:43,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1277/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 1.0407277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:43,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.44186 samples/s/p 0:08:31 } +2024-07-26 01:05:46,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1279/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 1.0402645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:46,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43122 samples/s/p 0:08:29 } +2024-07-26 01:05:49,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1281/ 1625], loss: 1.083, per_step_time: 1470ms, lr: 1.0398012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:49,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43991 samples/s/p 0:08:25 } +2024-07-26 01:05:52,535 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 10/ 10], step:[ 1283/ 1625], loss: 1.330, per_step_time: 1471ms, lr: 1.0393405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:52,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43490 samples/s/p 0:08:23 } +2024-07-26 01:05:55,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1285/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 1.0388834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:55,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43301 samples/s/p 0:08:20 } +2024-07-26 01:05:58,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1287/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.0384288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:58,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43317 samples/s/p 0:08:17 } +2024-07-26 01:06:01,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1289/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.0379767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:01,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43376 samples/s/p 0:08:14 } +2024-07-26 01:06:04,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1291/ 1625], loss: 1.036, per_step_time: 1471ms, lr: 1.0375273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:04,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43757 samples/s/p 0:08:11 } +2024-07-26 01:06:07,296 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1293/ 1625], loss: 1.026, per_step_time: 1473ms, lr: 1.0370796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:07,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.42823 samples/s/p 0:08:09 } +2024-07-26 01:06:10,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1295/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.0366372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:10,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.43281 samples/s/p 0:08:05 } +2024-07-26 01:06:13,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1297/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 1.0361964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:13,200 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.43502 samples/s/p 0:08:02 } +2024-07-26 01:06:16,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1299/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 1.0357581e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:16,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.43857 samples/s/p 0:07:59 } +2024-07-26 01:06:19,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1301/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 1.0353217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:19,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.43759 samples/s/p 0:07:56 } +2024-07-26 
01:06:22,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1303/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 1.034887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:22,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.43719 samples/s/p 0:07:53 } +2024-07-26 01:06:24,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1305/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 1.0344575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:24,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.43968 samples/s/p 0:07:50 } +2024-07-26 01:06:27,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1307/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 1.0340297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:27,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.43305 samples/s/p 0:07:48 } +2024-07-26 01:06:30,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1309/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 1.0336053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:30,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43078 samples/s/p 0:07:45 } +2024-07-26 01:06:33,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1311/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 1.0331818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:33,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43425 samples/s/p 0:07:42 
} +2024-07-26 01:06:36,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1313/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 1.0327626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:36,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43238 samples/s/p 0:07:39 } +2024-07-26 01:06:39,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1315/ 1625], loss: 1.175, per_step_time: 1470ms, lr: 1.0323444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:39,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.44124 samples/s/p 0:07:35 } +2024-07-26 01:06:42,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1317/ 1625], loss: 1.289, per_step_time: 1469ms, lr: 1.0319303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:42,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.44284 samples/s/p 0:07:32 } +2024-07-26 01:06:45,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1319/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 1.0315181e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:45,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43477 samples/s/p 0:07:30 } +2024-07-26 01:06:48,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1321/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 1.0311085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:48,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.44080 
samples/s/p 0:07:26 } +2024-07-26 01:06:51,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1323/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 1.0307023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:51,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43548 samples/s/p 0:07:24 } +2024-07-26 01:06:54,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1325/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 1.0302995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:54,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43192 samples/s/p 0:07:21 } +2024-07-26 01:06:57,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1327/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.0298976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:57,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43751 samples/s/p 0:07:18 } +2024-07-26 01:07:00,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1329/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 1.0295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:00,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43756 samples/s/p 0:07:15 } +2024-07-26 01:07:03,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1331/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 1.0291034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:03,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% 
|█████████████████████████████████████████████████ | 5.43223 samples/s/p 0:07:12 } +2024-07-26 01:07:06,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1333/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 1.0287101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:06,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43421 samples/s/p 0:07:09 } +2024-07-26 01:07:09,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1335/ 1625], loss: 1.321, per_step_time: 1472ms, lr: 1.0283194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:09,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43265 samples/s/p 0:07:07 } +2024-07-26 01:07:12,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1337/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 1.0279323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:12,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43272 samples/s/p 0:07:04 } +2024-07-26 01:07:15,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1339/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 1.0275477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:15,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43650 samples/s/p 0:07:00 } +2024-07-26 01:07:18,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1341/ 1625], loss: 1.299, per_step_time: 1473ms, lr: 1.0271639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:18,114 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 98.3% |█████████████████████████████████████████████████ | 5.42826 samples/s/p 0:06:58 } +2024-07-26 01:07:21,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1343/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 1.0267854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:21,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.43148 samples/s/p 0:06:55 } +2024-07-26 01:07:24,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1345/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 1.0264085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:24,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.43347 samples/s/p 0:06:52 } +2024-07-26 01:07:26,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1347/ 1625], loss: 1.188, per_step_time: 1470ms, lr: 1.0260335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:26,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.44025 samples/s/p 0:06:48 } +2024-07-26 01:07:29,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1349/ 1625], loss: 1.021, per_step_time: 1473ms, lr: 1.0256618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:29,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.42899 samples/s/p 0:06:46 } +2024-07-26 01:07:32,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1351/ 1625], loss: 1.010, per_step_time: 1472ms, lr: 1.025291e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:32,874 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.43133 samples/s/p 0:06:43 } +2024-07-26 01:07:35,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1353/ 1625], loss: 1.098, per_step_time: 1479ms, lr: 1.0249263e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:35,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.40721 samples/s/p 0:06:42 } +2024-07-26 01:07:38,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1355/ 1625], loss: 1.032, per_step_time: 1473ms, lr: 1.0245616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:38,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.42760 samples/s/p 0:06:37 } +2024-07-26 01:07:41,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1357/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 1.0242012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:41,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43219 samples/s/p 0:06:34 } +2024-07-26 01:07:44,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1359/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.0238425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:44,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43479 samples/s/p 0:06:31 } +2024-07-26 01:07:47,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1361/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 1.0234857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 
01:07:47,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.44006 samples/s/p 0:06:28 } +2024-07-26 01:07:50,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1363/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 1.023133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:50,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43319 samples/s/p 0:06:25 } +2024-07-26 01:07:53,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1365/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 1.022783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:53,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43644 samples/s/p 0:06:22 } +2024-07-26 01:07:56,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1367/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 1.0224346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:56,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43240 samples/s/p 0:06:19 } +2024-07-26 01:07:59,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1369/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.0220889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:59,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43366 samples/s/p 0:06:16 } +2024-07-26 01:08:02,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1371/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 1.0217484e-06, overflow cond: False, loss_scale: 
1.0 +2024-07-26 01:08:02,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.44057 samples/s/p 0:06:13 } +2024-07-26 01:08:05,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1373/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 1.0214079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:05,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43407 samples/s/p 0:06:10 } +2024-07-26 01:08:08,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1375/ 1625], loss: 1.065, per_step_time: 1469ms, lr: 1.0210725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:08,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.44304 samples/s/p 0:06:07 } +2024-07-26 01:08:11,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1377/ 1625], loss: 0.925, per_step_time: 1470ms, lr: 1.0207364e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:11,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.44103 samples/s/p 0:06:04 } +2024-07-26 01:08:14,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1379/ 1625], loss: 1.088, per_step_time: 1471ms, lr: 1.0204053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:14,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.43523 samples/s/p 0:06:02 } +2024-07-26 01:08:17,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1381/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 1.0200761e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 01:08:17,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.42795 samples/s/p 0:05:59 } +2024-07-26 01:08:20,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1383/ 1625], loss: 1.464, per_step_time: 1473ms, lr: 1.0197493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:20,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.42799 samples/s/p 0:05:56 } +2024-07-26 01:08:23,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1385/ 1625], loss: 1.312, per_step_time: 1470ms, lr: 1.0194253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:23,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.43856 samples/s/p 0:05:53 } +2024-07-26 01:08:26,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1387/ 1625], loss: 1.335, per_step_time: 1473ms, lr: 1.0191037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:26,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.43065 samples/s/p 0:05:50 } +2024-07-26 01:08:28,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1389/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 1.0187874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:28,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.43006 samples/s/p 0:05:47 } +2024-07-26 01:08:31,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1391/ 1625], loss: 1.022, per_step_time: 1470ms, lr: 1.0184702e-06, 
overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:31,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.44206 samples/s/p 0:05:43 } +2024-07-26 01:08:34,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1393/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 1.0181583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:34,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.42912 samples/s/p 0:05:41 } +2024-07-26 01:08:37,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1395/ 1625], loss: 1.095, per_step_time: 1469ms, lr: 1.017848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:37,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.44280 samples/s/p 0:05:38 } +2024-07-26 01:08:40,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1397/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.0175395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:40,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43650 samples/s/p 0:05:35 } +2024-07-26 01:08:43,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1399/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.0172334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:43,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43633 samples/s/p 0:05:32 } +2024-07-26 01:08:46,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1401/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 
1.0169335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:46,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43345 samples/s/p 0:05:29 } +2024-07-26 01:08:49,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1403/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 1.0166336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:49,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43509 samples/s/p 0:05:26 } +2024-07-26 01:08:52,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1405/ 1625], loss: 1.306, per_step_time: 1471ms, lr: 1.0163363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:52,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43538 samples/s/p 0:05:23 } +2024-07-26 01:08:55,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1407/ 1625], loss: 1.050, per_step_time: 1470ms, lr: 1.0160417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:55,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43972 samples/s/p 0:05:20 } +2024-07-26 01:08:58,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1409/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 1.0157504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:58,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43824 samples/s/p 0:05:17 } +2024-07-26 01:09:01,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1411/ 1625], loss: 1.178, 
per_step_time: 1471ms, lr: 1.0154608e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:01,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43547 samples/s/p 0:05:14 } +2024-07-26 01:09:04,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1413/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 1.0151748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:04,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43223 samples/s/p 0:05:12 } +2024-07-26 01:09:07,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1415/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 1.0148922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:07,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43494 samples/s/p 0:05:09 } +2024-07-26 01:09:10,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1417/ 1625], loss: 1.266, per_step_time: 1474ms, lr: 1.0146105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:10,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.42524 samples/s/p 0:05:06 } +2024-07-26 01:09:13,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1419/ 1625], loss: 1.294, per_step_time: 1471ms, lr: 1.0143322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:13,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43520 samples/s/p 0:05:03 } +2024-07-26 01:09:16,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1421/ 
1625], loss: 1.016, per_step_time: 1470ms, lr: 1.0140565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:16,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.44083 samples/s/p 0:04:59 } +2024-07-26 01:09:19,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1423/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 1.0137842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:19,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.44105 samples/s/p 0:04:57 } +2024-07-26 01:09:22,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1425/ 1625], loss: 1.024, per_step_time: 1469ms, lr: 1.0135137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:22,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.44349 samples/s/p 0:04:53 } +2024-07-26 01:09:25,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1427/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 1.0132458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:25,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43471 samples/s/p 0:04:51 } +2024-07-26 01:09:27,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1429/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 1.0129821e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:27,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43690 samples/s/p 0:04:48 } +2024-07-26 01:09:30,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 
10], step:[ 1431/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 1.0127186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:30,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43030 samples/s/p 0:04:45 } +2024-07-26 01:09:33,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1433/ 1625], loss: 1.240, per_step_time: 1470ms, lr: 1.0124593e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:33,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.44021 samples/s/p 0:04:42 } +2024-07-26 01:09:36,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1435/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 1.0122026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43835 samples/s/p 0:04:39 } +2024-07-26 01:09:39,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1437/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 1.0119476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:39,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43654 samples/s/p 0:04:36 } +2024-07-26 01:09:42,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1439/ 1625], loss: 1.149, per_step_time: 1473ms, lr: 1.0116961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:42,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.42985 samples/s/p 0:04:34 } +2024-07-26 01:09:45,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 10/ 10], step:[ 1441/ 1625], loss: 1.391, per_step_time: 1471ms, lr: 1.0114472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:45,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43753 samples/s/p 0:04:30 } +2024-07-26 01:09:48,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1443/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 1.0112018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:48,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43613 samples/s/p 0:04:27 } +2024-07-26 01:09:51,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1445/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 1.010958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:51,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43372 samples/s/p 0:04:25 } +2024-07-26 01:09:54,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1447/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 1.0107178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:54,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43641 samples/s/p 0:04:21 } +2024-07-26 01:09:57,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1449/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 1.0104792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:57,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43150 samples/s/p 0:04:19 } +2024-07-26 01:10:00,429 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1451/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 1.0102442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:00,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43404 samples/s/p 0:04:16 } +2024-07-26 01:10:03,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1453/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 1.0100108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:03,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43580 samples/s/p 0:04:13 } +2024-07-26 01:10:06,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1455/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 1.0097809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:06,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43857 samples/s/p 0:04:10 } +2024-07-26 01:10:09,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1457/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 1.0095536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:09,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43461 samples/s/p 0:04:07 } +2024-07-26 01:10:12,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1459/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 1.0093289e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:12,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43403 samples/s/p 0:04:04 } +2024-07-26 
01:10:15,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1461/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 1.0091077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:15,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43826 samples/s/p 0:04:01 } +2024-07-26 01:10:18,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1463/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 1.0088872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:18,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43459 samples/s/p 0:03:58 } +2024-07-26 01:10:21,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1465/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.008672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:21,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43584 samples/s/p 0:03:55 } +2024-07-26 01:10:24,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1467/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 1.008456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:24,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43280 samples/s/p 0:03:52 } +2024-07-26 01:10:26,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1469/ 1625], loss: 1.197, per_step_time: 1469ms, lr: 1.0082451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:26,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.44475 samples/s/p 0:03:49 
} +2024-07-26 01:10:29,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1471/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 1.0080369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:29,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43256 samples/s/p 0:03:46 } +2024-07-26 01:10:32,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1473/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 1.0078303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:32,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43500 samples/s/p 0:03:43 } +2024-07-26 01:10:35,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1475/ 1625], loss: 1.106, per_step_time: 1470ms, lr: 1.007628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:35,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.44074 samples/s/p 0:03:40 } +2024-07-26 01:10:38,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1477/ 1625], loss: 1.105, per_step_time: 1470ms, lr: 1.0074266e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:38,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43940 samples/s/p 0:03:37 } +2024-07-26 01:10:41,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1479/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.0072288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:41,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43120 
samples/s/p 0:03:35 } +2024-07-26 01:10:44,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1481/ 1625], loss: 1.242, per_step_time: 1473ms, lr: 1.0070335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:44,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43092 samples/s/p 0:03:32 } +2024-07-26 01:10:47,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1483/ 1625], loss: 1.175, per_step_time: 1473ms, lr: 1.0068399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:47,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43083 samples/s/p 0:03:29 } +2024-07-26 01:10:50,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1485/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 1.0066514e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:50,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43402 samples/s/p 0:03:26 } +2024-07-26 01:10:53,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1487/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 1.0064639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:53,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43163 samples/s/p 0:03:23 } +2024-07-26 01:10:56,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1489/ 1625], loss: 1.146, per_step_time: 1470ms, lr: 1.0062789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:56,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% 
|█████████████████████████████████████████████████ | 5.43986 samples/s/p 0:03:20 } +2024-07-26 01:10:59,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1491/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 1.0060966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:59,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43825 samples/s/p 0:03:17 } +2024-07-26 01:11:02,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1493/ 1625], loss: 1.116, per_step_time: 1470ms, lr: 1.0059176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:02,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.44126 samples/s/p 0:03:14 } +2024-07-26 01:11:05,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1495/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 1.0057405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:05,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43187 samples/s/p 0:03:11 } +2024-07-26 01:11:08,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1497/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 1.0055668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:08,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43517 samples/s/p 0:03:08 } +2024-07-26 01:11:11,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1499/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 1.0053948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:11,245 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 99.2% |█████████████████████████████████████████████████ | 5.43444 samples/s/p 0:03:05 } +2024-07-26 01:11:14,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1501/ 1625], loss: 1.007, per_step_time: 1470ms, lr: 1.0052271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:14,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43922 samples/s/p 0:03:02 } +2024-07-26 01:11:17,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1503/ 1625], loss: 1.278, per_step_time: 1474ms, lr: 1.0050603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:17,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.42541 samples/s/p 0:02:59 } +2024-07-26 01:11:20,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1505/ 1625], loss: 1.297, per_step_time: 1472ms, lr: 1.0048986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:20,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43455 samples/s/p 0:02:56 } +2024-07-26 01:11:23,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1507/ 1625], loss: 1.339, per_step_time: 1471ms, lr: 1.0047371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:23,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43479 samples/s/p 0:02:53 } +2024-07-26 01:11:26,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1509/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 1.0045788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:26,010 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.42889 samples/s/p 0:02:50 } +2024-07-26 01:11:28,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1511/ 1625], loss: 1.417, per_step_time: 1471ms, lr: 1.0044242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:28,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43531 samples/s/p 0:02:47 } +2024-07-26 01:11:31,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1513/ 1625], loss: 1.030, per_step_time: 1470ms, lr: 1.0042712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:31,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.44138 samples/s/p 0:02:44 } +2024-07-26 01:11:34,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1515/ 1625], loss: 1.305, per_step_time: 1471ms, lr: 1.00412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:34,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43741 samples/s/p 0:02:41 } +2024-07-26 01:11:37,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1517/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 1.0039756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:37,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43790 samples/s/p 0:02:38 } +2024-07-26 01:11:40,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1519/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.0038295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 
01:11:40,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43760 samples/s/p 0:02:35 } +2024-07-26 01:11:43,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1521/ 1625], loss: 1.154, per_step_time: 1470ms, lr: 1.0036896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:43,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43892 samples/s/p 0:02:32 } +2024-07-26 01:11:46,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1523/ 1625], loss: 1.315, per_step_time: 1470ms, lr: 1.0035478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:46,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.44054 samples/s/p 0:02:29 } +2024-07-26 01:11:49,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1525/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 1.0034121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:49,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43409 samples/s/p 0:02:27 } +2024-07-26 01:11:52,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1527/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.0032782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:52,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43362 samples/s/p 0:02:24 } +2024-07-26 01:11:55,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1529/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 1.0031486e-06, overflow cond: False, loss_scale: 
1.0 +2024-07-26 01:11:55,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43579 samples/s/p 0:02:21 } +2024-07-26 01:11:58,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1531/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 1.0030188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:58,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43680 samples/s/p 0:02:18 } +2024-07-26 01:12:01,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1533/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.0028936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:01,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43541 samples/s/p 0:02:15 } +2024-07-26 01:12:04,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1535/ 1625], loss: 1.300, per_step_time: 1472ms, lr: 1.0027709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:04,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43432 samples/s/p 0:02:12 } +2024-07-26 01:12:07,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1537/ 1625], loss: 1.136, per_step_time: 1475ms, lr: 1.0026498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:07,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.42327 samples/s/p 0:02:09 } +2024-07-26 01:12:10,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1539/ 1625], loss: 1.204, per_step_time: 1470ms, lr: 1.0025315e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 01:12:10,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43934 samples/s/p 0:02:06 } +2024-07-26 01:12:13,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1541/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 1.0024182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:13,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43811 samples/s/p 0:02:03 } +2024-07-26 01:12:16,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1543/ 1625], loss: 1.210, per_step_time: 1475ms, lr: 1.0023033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:16,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.42202 samples/s/p 0:02:00 } +2024-07-26 01:12:19,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1545/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.0021944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:19,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43524 samples/s/p 0:01:57 } +2024-07-26 01:12:22,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1547/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 1.0020872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:22,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43276 samples/s/p 0:01:54 } +2024-07-26 01:12:25,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1549/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 1.0019844e-06, 
overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:25,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43358 samples/s/p 0:01:51 } +2024-07-26 01:12:27,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1551/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 1.0018815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:27,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43603 samples/s/p 0:01:48 } +2024-07-26 01:12:30,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1553/ 1625], loss: 1.234, per_step_time: 1470ms, lr: 1.0017839e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:30,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43936 samples/s/p 0:01:45 } +2024-07-26 01:12:33,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1555/ 1625], loss: 1.012, per_step_time: 1470ms, lr: 1.0016853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:33,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43995 samples/s/p 0:01:42 } +2024-07-26 01:12:36,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1557/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.0015929e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:36,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43295 samples/s/p 0:01:40 } +2024-07-26 01:12:39,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1559/ 1625], loss: 1.304, per_step_time: 1473ms, lr: 
1.0015021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:39,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43060 samples/s/p 0:01:37 } +2024-07-26 01:12:42,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1561/ 1625], loss: 1.253, per_step_time: 1470ms, lr: 1.0014131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:42,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.44202 samples/s/p 0:01:34 } +2024-07-26 01:12:45,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1563/ 1625], loss: 1.060, per_step_time: 1471ms, lr: 1.0013284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:45,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43570 samples/s/p 0:01:31 } +2024-07-26 01:12:48,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1565/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 1.0012462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:48,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43554 samples/s/p 0:01:28 } +2024-07-26 01:12:51,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1567/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 1.0011634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:51,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43757 samples/s/p 0:01:25 } +2024-07-26 01:12:54,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1569/ 1625], loss: 1.271, 
per_step_time: 1471ms, lr: 1.0010881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:54,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43521 samples/s/p 0:01:22 } +2024-07-26 01:12:57,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1571/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.001012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:57,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43628 samples/s/p 0:01:19 } +2024-07-26 01:13:00,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1573/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 1.0009412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:00,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43931 samples/s/p 0:01:16 } +2024-07-26 01:13:03,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1575/ 1625], loss: 1.268, per_step_time: 1472ms, lr: 1.0008712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:03,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43183 samples/s/p 0:01:13 } +2024-07-26 01:13:06,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1577/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 1.0008029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:06,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43684 samples/s/p 0:01:10 } +2024-07-26 01:13:09,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1579/ 
1625], loss: 1.054, per_step_time: 1472ms, lr: 1.000738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:09,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43471 samples/s/p 0:01:07 } +2024-07-26 01:13:12,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1581/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 1.0006768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:12,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43479 samples/s/p 0:01:04 } +2024-07-26 01:13:15,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1583/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.000618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:15,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43356 samples/s/p 0:01:01 } +2024-07-26 01:13:18,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1585/ 1625], loss: 1.182, per_step_time: 1470ms, lr: 1.0005626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:18,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.44017 samples/s/p 0:00:58 } +2024-07-26 01:13:21,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1587/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 1.0005091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:21,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43111 samples/s/p 0:00:55 } +2024-07-26 01:13:24,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], 
step:[ 1589/ 1625], loss: 1.180, per_step_time: 1470ms, lr: 1.000458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:24,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.44171 samples/s/p 0:00:52 } +2024-07-26 01:13:26,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1591/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 1.0004088e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:26,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43609 samples/s/p 0:00:50 } +2024-07-26 01:13:29,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1593/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 1.0003639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:29,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43599 samples/s/p 0:00:47 } +2024-07-26 01:13:32,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1595/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 1.0003206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:32,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43346 samples/s/p 0:00:44 } +2024-07-26 01:13:35,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1597/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 1.0002809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:35,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43564 samples/s/p 0:00:41 } +2024-07-26 01:13:38,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 10/ 10], step:[ 1599/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.0002437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:38,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43596 samples/s/p 0:00:38 } +2024-07-26 01:13:41,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1601/ 1625], loss: 1.187, per_step_time: 1473ms, lr: 1.0002083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:41,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.42907 samples/s/p 0:00:35 } +2024-07-26 01:13:44,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1603/ 1625], loss: 1.037, per_step_time: 1471ms, lr: 1.0001771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:44,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43665 samples/s/p 0:00:32 } +2024-07-26 01:13:47,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1605/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 1.0001469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:47,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43738 samples/s/p 0:00:29 } +2024-07-26 01:13:50,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1607/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 1.0001202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:50,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43121 samples/s/p 0:00:26 } +2024-07-26 01:13:53,545 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1609/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 1.0000967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:53,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43457 samples/s/p 0:00:23 } +2024-07-26 01:13:56,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1611/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.0000743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:56,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43583 samples/s/p 0:00:20 } +2024-07-26 01:13:59,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1613/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.0000579e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:59,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43397 samples/s/p 0:00:17 } +2024-07-26 01:14:02,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1615/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 1.0000398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:02,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.42743 samples/s/p 0:00:14 } +2024-07-26 01:14:05,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1617/ 1625], loss: 0.922, per_step_time: 1471ms, lr: 1.0000276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:05,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.43570 samples/s/p 0:00:11 } 
+2024-07-26 01:14:08,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1619/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 1.0000164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:08,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.43375 samples/s/p 0:00:08 } +2024-07-26 01:14:11,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1621/ 1625], loss: 1.082, per_step_time: 1473ms, lr: 1.0000086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:11,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.43057 samples/s/p 0:00:05 } +2024-07-26 01:14:14,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1623/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.0000026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:14,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.43297 samples/s/p 0:00:02 } +2024-07-26 01:14:17,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1625/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 1.0000009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:17,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |██████████████████████████████████████████████████| 5.43134 samples/s/p 0:00:00 } +2024-07-26 01:14:17,185 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-26 01:14:50,830 - mindformers[mindformers/trainer/base_trainer.py:779] - INFO - .........Training Over!............. 
diff --git "a/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\346\227\245\345\277\227\346\226\207\344\273\266/worker_2.log" "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\346\227\245\345\277\227\346\226\207\344\273\266/worker_2.log" new file mode 100644 index 00000000..4d485bd5 --- /dev/null +++ "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\346\227\245\345\277\227\346\226\207\344\273\266/worker_2.log" @@ -0,0 +1,16899 @@ +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. + return self._float_to_str(self.smallest_subnormal) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. 
+ return self._float_to_str(self.smallest_subnormal) +[WARNING] DISTRIBUTED(62198,ffff8ce2e010,python):2024-07-25-18:09:19.408.600 [mindspore/ccsrc/distributed/rpc/tcp/tcp_comm.cc:464] Connect] Waiting for the state of the connection to 127.0.0.1:8118 to be connected...Retry number: 1 +[WARNING] DISTRIBUTED(62198,ffff8ce2e010,python):2024-07-25-18:09:20.408.943 [mindspore/ccsrc/distributed/rpc/tcp/tcp_comm.cc:464] Connect] Waiting for the state of the connection to 127.0.0.1:8118 to be connected...Retry number: 2 +[WARNING] DISTRIBUTED(62198,ffff8ce2e010,python):2024-07-25-18:09:21.409.786 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:194] BuildCluster] Topology build timed out., retry(1/200). +[WARNING] DISTRIBUTED(62198,ffff8ce2e010,python):2024-07-25-18:09:24.409.947 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:196] BuildCluster] Cluster is successfully initialized. +[WARNING] DISTRIBUTED(62198,ffff8ce2e010,python):2024-07-25-18:09:24.410.266 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:260] PostProcess] This node 2 rank id: 2 +[WARNING] DISTRIBUTED(62198,ffff8ce2e010,python):2024-07-25-18:09:50.133.037 [mindspore/ccsrc/distributed/collective/collective_manager.cc:259] CreateCommunicationGroup] Start to create communication group: hccl_world_group [const vector]{0, 1, 2, 3} +[WARNING] DEVICE(62198,ffff8ce2e010,python):2024-07-25-18:09:50.133.634 [mindspore/ccsrc/plugin/device/cpu/hal/hardware/ms_collective_comm_lib.cc:200] QueryUniqueID] Retry to lookup the unique id for group hccl_world_group from the meta server node...Retry time: 199/200 +[WARNING] DISTRIBUTED(62198,ffff8ce2e010,python):2024-07-25-18:09:53.134.066 [mindspore/ccsrc/distributed/collective/collective_manager.cc:335] CreateCommunicationGroup] Begin initialize communication group on the device side: hccl_world_group +[WARNING] DISTRIBUTED(62198,ffff8ce2e010,python):2024-07-25-18:09:53.365.513 [mindspore/ccsrc/distributed/collective/collective_manager.cc:345] 
CreateCommunicationGroup] End initialize communication group on the device side: hccl_world_group +2024-07-25 18:09:53,368 - mindformers[mindformers/tools/utils.py:168] - INFO - set strategy path to './output/strategy/ckpt_strategy_rank_2.ckpt' +2024-07-25 18:09:53,402 - mindformers[mindformers/trainer/trainer.py:919] - INFO - Load configs in /home/ma-user/work/MindFormers/mindformers/configs/gpt2/run_gpt2.yaml to build trainer. +2024-07-25 18:09:53,403 - mindformers[mindformers/trainer/trainer.py:949] - INFO - ..........Init Config.......... +2024-07-25 18:09:53,403 - mindformers[mindformers/core/parallel_config.py:45] - INFO - initial recompute_config from dict: {'recompute': True, 'select_recompute': False, 'parallel_optimizer_comm_recompute': False, 'mp_comm_recompute': True, 'recompute_slice_activation': True} +2024-07-25 18:09:53,403 - mindformers[mindformers/core/parallel_config.py:51] - INFO - initial parallel_config from dict: {'data_parallel': 1, 'model_parallel': 4, 'pipeline_stage': 1, 'use_seq_parallel': False, 'micro_batch_num': 1, 'vocab_emb_dp': True, 'gradient_aggregation_group': 4} +2024-07-25 18:09:53,404 - mindformers[mindformers/tools/utils.py:153] - INFO - set output path to '/home/ma-user/work/MindFormers/mindformers/research/output' +2024-07-25 18:09:53,404 - mindformers[mindformers/trainer/base_trainer.py:85] - INFO - Now Running Task is: text_generation, Model is: llama3_8b +2024-07-25 18:09:53,405 - mindformers[mindformers/trainer/base_trainer.py:111] - WARNING - Input model name is not in the supported list or unspecified. 
+2024-07-25 18:09:53,405 - mindformers[mindformers/trainer/base_trainer.py:112] - WARNING - See the list of supported task and model name: ['baichuan2_13b', 'baichuan2_7b', 'baichuan_7b', 'bloom_176b', 'bloom_560m', 'bloom_65b', 'bloom_7.1b', 'codegeex2_6b', 'codellama_34b', 'common', 'deepseek_33b', 'glm2_6b', 'glm2_6b_lora', 'glm2_6b_ptuning2', 'glm3_6b', 'glm_6b', 'glm_6b_chat', 'glm_6b_lora', 'glm_6b_lora_chat', 'gpt2', 'gpt2_13b', 'gpt2_52b', 'gpt2_lora', 'gpt2_xl', 'gpt2_xl_lora', 'internlm_7b', 'internlm_7b_lora', 'llama2_13b', 'llama2_70b', 'llama2_7b', 'llama_13b', 'llama_65b', 'llama_7b', 'llama_7b_lora', 'pangualpha_13b', 'pangualpha_2_6b', 'qwen_7b', 'qwen_7b_lora', 'skywork_13b', 'yi_34b', 'yi_6b', 'ziya_13b'] +2024-07-25 18:09:53,405 - mindformers[mindformers/trainer/base_trainer.py:113] - WARNING - The default model config: /home/ma-user/work/MindFormers/mindformers/configs/gpt2/run_gpt2.yaml will now be used for the text_generation task +2024-07-25 18:09:53,405 - mindformers[mindformers/trainer/trainer.py:1004] - INFO - ..........Init Model.......... +2024-07-25 18:09:53,406 - mindformers[mindformers/trainer/trainer.py:1027] - INFO - ..........Init Train Dataset.......... +2024-07-25 18:09:53,406 - mindformers[mindformers/trainer/trainer.py:335] - INFO - ==========Trainer Init Success!========== +2024-07-25 18:09:53,406 - mindformers[mindformers/trainer/trainer.py:476] - WARNING - The `finetune_checkpoint` will be deprecated. Please use `resume_from_checkpoint` instead. +2024-07-25 18:09:53,406 - mindformers[mindformers/trainer/trainer.py:1004] - INFO - ..........Init Model.......... 
+2024-07-25 18:09:53,407 - mindformers[mindformers/trainer/base_trainer.py:176] - INFO - The current parallel mode is semi_auto_parallel, full batch is True,so global batch size will be changed: global_batch_size = batch_size * data_parallel * micro_batch_interleave_num * gradient_accumulation_steps = 32 = 32 * 1 * 1 * 1 +2024-07-25 18:09:53,407 - mindformers[mindformers/trainer/base_trainer.py:624] - INFO - .........Build Dataset For Train.......... +2024-07-25 18:09:53,407 - mindformers[mindformers/trainer/base_trainer.py:353] - INFO - .........Build Dataset From Config.......... +2024-07-25 18:09:53,407 - mindformers[mindformers/dataset/causal_language_model_dataset.py:166] - INFO - Now Create Causal Language Model Dataset. +2024-07-25 18:09:53,413 - mindformers[mindformers/trainer/base_trainer.py:626] - INFO - Create train dataset finish, dataset size:1625 +2024-07-25 18:09:53,414 - mindformers[mindformers/trainer/utils.py:171] - INFO - Will be Training epochs:10, sink_size:2 +2024-07-25 18:09:53,414 - mindformers[mindformers/trainer/utils.py:173] - INFO - Create training dataset finish, dataset size:1625 +2024-07-25 18:09:53,414 - mindformers[mindformers/trainer/base_trainer.py:656] - INFO - .........Build Net For Train.......... +2024-07-25 18:09:53,415 - mindformers[mindformers/trainer/base_trainer.py:387] - INFO - .........Build Network From Config.......... +2024-07-25 18:09:53,415 - mindformers[mindformers/version_control.py:61] - INFO - The Cell Reuse compilation acceleration feature is not supported when the environment variable ENABLE_CELL_REUSE is 0 or MindSpore version is earlier than 2.1.0 or stand_alone mode or pipeline_stages <= 1 +2024-07-25 18:09:53,416 - mindformers[mindformers/version_control.py:65] - INFO - +The current ENABLE_CELL_REUSE=0, please set the environment variable as follows: +export ENABLE_CELL_REUSE=1 to enable the Cell Reuse compilation acceleration feature. 
+2024-07-25 18:09:53,416 - mindformers[mindformers/version_control.py:74] - INFO - The Cell Reuse compilation acceleration feature only works in pipeline parallel mode(pipeline_stage>1).Current pipeline stage=1, the feature is disabled by default. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:09:53.418.031 [/home/ma-user/work/MindFormers/mindformers/mindformers/modules/transformer/op_parallel_config.py:244] The optimizer shard True in auto_parallel_context is not equal to the optimizer_shard None in the OpParallelConfig. Please check the optimizer_shard to make them consistent. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:09:53.420.624 [/home/ma-user/work/MindFormers/mindformers/mindformers/modules/transformer/op_parallel_config.py:244] The optimizer shard True in auto_parallel_context is not equal to the optimizer_shard None in the OpParallelConfig. Please check the optimizer_shard to make them consistent. +2024-07-25 18:09:53,522 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:09:53.523.963 [mindspore/common/_decorator.py:40] 'Parameter' is deprecated from version 2.3 and will be removed in a future version, use 'add_pipeline_stage' instead. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:09:53.524.096 [mindspore/common/parameter.py:806] This interface may be deleted in the future. 
+2024-07-25 18:09:53,544 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,565 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,586 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,607 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,628 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,648 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,669 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,690 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,711 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:54,181 - mindformers[mindformers/models/modeling_utils.py:1438] - INFO - model built, but weights is unloaded, since the config has no checkpoint_name_or_path attribute or checkpoint_name_or_path is None. +2024-07-25 18:09:54,377 - mindformers[mindformers/models/modeling_utils.py:1438] - INFO - model built, but weights is unloaded, since the config has no checkpoint_name_or_path attribute or checkpoint_name_or_path is None. +2024-07-25 18:09:54,400 - mindformers[mindformers/trainer/base_trainer.py:543] - INFO - Network Parameters: 3407872. +2024-07-25 18:09:54,400 - mindformers[mindformers/trainer/base_trainer.py:678] - INFO - .........Build Optimizer For Train.......... 
+2024-07-25 18:09:54,400 - mindformers[mindformers/trainer/base_trainer.py:426] - INFO - .........Build Optimizer From Config.......... +2024-07-25 18:09:54,400 - mindformers[mindformers/trainer/base_trainer.py:459] - INFO - .........Build LR Schedule From Config.......... +2024-07-25 18:09:54,406 - mindformers[mindformers/trainer/optimizer_grouped_parameters.py:74] - WARNING - dynamic_lr_schedule will be reset and invalid when layer_scale is False. +2024-07-25 18:09:54,409 - mindformers[mindformers/trainer/optimizer_grouped_parameters.py:113] - INFO - Param groups = { + "decay": { + "weight_decay": 0.0, + "params": [ + "model.layers.0.attention.wq.mindpet_delta_lora_a", + "model.layers.0.attention.wq.mindpet_delta_lora_b", + "model.layers.0.attention.wv.mindpet_delta_lora_a", + "model.layers.0.attention.wv.mindpet_delta_lora_b", + "model.layers.1.attention.wq.mindpet_delta_lora_a", + "model.layers.1.attention.wq.mindpet_delta_lora_b", + "model.layers.1.attention.wv.mindpet_delta_lora_a", + "model.layers.1.attention.wv.mindpet_delta_lora_b", + "model.layers.2.attention.wq.mindpet_delta_lora_a", + "model.layers.2.attention.wq.mindpet_delta_lora_b", + "model.layers.2.attention.wv.mindpet_delta_lora_a", + "model.layers.2.attention.wv.mindpet_delta_lora_b", + "model.layers.3.attention.wq.mindpet_delta_lora_a", + "model.layers.3.attention.wq.mindpet_delta_lora_b", + "model.layers.3.attention.wv.mindpet_delta_lora_a", + "model.layers.3.attention.wv.mindpet_delta_lora_b", + "model.layers.4.attention.wq.mindpet_delta_lora_a", + "model.layers.4.attention.wq.mindpet_delta_lora_b", + "model.layers.4.attention.wv.mindpet_delta_lora_a", + "model.layers.4.attention.wv.mindpet_delta_lora_b", + "model.layers.5.attention.wq.mindpet_delta_lora_a", + "model.layers.5.attention.wq.mindpet_delta_lora_b", + "model.layers.5.attention.wv.mindpet_delta_lora_a", + "model.layers.5.attention.wv.mindpet_delta_lora_b", + "model.layers.6.attention.wq.mindpet_delta_lora_a", + 
"model.layers.6.attention.wq.mindpet_delta_lora_b", + "model.layers.6.attention.wv.mindpet_delta_lora_a", + "model.layers.6.attention.wv.mindpet_delta_lora_b", + "model.layers.7.attention.wq.mindpet_delta_lora_a", + "model.layers.7.attention.wq.mindpet_delta_lora_b", + "model.layers.7.attention.wv.mindpet_delta_lora_a", + "model.layers.7.attention.wv.mindpet_delta_lora_b", + "model.layers.8.attention.wq.mindpet_delta_lora_a", + "model.layers.8.attention.wq.mindpet_delta_lora_b", + "model.layers.8.attention.wv.mindpet_delta_lora_a", + "model.layers.8.attention.wv.mindpet_delta_lora_b", + "model.layers.9.attention.wq.mindpet_delta_lora_a", + "model.layers.9.attention.wq.mindpet_delta_lora_b", + "model.layers.9.attention.wv.mindpet_delta_lora_a", + "model.layers.9.attention.wv.mindpet_delta_lora_b", + "model.layers.10.attention.wq.mindpet_delta_lora_a", + "model.layers.10.attention.wq.mindpet_delta_lora_b", + "model.layers.10.attention.wv.mindpet_delta_lora_a", + "model.layers.10.attention.wv.mindpet_delta_lora_b", + "model.layers.11.attention.wq.mindpet_delta_lora_a", + "model.layers.11.attention.wq.mindpet_delta_lora_b", + "model.layers.11.attention.wv.mindpet_delta_lora_a", + "model.layers.11.attention.wv.mindpet_delta_lora_b", + "model.layers.12.attention.wq.mindpet_delta_lora_a", + "model.layers.12.attention.wq.mindpet_delta_lora_b", + "model.layers.12.attention.wv.mindpet_delta_lora_a", + "model.layers.12.attention.wv.mindpet_delta_lora_b", + "model.layers.13.attention.wq.mindpet_delta_lora_a", + "model.layers.13.attention.wq.mindpet_delta_lora_b", + "model.layers.13.attention.wv.mindpet_delta_lora_a", + "model.layers.13.attention.wv.mindpet_delta_lora_b", + "model.layers.14.attention.wq.mindpet_delta_lora_a", + "model.layers.14.attention.wq.mindpet_delta_lora_b", + "model.layers.14.attention.wv.mindpet_delta_lora_a", + "model.layers.14.attention.wv.mindpet_delta_lora_b", + "model.layers.15.attention.wq.mindpet_delta_lora_a", + 
"model.layers.15.attention.wq.mindpet_delta_lora_b", + "model.layers.15.attention.wv.mindpet_delta_lora_a", + "model.layers.15.attention.wv.mindpet_delta_lora_b", + "model.layers.16.attention.wq.mindpet_delta_lora_a", + "model.layers.16.attention.wq.mindpet_delta_lora_b", + "model.layers.16.attention.wv.mindpet_delta_lora_a", + "model.layers.16.attention.wv.mindpet_delta_lora_b", + "model.layers.17.attention.wq.mindpet_delta_lora_a", + "model.layers.17.attention.wq.mindpet_delta_lora_b", + "model.layers.17.attention.wv.mindpet_delta_lora_a", + "model.layers.17.attention.wv.mindpet_delta_lora_b", + "model.layers.18.attention.wq.mindpet_delta_lora_a", + "model.layers.18.attention.wq.mindpet_delta_lora_b", + "model.layers.18.attention.wv.mindpet_delta_lora_a", + "model.layers.18.attention.wv.mindpet_delta_lora_b", + "model.layers.19.attention.wq.mindpet_delta_lora_a", + "model.layers.19.attention.wq.mindpet_delta_lora_b", + "model.layers.19.attention.wv.mindpet_delta_lora_a", + "model.layers.19.attention.wv.mindpet_delta_lora_b", + "model.layers.20.attention.wq.mindpet_delta_lora_a", + "model.layers.20.attention.wq.mindpet_delta_lora_b", + "model.layers.20.attention.wv.mindpet_delta_lora_a", + "model.layers.20.attention.wv.mindpet_delta_lora_b", + "model.layers.21.attention.wq.mindpet_delta_lora_a", + "model.layers.21.attention.wq.mindpet_delta_lora_b", + "model.layers.21.attention.wv.mindpet_delta_lora_a", + "model.layers.21.attention.wv.mindpet_delta_lora_b", + "model.layers.22.attention.wq.mindpet_delta_lora_a", + "model.layers.22.attention.wq.mindpet_delta_lora_b", + "model.layers.22.attention.wv.mindpet_delta_lora_a", + "model.layers.22.attention.wv.mindpet_delta_lora_b", + "model.layers.23.attention.wq.mindpet_delta_lora_a", + "model.layers.23.attention.wq.mindpet_delta_lora_b", + "model.layers.23.attention.wv.mindpet_delta_lora_a", + "model.layers.23.attention.wv.mindpet_delta_lora_b", + "model.layers.24.attention.wq.mindpet_delta_lora_a", + 
"model.layers.24.attention.wq.mindpet_delta_lora_b", + "model.layers.24.attention.wv.mindpet_delta_lora_a", + "model.layers.24.attention.wv.mindpet_delta_lora_b", + "model.layers.25.attention.wq.mindpet_delta_lora_a", + "model.layers.25.attention.wq.mindpet_delta_lora_b", + "model.layers.25.attention.wv.mindpet_delta_lora_a", + "model.layers.25.attention.wv.mindpet_delta_lora_b", + "model.layers.26.attention.wq.mindpet_delta_lora_a", + "model.layers.26.attention.wq.mindpet_delta_lora_b", + "model.layers.26.attention.wv.mindpet_delta_lora_a", + "model.layers.26.attention.wv.mindpet_delta_lora_b", + "model.layers.27.attention.wq.mindpet_delta_lora_a", + "model.layers.27.attention.wq.mindpet_delta_lora_b", + "model.layers.27.attention.wv.mindpet_delta_lora_a", + "model.layers.27.attention.wv.mindpet_delta_lora_b", + "model.layers.28.attention.wq.mindpet_delta_lora_a", + "model.layers.28.attention.wq.mindpet_delta_lora_b", + "model.layers.28.attention.wv.mindpet_delta_lora_a", + "model.layers.28.attention.wv.mindpet_delta_lora_b", + "model.layers.29.attention.wq.mindpet_delta_lora_a", + "model.layers.29.attention.wq.mindpet_delta_lora_b", + "model.layers.29.attention.wv.mindpet_delta_lora_a", + "model.layers.29.attention.wv.mindpet_delta_lora_b", + "model.layers.30.attention.wq.mindpet_delta_lora_a", + "model.layers.30.attention.wq.mindpet_delta_lora_b", + "model.layers.30.attention.wv.mindpet_delta_lora_a", + "model.layers.30.attention.wv.mindpet_delta_lora_b", + "model.layers.31.attention.wq.mindpet_delta_lora_a", + "model.layers.31.attention.wq.mindpet_delta_lora_b", + "model.layers.31.attention.wv.mindpet_delta_lora_a", + "model.layers.31.attention.wv.mindpet_delta_lora_b" + ] + } +} +2024-07-25 18:09:54,509 - mindformers[mindformers/trainer/base_trainer.py:683] - INFO - .........Build Running Wrapper From Config For Train.......... 
+2024-07-25 18:09:54,509 - mindformers[mindformers/trainer/base_trainer.py:496] - INFO - .........Build Model Wrapper for Train From Config.......... +2024-07-25 18:09:54,515 - mindformers[mindformers/trainer/base_trainer.py:687] - INFO - .........Build Callbacks For Train.......... +2024-07-25 18:09:54,517 - mindformers[mindformers/core/callback/callback.py:533] - INFO - Integrated_save is changed to False when using auto_parallel. +2024-07-25 18:09:54,518 - mindformers[mindformers/trainer/base_trainer.py:721] - INFO - .........Starting Init Train Model.......... +2024-07-25 18:09:54,519 - mindformers[mindformers/trainer/utils.py:736] - INFO - ............Start load checkpoint from checkpoint............ +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:19.684.610 [mindspore/train/serialization.py:1369] model.tok_embeddings.embedding_weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:24.760.489 [mindspore/train/serialization.py:1369] model.layers.0.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:24.761.490 [mindspore/train/serialization.py:1369] model.layers.0.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:24.762.077 [mindspore/train/serialization.py:1369] model.layers.0.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:24.909.834 [mindspore/train/serialization.py:1369] model.layers.0.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:24.951.283 [mindspore/train/serialization.py:1369] model.layers.0.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:25.240.3 [mindspore/train/serialization.py:1369] model.layers.0.attention.wo.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:25.165.445 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:25.755.568 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:26.347.595 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:26.937.803 [mindspore/train/serialization.py:1369] model.layers.1.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:26.938.672 [mindspore/train/serialization.py:1369] model.layers.1.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:26.939.120 [mindspore/train/serialization.py:1369] model.layers.1.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:27.103.877 [mindspore/train/serialization.py:1369] model.layers.1.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:27.146.524 [mindspore/train/serialization.py:1369] model.layers.1.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:27.189.272 [mindspore/train/serialization.py:1369] model.layers.1.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:27.354.871 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w1.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:27.929.600 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:28.512.984 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:29.892.64 [mindspore/train/serialization.py:1369] model.layers.2.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:29.901.03 [mindspore/train/serialization.py:1369] model.layers.2.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:29.905.51 [mindspore/train/serialization.py:1369] model.layers.2.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:29.265.931 [mindspore/train/serialization.py:1369] model.layers.2.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:29.420.887 [mindspore/train/serialization.py:1369] model.layers.2.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:29.494.302 [mindspore/train/serialization.py:1369] model.layers.2.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:29.668.412 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:30.250.209 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w2.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:30.834.360 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:31.404.507 [mindspore/train/serialization.py:1369] model.layers.3.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:31.405.338 [mindspore/train/serialization.py:1369] model.layers.3.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:31.405.786 [mindspore/train/serialization.py:1369] model.layers.3.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:31.582.628 [mindspore/train/serialization.py:1369] model.layers.3.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:31.626.832 [mindspore/train/serialization.py:1369] model.layers.3.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:31.671.225 [mindspore/train/serialization.py:1369] model.layers.3.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:31.849.982 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:32.420.342 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:32.994.260 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:33.581.223 [mindspore/train/serialization.py:1369] model.layers.4.ffn_norm.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:33.587.457 [mindspore/train/serialization.py:1369] model.layers.4.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:33.588.058 [mindspore/train/serialization.py:1369] model.layers.4.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:33.755.172 [mindspore/train/serialization.py:1369] model.layers.4.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:33.798.540 [mindspore/train/serialization.py:1369] model.layers.4.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:33.839.579 [mindspore/train/serialization.py:1369] model.layers.4.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:34.657.5 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:34.589.917 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:35.175.836 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:35.832.092 [mindspore/train/serialization.py:1369] model.layers.5.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:35.833.089 [mindspore/train/serialization.py:1369] model.layers.5.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:35.833.610 [mindspore/train/serialization.py:1369] model.layers.5.attention.wq.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:36.825.2 [mindspore/train/serialization.py:1369] model.layers.5.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:36.487.25 [mindspore/train/serialization.py:1369] model.layers.5.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:36.898.06 [mindspore/train/serialization.py:1369] model.layers.5.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:36.272.657 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:36.853.805 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:37.494.683 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:38.922.93 [mindspore/train/serialization.py:1369] model.layers.6.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:38.932.71 [mindspore/train/serialization.py:1369] model.layers.6.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:38.937.89 [mindspore/train/serialization.py:1369] model.layers.6.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:38.275.592 [mindspore/train/serialization.py:1369] model.layers.6.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:38.316.895 [mindspore/train/serialization.py:1369] model.layers.6.attention.wv.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:38.356.601 [mindspore/train/serialization.py:1369] model.layers.6.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:38.534.781 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:39.134.929 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:39.724.438 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:40.314.008 [mindspore/train/serialization.py:1369] model.layers.7.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:40.314.872 [mindspore/train/serialization.py:1369] model.layers.7.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:40.315.413 [mindspore/train/serialization.py:1369] model.layers.7.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:40.493.285 [mindspore/train/serialization.py:1369] model.layers.7.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:40.538.046 [mindspore/train/serialization.py:1369] model.layers.7.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:40.586.422 [mindspore/train/serialization.py:1369] model.layers.7.attention.wo.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:40.767.369 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:41.345.473 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:41.961.505 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:42.620.899 [mindspore/train/serialization.py:1369] model.layers.8.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:42.622.000 [mindspore/train/serialization.py:1369] model.layers.8.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:42.622.552 [mindspore/train/serialization.py:1369] model.layers.8.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:42.799.486 [mindspore/train/serialization.py:1369] model.layers.8.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:42.879.104 [mindspore/train/serialization.py:1369] model.layers.8.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:42.927.957 [mindspore/train/serialization.py:1369] model.layers.8.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:43.162.522 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w1.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:43.770.662 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:44.359.441 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:44.966.234 [mindspore/train/serialization.py:1369] model.layers.9.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:44.967.337 [mindspore/train/serialization.py:1369] model.layers.9.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:44.967.870 [mindspore/train/serialization.py:1369] model.layers.9.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:45.143.066 [mindspore/train/serialization.py:1369] model.layers.9.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:45.195.564 [mindspore/train/serialization.py:1369] model.layers.9.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:45.245.747 [mindspore/train/serialization.py:1369] model.layers.9.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:45.415.811 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:45.997.200 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w2.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:46.594.404 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:47.193.479 [mindspore/train/serialization.py:1369] model.layers.10.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:47.194.443 [mindspore/train/serialization.py:1369] model.layers.10.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:47.194.998 [mindspore/train/serialization.py:1369] model.layers.10.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:47.364.472 [mindspore/train/serialization.py:1369] model.layers.10.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:47.411.076 [mindspore/train/serialization.py:1369] model.layers.10.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:47.460.699 [mindspore/train/serialization.py:1369] model.layers.10.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:47.639.334 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:48.240.783 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:48.831.108 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w3.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:49.463.611 [mindspore/train/serialization.py:1369] model.layers.11.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:49.464.430 [mindspore/train/serialization.py:1369] model.layers.11.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:49.464.993 [mindspore/train/serialization.py:1369] model.layers.11.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:49.640.329 [mindspore/train/serialization.py:1369] model.layers.11.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:49.689.269 [mindspore/train/serialization.py:1369] model.layers.11.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:49.733.948 [mindspore/train/serialization.py:1369] model.layers.11.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:49.912.367 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:50.488.268 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:51.552.92 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:51.656.327 [mindspore/train/serialization.py:1369] model.layers.12.ffn_norm.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:51.657.395 [mindspore/train/serialization.py:1369] model.layers.12.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:51.657.964 [mindspore/train/serialization.py:1369] model.layers.12.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:51.869.959 [mindspore/train/serialization.py:1369] model.layers.12.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:51.918.369 [mindspore/train/serialization.py:1369] model.layers.12.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:51.966.996 [mindspore/train/serialization.py:1369] model.layers.12.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:52.142.040 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:52.718.658 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:53.331.668 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:53.925.077 [mindspore/train/serialization.py:1369] model.layers.13.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:53.926.521 [mindspore/train/serialization.py:1369] model.layers.13.attention_norm.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:53.927.137 [mindspore/train/serialization.py:1369] model.layers.13.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:54.126.432 [mindspore/train/serialization.py:1369] model.layers.13.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:54.202.583 [mindspore/train/serialization.py:1369] model.layers.13.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:54.259.483 [mindspore/train/serialization.py:1369] model.layers.13.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:54.499.081 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:55.116.296 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:55.731.088 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:56.331.906 [mindspore/train/serialization.py:1369] model.layers.14.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:56.332.895 [mindspore/train/serialization.py:1369] model.layers.14.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:56.333.437 [mindspore/train/serialization.py:1369] model.layers.14.attention.wq.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:56.517.071 [mindspore/train/serialization.py:1369] model.layers.14.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:56.568.406 [mindspore/train/serialization.py:1369] model.layers.14.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:56.640.237 [mindspore/train/serialization.py:1369] model.layers.14.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:56.817.476 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:57.403.810 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:57.978.079 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:58.545.487 [mindspore/train/serialization.py:1369] model.layers.15.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:58.546.499 [mindspore/train/serialization.py:1369] model.layers.15.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:58.547.053 [mindspore/train/serialization.py:1369] model.layers.15.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:58.718.418 [mindspore/train/serialization.py:1369] model.layers.15.attention.wk.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:58.767.617 [mindspore/train/serialization.py:1369] model.layers.15.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:58.816.696 [mindspore/train/serialization.py:1369] model.layers.15.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:58.994.577 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:11:59.580.796 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:00.165.681 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:00.755.545 [mindspore/train/serialization.py:1369] model.layers.16.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:00.756.483 [mindspore/train/serialization.py:1369] model.layers.16.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:00.757.097 [mindspore/train/serialization.py:1369] model.layers.16.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:00.937.549 [mindspore/train/serialization.py:1369] model.layers.16.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:00.991.096 [mindspore/train/serialization.py:1369] model.layers.16.attention.wv.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:01.403.77 [mindspore/train/serialization.py:1369] model.layers.16.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:01.228.492 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:01.813.041 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:02.395.162 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:02.978.571 [mindspore/train/serialization.py:1369] model.layers.17.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:02.979.501 [mindspore/train/serialization.py:1369] model.layers.17.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:02.980.024 [mindspore/train/serialization.py:1369] model.layers.17.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:03.157.544 [mindspore/train/serialization.py:1369] model.layers.17.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:03.206.545 [mindspore/train/serialization.py:1369] model.layers.17.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:03.258.064 [mindspore/train/serialization.py:1369] model.layers.17.attention.wo.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:03.435.386 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:04.228.28 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:04.616.499 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:05.196.398 [mindspore/train/serialization.py:1369] model.layers.18.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:05.197.310 [mindspore/train/serialization.py:1369] model.layers.18.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:05.197.847 [mindspore/train/serialization.py:1369] model.layers.18.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:05.376.958 [mindspore/train/serialization.py:1369] model.layers.18.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:05.429.028 [mindspore/train/serialization.py:1369] model.layers.18.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:05.479.034 [mindspore/train/serialization.py:1369] model.layers.18.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:05.654.421 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w1.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:06.497.944 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:07.642.07 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:07.674.906 [mindspore/train/serialization.py:1369] model.layers.19.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:07.675.777 [mindspore/train/serialization.py:1369] model.layers.19.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:07.676.217 [mindspore/train/serialization.py:1369] model.layers.19.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:07.898.541 [mindspore/train/serialization.py:1369] model.layers.19.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:07.969.065 [mindspore/train/serialization.py:1369] model.layers.19.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:08.421.74 [mindspore/train/serialization.py:1369] model.layers.19.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:08.216.752 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:08.868.124 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w2.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:09.456.642 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:10.681.54 [mindspore/train/serialization.py:1369] model.layers.20.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:10.693.85 [mindspore/train/serialization.py:1369] model.layers.20.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:10.699.47 [mindspore/train/serialization.py:1369] model.layers.20.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:10.275.649 [mindspore/train/serialization.py:1369] model.layers.20.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:10.327.477 [mindspore/train/serialization.py:1369] model.layers.20.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:10.377.797 [mindspore/train/serialization.py:1369] model.layers.20.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:10.560.819 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:11.180.794 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:11.785.226 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w3.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:12.398.379 [mindspore/train/serialization.py:1369] model.layers.21.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:12.399.331 [mindspore/train/serialization.py:1369] model.layers.21.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:12.399.795 [mindspore/train/serialization.py:1369] model.layers.21.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:12.581.171 [mindspore/train/serialization.py:1369] model.layers.21.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:12.634.495 [mindspore/train/serialization.py:1369] model.layers.21.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:12.684.851 [mindspore/train/serialization.py:1369] model.layers.21.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:12.867.840 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:13.488.057 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:14.977.97 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:14.682.630 [mindspore/train/serialization.py:1369] model.layers.22.ffn_norm.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:14.683.467 [mindspore/train/serialization.py:1369] model.layers.22.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:14.683.905 [mindspore/train/serialization.py:1369] model.layers.22.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:14.859.083 [mindspore/train/serialization.py:1369] model.layers.22.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:14.912.003 [mindspore/train/serialization.py:1369] model.layers.22.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:14.963.722 [mindspore/train/serialization.py:1369] model.layers.22.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:15.155.379 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:15.751.539 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:16.327.795 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:16.935.807 [mindspore/train/serialization.py:1369] model.layers.23.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:16.936.736 [mindspore/train/serialization.py:1369] model.layers.23.attention_norm.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:16.937.223 [mindspore/train/serialization.py:1369] model.layers.23.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:17.156.004 [mindspore/train/serialization.py:1369] model.layers.23.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:17.218.163 [mindspore/train/serialization.py:1369] model.layers.23.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:17.270.604 [mindspore/train/serialization.py:1369] model.layers.23.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:17.489.383 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:18.782.46 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:18.665.452 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:19.249.207 [mindspore/train/serialization.py:1369] model.layers.24.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:19.250.358 [mindspore/train/serialization.py:1369] model.layers.24.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:19.250.838 [mindspore/train/serialization.py:1369] model.layers.24.attention.wq.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:19.450.244 [mindspore/train/serialization.py:1369] model.layers.24.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:19.506.307 [mindspore/train/serialization.py:1369] model.layers.24.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:19.557.034 [mindspore/train/serialization.py:1369] model.layers.24.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:19.749.404 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:20.356.368 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:20.953.048 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:21.540.700 [mindspore/train/serialization.py:1369] model.layers.25.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:21.542.009 [mindspore/train/serialization.py:1369] model.layers.25.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:21.542.522 [mindspore/train/serialization.py:1369] model.layers.25.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:21.737.713 [mindspore/train/serialization.py:1369] model.layers.25.attention.wk.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:21.787.310 [mindspore/train/serialization.py:1369] model.layers.25.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:21.840.012 [mindspore/train/serialization.py:1369] model.layers.25.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:22.310.88 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:22.650.165 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:23.241.650 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:23.794.692 [mindspore/train/serialization.py:1369] model.layers.26.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:23.795.653 [mindspore/train/serialization.py:1369] model.layers.26.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:23.796.180 [mindspore/train/serialization.py:1369] model.layers.26.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:23.972.189 [mindspore/train/serialization.py:1369] model.layers.26.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:24.473.11 [mindspore/train/serialization.py:1369] model.layers.26.attention.wv.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:24.948.89 [mindspore/train/serialization.py:1369] model.layers.26.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:24.276.596 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:24.910.630 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:25.513.209 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:26.144.078 [mindspore/train/serialization.py:1369] model.layers.27.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:26.144.990 [mindspore/train/serialization.py:1369] model.layers.27.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:26.145.509 [mindspore/train/serialization.py:1369] model.layers.27.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:26.371.210 [mindspore/train/serialization.py:1369] model.layers.27.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:26.446.820 [mindspore/train/serialization.py:1369] model.layers.27.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:26.495.705 [mindspore/train/serialization.py:1369] model.layers.27.attention.wo.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:26.680.453 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:27.271.021 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:27.850.059 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:28.435.718 [mindspore/train/serialization.py:1369] model.layers.28.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:28.436.700 [mindspore/train/serialization.py:1369] model.layers.28.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:28.437.333 [mindspore/train/serialization.py:1369] model.layers.28.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:28.636.989 [mindspore/train/serialization.py:1369] model.layers.28.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:28.687.979 [mindspore/train/serialization.py:1369] model.layers.28.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:28.735.330 [mindspore/train/serialization.py:1369] model.layers.28.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:28.916.505 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w1.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:29.491.820 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:30.789.36 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:30.706.494 [mindspore/train/serialization.py:1369] model.layers.29.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:30.707.425 [mindspore/train/serialization.py:1369] model.layers.29.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:30.707.930 [mindspore/train/serialization.py:1369] model.layers.29.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:30.889.126 [mindspore/train/serialization.py:1369] model.layers.29.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:30.959.507 [mindspore/train/serialization.py:1369] model.layers.29.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:31.131.49 [mindspore/train/serialization.py:1369] model.layers.29.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:31.216.832 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:31.851.095 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w2.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:32.450.761 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:33.344.97 [mindspore/train/serialization.py:1369] model.layers.30.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:33.353.97 [mindspore/train/serialization.py:1369] model.layers.30.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:33.358.99 [mindspore/train/serialization.py:1369] model.layers.30.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:33.240.474 [mindspore/train/serialization.py:1369] model.layers.30.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:33.293.932 [mindspore/train/serialization.py:1369] model.layers.30.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:33.343.891 [mindspore/train/serialization.py:1369] model.layers.30.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:33.551.003 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:34.152.657 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:34.789.811 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w3.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:35.388.922 [mindspore/train/serialization.py:1369] model.layers.31.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:35.389.926 [mindspore/train/serialization.py:1369] model.layers.31.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:35.390.443 [mindspore/train/serialization.py:1369] model.layers.31.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:35.575.589 [mindspore/train/serialization.py:1369] model.layers.31.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:35.625.952 [mindspore/train/serialization.py:1369] model.layers.31.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:35.675.964 [mindspore/train/serialization.py:1369] model.layers.31.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:35.858.133 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:36.450.343 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:37.393.66 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:37.618.724 [mindspore/train/serialization.py:1369] model.norm_out.weight is not init while load ckpt. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:12:37.619.713 [mindspore/train/serialization.py:1369] lm_head.weight is not init while load ckpt. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:13:02.731.246 [mindspore/train/serialization.py:195] The type of model.layers.0.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:13:02.735.490 [mindspore/train/serialization.py:195] The type of model.layers.0.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:13:09.899.086 [mindspore/train/serialization.py:195] The type of model.layers.1.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:13:09.902.840 [mindspore/train/serialization.py:195] The type of model.layers.1.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:13:17.520. [mindspore/train/serialization.py:195] The type of model.layers.2.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:13:17.431.0 [mindspore/train/serialization.py:195] The type of model.layers.2.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:13:23.996.251 [mindspore/train/serialization.py:195] The type of model.layers.3.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:13:24.359. [mindspore/train/serialization.py:195] The type of model.layers.3.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:13:31.459.16 [mindspore/train/serialization.py:195] The type of model.layers.4.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:13:31.497.72 [mindspore/train/serialization.py:195] The type of model.layers.4.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:13:38.649.67 [mindspore/train/serialization.py:195] The type of model.layers.5.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:13:38.687.86 [mindspore/train/serialization.py:195] The type of model.layers.5.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:13:45.745.05 [mindspore/train/serialization.py:195] The type of model.layers.6.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:13:45.784.03 [mindspore/train/serialization.py:195] The type of model.layers.6.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:13:52.482.81 [mindspore/train/serialization.py:195] The type of model.layers.7.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:13:52.521.75 [mindspore/train/serialization.py:195] The type of model.layers.7.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:13:59.754.13 [mindspore/train/serialization.py:195] The type of model.layers.8.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:13:59.792.15 [mindspore/train/serialization.py:195] The type of model.layers.8.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:14:06.864.67 [mindspore/train/serialization.py:195] The type of model.layers.9.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:14:06.902.34 [mindspore/train/serialization.py:195] The type of model.layers.9.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:14:13.123.885 [mindspore/train/serialization.py:195] The type of model.layers.10.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:14:13.127.666 [mindspore/train/serialization.py:195] The type of model.layers.10.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:14:20.173.952 [mindspore/train/serialization.py:195] The type of model.layers.11.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:14:20.177.915 [mindspore/train/serialization.py:195] The type of model.layers.11.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:14:27.293.326 [mindspore/train/serialization.py:195] The type of model.layers.12.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:14:27.297.313 [mindspore/train/serialization.py:195] The type of model.layers.12.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:14:34.344.019 [mindspore/train/serialization.py:195] The type of model.layers.13.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:14:34.347.907 [mindspore/train/serialization.py:195] The type of model.layers.13.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:14:41.401.786 [mindspore/train/serialization.py:195] The type of model.layers.14.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:14:41.405.682 [mindspore/train/serialization.py:195] The type of model.layers.14.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:14:48.417.622 [mindspore/train/serialization.py:195] The type of model.layers.15.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:14:48.421.520 [mindspore/train/serialization.py:195] The type of model.layers.15.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:14:55.511.848 [mindspore/train/serialization.py:195] The type of model.layers.16.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:14:55.515.659 [mindspore/train/serialization.py:195] The type of model.layers.16.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:15:02.584.863 [mindspore/train/serialization.py:195] The type of model.layers.17.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:15:02.588.675 [mindspore/train/serialization.py:195] The type of model.layers.17.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:15:09.577.437 [mindspore/train/serialization.py:195] The type of model.layers.18.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:15:09.581.533 [mindspore/train/serialization.py:195] The type of model.layers.18.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:15:16.631.624 [mindspore/train/serialization.py:195] The type of model.layers.19.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:15:16.635.539 [mindspore/train/serialization.py:195] The type of model.layers.19.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:15:23.639.659 [mindspore/train/serialization.py:195] The type of model.layers.20.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:15:23.643.569 [mindspore/train/serialization.py:195] The type of model.layers.20.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:15:30.683.902 [mindspore/train/serialization.py:195] The type of model.layers.21.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:15:30.687.822 [mindspore/train/serialization.py:195] The type of model.layers.21.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:15:37.719.448 [mindspore/train/serialization.py:195] The type of model.layers.22.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:15:37.723.535 [mindspore/train/serialization.py:195] The type of model.layers.22.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:15:44.813.015 [mindspore/train/serialization.py:195] The type of model.layers.23.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:15:44.816.840 [mindspore/train/serialization.py:195] The type of model.layers.23.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:15:51.888.208 [mindspore/train/serialization.py:195] The type of model.layers.24.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:15:51.892.184 [mindspore/train/serialization.py:195] The type of model.layers.24.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:15:58.937.179 [mindspore/train/serialization.py:195] The type of model.layers.25.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:15:58.941.054 [mindspore/train/serialization.py:195] The type of model.layers.25.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:16:05.924.331 [mindspore/train/serialization.py:195] The type of model.layers.26.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:16:05.928.365 [mindspore/train/serialization.py:195] The type of model.layers.26.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:16:12.983.290 [mindspore/train/serialization.py:195] The type of model.layers.27.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:16:12.987.159 [mindspore/train/serialization.py:195] The type of model.layers.27.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:16:20.106.55 [mindspore/train/serialization.py:195] The type of model.layers.28.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:16:20.145.88 [mindspore/train/serialization.py:195] The type of model.layers.28.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:16:27.663.48 [mindspore/train/serialization.py:195] The type of model.layers.29.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:16:27.702.15 [mindspore/train/serialization.py:195] The type of model.layers.29.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:16:34.659.71 [mindspore/train/serialization.py:195] The type of model.layers.30.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:16:34.702.96 [mindspore/train/serialization.py:195] The type of model.layers.30.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:16:41.119.148 [mindspore/train/serialization.py:195] The type of model.layers.31.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:16:41.123.019 [mindspore/train/serialization.py:195] The type of model.layers.31.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:16:48.158.944 [mindspore/train/serialization.py:195] The type of model.norm_out.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:17:05.595.927 [mindspore/train/serialization.py:1456] For 'load_param_into_net', 128 parameters in the 'net' are not loaded, because they are not in the 'parameter_dict', please check whether the network structure is consistent when training and loading checkpoint. 
+[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:17:05.596.468 [mindspore/train/serialization.py:1460] ['model.layers.0.attention.wq.mindpet_delta_lora_a', 'model.layers.0.attention.wq.mindpet_delta_lora_b', 'model.layers.0.attention.wv.mindpet_delta_lora_a', 'model.layers.0.attention.wv.mindpet_delta_lora_b', 'model.layers.1.attention.wq.mindpet_delta_lora_a', 'model.layers.1.attention.wq.mindpet_delta_lora_b', 'model.layers.1.attention.wv.mindpet_delta_lora_a', 'model.layers.1.attention.wv.mindpet_delta_lora_b', 'model.layers.2.attention.wq.mindpet_delta_lora_a', 'model.layers.2.attention.wq.mindpet_delta_lora_b', 'model.layers.2.attention.wv.mindpet_delta_lora_a', 'model.layers.2.attention.wv.mindpet_delta_lora_b', 'model.layers.3.attention.wq.mindpet_delta_lora_a', 'model.layers.3.attention.wq.mindpet_delta_lora_b', 'model.layers.3.attention.wv.mindpet_delta_lora_a', 'model.layers.3.attention.wv.mindpet_delta_lora_b', 'model.layers.4.attention.wq.mindpet_delta_lora_a', 'model.layers.4.attention.wq.mindpet_delta_lora_b', 'model.layers.4.attention.wv.mindpet_delta_lora_a', 'model.layers.4.attention.wv.mindpet_delta_lora_b', 'model.layers.5.attention.wq.mindpet_delta_lora_a', 'model.layers.5.attention.wq.mindpet_delta_lora_b', 'model.layers.5.attention.wv.mindpet_delta_lora_a', 'model.layers.5.attention.wv.mindpet_delta_lora_b', 'model.layers.6.attention.wq.mindpet_delta_lora_a', 'model.layers.6.attention.wq.mindpet_delta_lora_b', 'model.layers.6.attention.wv.mindpet_delta_lora_a', 'model.layers.6.attention.wv.mindpet_delta_lora_b', 'model.layers.7.attention.wq.mindpet_delta_lora_a', 'model.layers.7.attention.wq.mindpet_delta_lora_b', 'model.layers.7.attention.wv.mindpet_delta_lora_a', 'model.layers.7.attention.wv.mindpet_delta_lora_b', 'model.layers.8.attention.wq.mindpet_delta_lora_a', 'model.layers.8.attention.wq.mindpet_delta_lora_b', 'model.layers.8.attention.wv.mindpet_delta_lora_a', 'model.layers.8.attention.wv.mindpet_delta_lora_b', 
'model.layers.9.attention.wq.mindpet_delta_lora_a', 'model.layers.9.attention.wq.mindpet_delta_lora_b', 'model.layers.9.attention.wv.mindpet_delta_lora_a', 'model.layers.9.attention.wv.mindpet_delta_lora_b', 'model.layers.10.attention.wq.mindpet_delta_lora_a', 'model.layers.10.attention.wq.mindpet_delta_lora_b', 'model.layers.10.attention.wv.mindpet_delta_lora_a', 'model.layers.10.attention.wv.mindpet_delta_lora_b', 'model.layers.11.attention.wq.mindpet_delta_lora_a', 'model.layers.11.attention.wq.mindpet_delta_lora_b', 'model.layers.11.attention.wv.mindpet_delta_lora_a', 'model.layers.11.attention.wv.mindpet_delta_lora_b', 'model.layers.12.attention.wq.mindpet_delta_lora_a', 'model.layers.12.attention.wq.mindpet_delta_lora_b', 'model.layers.12.attention.wv.mindpet_delta_lora_a', 'model.layers.12.attention.wv.mindpet_delta_lora_b', 'model.layers.13.attention.wq.mindpet_delta_lora_a', 'model.layers.13.attention.wq.mindpet_delta_lora_b', 'model.layers.13.attention.wv.mindpet_delta_lora_a', 'model.layers.13.attention.wv.mindpet_delta_lora_b', 'model.layers.14.attention.wq.mindpet_delta_lora_a', 'model.layers.14.attention.wq.mindpet_delta_lora_b', 'model.layers.14.attention.wv.mindpet_delta_lora_a', 'model.layers.14.attention.wv.mindpet_delta_lora_b', 'model.layers.15.attention.wq.mindpet_delta_lora_a', 'model.layers.15.attention.wq.mindpet_delta_lora_b', 'model.layers.15.attention.wv.mindpet_delta_lora_a', 'model.layers.15.attention.wv.mindpet_delta_lora_b', 'model.layers.16.attention.wq.mindpet_delta_lora_a', 'model.layers.16.attention.wq.mindpet_delta_lora_b', 'model.layers.16.attention.wv.mindpet_delta_lora_a', 'model.layers.16.attention.wv.mindpet_delta_lora_b', 'model.layers.17.attention.wq.mindpet_delta_lora_a', 'model.layers.17.attention.wq.mindpet_delta_lora_b', 'model.layers.17.attention.wv.mindpet_delta_lora_a', 'model.layers.17.attention.wv.mindpet_delta_lora_b', 'model.layers.18.attention.wq.mindpet_delta_lora_a', 
'model.layers.18.attention.wq.mindpet_delta_lora_b', 'model.layers.18.attention.wv.mindpet_delta_lora_a', 'model.layers.18.attention.wv.mindpet_delta_lora_b', 'model.layers.19.attention.wq.mindpet_delta_lora_a', 'model.layers.19.attention.wq.mindpet_delta_lora_b', 'model.layers.19.attention.wv.mindpet_delta_lora_a', 'model.layers.19.attention.wv.mindpet_delta_lora_b', 'model.layers.20.attention.wq.mindpet_delta_lora_a', 'model.layers.20.attention.wq.mindpet_delta_lora_b', 'model.layers.20.attention.wv.mindpet_delta_lora_a', 'model.layers.20.attention.wv.mindpet_delta_lora_b', 'model.layers.21.attention.wq.mindpet_delta_lora_a', 'model.layers.21.attention.wq.mindpet_delta_lora_b', 'model.layers.21.attention.wv.mindpet_delta_lora_a', 'model.layers.21.attention.wv.mindpet_delta_lora_b', 'model.layers.22.attention.wq.mindpet_delta_lora_a', 'model.layers.22.attention.wq.mindpet_delta_lora_b', 'model.layers.22.attention.wv.mindpet_delta_lora_a', 'model.layers.22.attention.wv.mindpet_delta_lora_b', 'model.layers.23.attention.wq.mindpet_delta_lora_a', 'model.layers.23.attention.wq.mindpet_delta_lora_b', 'model.layers.23.attention.wv.mindpet_delta_lora_a', 'model.layers.23.attention.wv.mindpet_delta_lora_b', 'model.layers.24.attention.wq.mindpet_delta_lora_a', 'model.layers.24.attention.wq.mindpet_delta_lora_b', 'model.layers.24.attention.wv.mindpet_delta_lora_a', 'model.layers.24.attention.wv.mindpet_delta_lora_b', 'model.layers.25.attention.wq.mindpet_delta_lora_a', 'model.layers.25.attention.wq.mindpet_delta_lora_b', 'model.layers.25.attention.wv.mindpet_delta_lora_a', 'model.layers.25.attention.wv.mindpet_delta_lora_b', 'model.layers.26.attention.wq.mindpet_delta_lora_a', 'model.layers.26.attention.wq.mindpet_delta_lora_b', 'model.layers.26.attention.wv.mindpet_delta_lora_a', 'model.layers.26.attention.wv.mindpet_delta_lora_b', 'model.layers.27.attention.wq.mindpet_delta_lora_a', 'model.layers.27.attention.wq.mindpet_delta_lora_b', 
'model.layers.27.attention.wv.mindpet_delta_lora_a', 'model.layers.27.attention.wv.mindpet_delta_lora_b', 'model.layers.28.attention.wq.mindpet_delta_lora_a', 'model.layers.28.attention.wq.mindpet_delta_lora_b', 'model.layers.28.attention.wv.mindpet_delta_lora_a', 'model.layers.28.attention.wv.mindpet_delta_lora_b', 'model.layers.29.attention.wq.mindpet_delta_lora_a', 'model.layers.29.attention.wq.mindpet_delta_lora_b', 'model.layers.29.attention.wv.mindpet_delta_lora_a', 'model.layers.29.attention.wv.mindpet_delta_lora_b', 'model.layers.30.attention.wq.mindpet_delta_lora_a', 'model.layers.30.attention.wq.mindpet_delta_lora_b', 'model.layers.30.attention.wv.mindpet_delta_lora_a', 'model.layers.30.attention.wv.mindpet_delta_lora_b', 'model.layers.31.attention.wq.mindpet_delta_lora_a', 'model.layers.31.attention.wq.mindpet_delta_lora_b', 'model.layers.31.attention.wv.mindpet_delta_lora_a', 'model.layers.31.attention.wv.mindpet_delta_lora_b'] are not loaded. +2024-07-25 18:17:05,597 - mindformers[mindformers/trainer/utils.py:767] - INFO - Network parameters are not loaded: (['model.layers.0.attention.wq.mindpet_delta_lora_a', 'model.layers.0.attention.wq.mindpet_delta_lora_b', 'model.layers.0.attention.wv.mindpet_delta_lora_a', 'model.layers.0.attention.wv.mindpet_delta_lora_b', 'model.layers.1.attention.wq.mindpet_delta_lora_a', 'model.layers.1.attention.wq.mindpet_delta_lora_b', 'model.layers.1.attention.wv.mindpet_delta_lora_a', 'model.layers.1.attention.wv.mindpet_delta_lora_b', 'model.layers.2.attention.wq.mindpet_delta_lora_a', 'model.layers.2.attention.wq.mindpet_delta_lora_b', 'model.layers.2.attention.wv.mindpet_delta_lora_a', 'model.layers.2.attention.wv.mindpet_delta_lora_b', 'model.layers.3.attention.wq.mindpet_delta_lora_a', 'model.layers.3.attention.wq.mindpet_delta_lora_b', 'model.layers.3.attention.wv.mindpet_delta_lora_a', 'model.layers.3.attention.wv.mindpet_delta_lora_b', 'model.layers.4.attention.wq.mindpet_delta_lora_a', 
'model.layers.4.attention.wq.mindpet_delta_lora_b', 'model.layers.4.attention.wv.mindpet_delta_lora_a', 'model.layers.4.attention.wv.mindpet_delta_lora_b', 'model.layers.5.attention.wq.mindpet_delta_lora_a', 'model.layers.5.attention.wq.mindpet_delta_lora_b', 'model.layers.5.attention.wv.mindpet_delta_lora_a', 'model.layers.5.attention.wv.mindpet_delta_lora_b', 'model.layers.6.attention.wq.mindpet_delta_lora_a', 'model.layers.6.attention.wq.mindpet_delta_lora_b', 'model.layers.6.attention.wv.mindpet_delta_lora_a', 'model.layers.6.attention.wv.mindpet_delta_lora_b', 'model.layers.7.attention.wq.mindpet_delta_lora_a', 'model.layers.7.attention.wq.mindpet_delta_lora_b', 'model.layers.7.attention.wv.mindpet_delta_lora_a', 'model.layers.7.attention.wv.mindpet_delta_lora_b', 'model.layers.8.attention.wq.mindpet_delta_lora_a', 'model.layers.8.attention.wq.mindpet_delta_lora_b', 'model.layers.8.attention.wv.mindpet_delta_lora_a', 'model.layers.8.attention.wv.mindpet_delta_lora_b', 'model.layers.9.attention.wq.mindpet_delta_lora_a', 'model.layers.9.attention.wq.mindpet_delta_lora_b', 'model.layers.9.attention.wv.mindpet_delta_lora_a', 'model.layers.9.attention.wv.mindpet_delta_lora_b', 'model.layers.10.attention.wq.mindpet_delta_lora_a', 'model.layers.10.attention.wq.mindpet_delta_lora_b', 'model.layers.10.attention.wv.mindpet_delta_lora_a', 'model.layers.10.attention.wv.mindpet_delta_lora_b', 'model.layers.11.attention.wq.mindpet_delta_lora_a', 'model.layers.11.attention.wq.mindpet_delta_lora_b', 'model.layers.11.attention.wv.mindpet_delta_lora_a', 'model.layers.11.attention.wv.mindpet_delta_lora_b', 'model.layers.12.attention.wq.mindpet_delta_lora_a', 'model.layers.12.attention.wq.mindpet_delta_lora_b', 'model.layers.12.attention.wv.mindpet_delta_lora_a', 'model.layers.12.attention.wv.mindpet_delta_lora_b', 'model.layers.13.attention.wq.mindpet_delta_lora_a', 'model.layers.13.attention.wq.mindpet_delta_lora_b', 'model.layers.13.attention.wv.mindpet_delta_lora_a', 
'model.layers.13.attention.wv.mindpet_delta_lora_b', 'model.layers.14.attention.wq.mindpet_delta_lora_a', 'model.layers.14.attention.wq.mindpet_delta_lora_b', 'model.layers.14.attention.wv.mindpet_delta_lora_a', 'model.layers.14.attention.wv.mindpet_delta_lora_b', 'model.layers.15.attention.wq.mindpet_delta_lora_a', 'model.layers.15.attention.wq.mindpet_delta_lora_b', 'model.layers.15.attention.wv.mindpet_delta_lora_a', 'model.layers.15.attention.wv.mindpet_delta_lora_b', 'model.layers.16.attention.wq.mindpet_delta_lora_a', 'model.layers.16.attention.wq.mindpet_delta_lora_b', 'model.layers.16.attention.wv.mindpet_delta_lora_a', 'model.layers.16.attention.wv.mindpet_delta_lora_b', 'model.layers.17.attention.wq.mindpet_delta_lora_a', 'model.layers.17.attention.wq.mindpet_delta_lora_b', 'model.layers.17.attention.wv.mindpet_delta_lora_a', 'model.layers.17.attention.wv.mindpet_delta_lora_b', 'model.layers.18.attention.wq.mindpet_delta_lora_a', 'model.layers.18.attention.wq.mindpet_delta_lora_b', 'model.layers.18.attention.wv.mindpet_delta_lora_a', 'model.layers.18.attention.wv.mindpet_delta_lora_b', 'model.layers.19.attention.wq.mindpet_delta_lora_a', 'model.layers.19.attention.wq.mindpet_delta_lora_b', 'model.layers.19.attention.wv.mindpet_delta_lora_a', 'model.layers.19.attention.wv.mindpet_delta_lora_b', 'model.layers.20.attention.wq.mindpet_delta_lora_a', 'model.layers.20.attention.wq.mindpet_delta_lora_b', 'model.layers.20.attention.wv.mindpet_delta_lora_a', 'model.layers.20.attention.wv.mindpet_delta_lora_b', 'model.layers.21.attention.wq.mindpet_delta_lora_a', 'model.layers.21.attention.wq.mindpet_delta_lora_b', 'model.layers.21.attention.wv.mindpet_delta_lora_a', 'model.layers.21.attention.wv.mindpet_delta_lora_b', 'model.layers.22.attention.wq.mindpet_delta_lora_a', 'model.layers.22.attention.wq.mindpet_delta_lora_b', 'model.layers.22.attention.wv.mindpet_delta_lora_a', 'model.layers.22.attention.wv.mindpet_delta_lora_b', 
'model.layers.23.attention.wq.mindpet_delta_lora_a', 'model.layers.23.attention.wq.mindpet_delta_lora_b', 'model.layers.23.attention.wv.mindpet_delta_lora_a', 'model.layers.23.attention.wv.mindpet_delta_lora_b', 'model.layers.24.attention.wq.mindpet_delta_lora_a', 'model.layers.24.attention.wq.mindpet_delta_lora_b', 'model.layers.24.attention.wv.mindpet_delta_lora_a', 'model.layers.24.attention.wv.mindpet_delta_lora_b', 'model.layers.25.attention.wq.mindpet_delta_lora_a', 'model.layers.25.attention.wq.mindpet_delta_lora_b', 'model.layers.25.attention.wv.mindpet_delta_lora_a', 'model.layers.25.attention.wv.mindpet_delta_lora_b', 'model.layers.26.attention.wq.mindpet_delta_lora_a', 'model.layers.26.attention.wq.mindpet_delta_lora_b', 'model.layers.26.attention.wv.mindpet_delta_lora_a', 'model.layers.26.attention.wv.mindpet_delta_lora_b', 'model.layers.27.attention.wq.mindpet_delta_lora_a', 'model.layers.27.attention.wq.mindpet_delta_lora_b', 'model.layers.27.attention.wv.mindpet_delta_lora_a', 'model.layers.27.attention.wv.mindpet_delta_lora_b', 'model.layers.28.attention.wq.mindpet_delta_lora_a', 'model.layers.28.attention.wq.mindpet_delta_lora_b', 'model.layers.28.attention.wv.mindpet_delta_lora_a', 'model.layers.28.attention.wv.mindpet_delta_lora_b', 'model.layers.29.attention.wq.mindpet_delta_lora_a', 'model.layers.29.attention.wq.mindpet_delta_lora_b', 'model.layers.29.attention.wv.mindpet_delta_lora_a', 'model.layers.29.attention.wv.mindpet_delta_lora_b', 'model.layers.30.attention.wq.mindpet_delta_lora_a', 'model.layers.30.attention.wq.mindpet_delta_lora_b', 'model.layers.30.attention.wv.mindpet_delta_lora_a', 'model.layers.30.attention.wv.mindpet_delta_lora_b', 'model.layers.31.attention.wq.mindpet_delta_lora_a', 'model.layers.31.attention.wq.mindpet_delta_lora_b', 'model.layers.31.attention.wv.mindpet_delta_lora_a', 'model.layers.31.attention.wv.mindpet_delta_lora_b'], []) +2024-07-25 18:17:05,598 - mindformers[mindformers/trainer/base_trainer.py:770] - INFO 
- .........Starting Training Model.......... +2024-07-25 18:17:05,599 - mindformers[mindformers/trainer/base_trainer.py:773] - INFO - .........Model Compiling, Please Wait a Moment........... +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:17:05.600.558 [mindspore/train/model.py:1120] For MFLossMonitor callback, {'epoch_end', 'epoch_begin', 'step_begin', 'step_end'} methods may not be supported in later version, Use methods prefixed with 'on_train' or 'on_eval' instead when using customized callbacks. +[WARNING] ME(62198:281473045422096,MainProcess):2024-07-25-18:17:05.600.752 [mindspore/train/model.py:1120] For Local2ObsMonitor callback, {'epoch_end', 'step_end'} methods may not be supported in later version, Use methods prefixed with 'on_train' or 'on_eval' instead when using customized callbacks. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.761.966 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/31-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.762.718 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/30-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.763.393 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/29-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.764.065 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/28-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.764.738 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/27-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.765.421 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/26-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.766.126 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/25-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.766.787 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/24-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.767.454 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/23-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.768.117 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/22-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.768.776 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/21-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.769.439 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/20-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.770.091 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/19-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.770.739 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/18-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.771.407 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/17-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.772.054 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/16-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.772.707 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/15-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.773.360 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/14-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.774.012 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/13-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.774.660 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/12-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.775.313 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/11-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.775.958 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/10-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.776.619 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/9-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.777.293 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/8-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.777.949 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/7-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.778.586 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/6-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.779.235 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/5-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.779.856 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/4-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.780.483 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/3-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.781.130 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/2-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.781.814 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/1-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.782.463 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/0-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.782.915 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/0-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.783.626 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/1-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.784.352 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/2-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.785.076 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/3-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.785.831 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/4-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.786.574 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/5-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.787.331 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/6-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.788.062 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/7-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.788.778 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/8-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.789.530 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/9-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.790.257 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/10-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.790.976 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/11-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.791.698 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/12-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.792.415 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/13-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.793.134 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/14-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.793.857 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/15-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.794.571 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/16-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.795.291 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/17-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.795.984 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/18-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.796.674 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/19-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.797.390 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/20-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.798.077 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/21-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.798.773 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/22-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.799.445 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/23-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.800.086 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/24-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.800.721 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/25-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.801.360 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/26-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.802.005 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/27-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.802.638 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/28-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.803.274 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/29-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.803.923 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/30-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:32.804.553 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/31-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62198,ffff8ce2e010,python):2024-07-25-18:17:35.317.965 [mindspore/ccsrc/frontend/parallel/graph_util/graph_utils.cc:68] GetTensorRedistributionFromCNode] Default/network-MFTrainOneStepCell/clip_grad_norm-ClipGradNorm/Sqrt-op0 has no OperatorInfo. 
+- \ | / - \ | 2024-07-25 18:28:34,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 2/ 1625], loss: 1.518, per_step_time: 343789ms, lr: 1.8461538e-08, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:34,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 0.02327 samples/s/p 64 days, 15:38:14 } +2024-07-25 18:28:38,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 4/ 1625], loss: 1.444, per_step_time: 1587ms, lr: 5.538461e-08, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:38,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 5.04055 samples/s/p 7:09:44 } +2024-07-25 18:28:41,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 6/ 1625], loss: 1.332, per_step_time: 1473ms, lr: 9.230769e-08, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:41,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 5.42918 samples/s/p 6:38:55 } +2024-07-25 18:28:44,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 8/ 1625], loss: 1.351, per_step_time: 1478ms, lr: 1.2923077e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:44,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 5.40922 samples/s/p 6:40:21 } +2024-07-25 18:28:47,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 10/ 1625], loss: 1.390, per_step_time: 1469ms, lr: 1.6615384e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:47,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.44291 samples/s/p 6:37:49 } +2024-07-25 18:28:50,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 12/ 1625], loss: 1.383, per_step_time: 1472ms, lr: 2.0307691e-07, overflow cond: False, loss_scale: 1.0 
+2024-07-25 18:28:50,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43416 samples/s/p 6:38:25 } +2024-07-25 18:28:52,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 14/ 1625], loss: 1.447, per_step_time: 1470ms, lr: 2.4e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:52,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43866 samples/s/p 6:38:02 } +2024-07-25 18:28:55,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 16/ 1625], loss: 1.293, per_step_time: 1472ms, lr: 2.7692306e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:55,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43206 samples/s/p 6:38:28 } +2024-07-25 18:28:58,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 18/ 1625], loss: 1.406, per_step_time: 1474ms, lr: 3.1384613e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:58,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.42645 samples/s/p 6:38:50 } +2024-07-25 18:29:01,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 20/ 1625], loss: 1.348, per_step_time: 1472ms, lr: 3.5076923e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:01,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43357 samples/s/p 6:38:15 } +2024-07-25 18:29:04,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 22/ 1625], loss: 1.420, per_step_time: 1473ms, lr: 3.876923e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:04,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.42752 samples/s/p 6:38:39 } +2024-07-25 18:29:07,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 24/ 1625], 
loss: 1.562, per_step_time: 1471ms, lr: 4.2461537e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:07,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43635 samples/s/p 6:37:57 } +2024-07-25 18:29:10,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 26/ 1625], loss: 1.360, per_step_time: 1471ms, lr: 4.6153846e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:10,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43674 samples/s/p 6:37:53 } +2024-07-25 18:29:13,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 28/ 1625], loss: 1.523, per_step_time: 1471ms, lr: 4.9846153e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:13,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43652 samples/s/p 6:37:51 } +2024-07-25 18:29:16,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 30/ 1625], loss: 1.471, per_step_time: 1473ms, lr: 5.3538463e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:16,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.42893 samples/s/p 6:38:21 } +2024-07-25 18:29:19,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 32/ 1625], loss: 1.504, per_step_time: 1471ms, lr: 5.7230767e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:19,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43644 samples/s/p 6:37:45 } +2024-07-25 18:29:22,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 34/ 1625], loss: 1.483, per_step_time: 1472ms, lr: 6.092307e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:22,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43471 samples/s/p 6:37:50 } +2024-07-25 18:29:25,452 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 36/ 1625], loss: 1.478, per_step_time: 1471ms, lr: 6.461538e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:25,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43505 samples/s/p 6:37:45 } +2024-07-25 18:29:28,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 38/ 1625], loss: 1.330, per_step_time: 1474ms, lr: 6.8307685e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:28,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.42654 samples/s/p 6:38:20 } +2024-07-25 18:29:31,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 40/ 1625], loss: 1.169, per_step_time: 1474ms, lr: 7.2e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:31,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.42643 samples/s/p 6:38:17 } +2024-07-25 18:29:34,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 42/ 1625], loss: 1.627, per_step_time: 1473ms, lr: 7.5692304e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:34,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.42943 samples/s/p 6:38:01 } +2024-07-25 18:29:37,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 44/ 1625], loss: 1.519, per_step_time: 1470ms, lr: 7.9384614e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:37,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.43960 samples/s/p 6:37:14 } +2024-07-25 18:29:40,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 46/ 1625], loss: 1.278, per_step_time: 1473ms, lr: 8.307692e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:40,221 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.42809 samples/s/p 6:38:01 } +2024-07-25 18:29:43,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 48/ 1625], loss: 1.576, per_step_time: 1471ms, lr: 8.676922e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:43,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.43623 samples/s/p 6:37:23 } +2024-07-25 18:29:46,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 50/ 1625], loss: 1.361, per_step_time: 1473ms, lr: 9.046154e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:46,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.42767 samples/s/p 6:37:57 } +2024-07-25 18:29:49,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 52/ 1625], loss: 1.520, per_step_time: 1472ms, lr: 9.4153836e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:49,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.43200 samples/s/p 6:37:35 } +2024-07-25 18:29:52,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 54/ 1625], loss: 1.476, per_step_time: 1473ms, lr: 9.784615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:52,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.42955 samples/s/p 6:37:43 } +2024-07-25 18:29:54,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 56/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 1.0153847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:54,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.43124 samples/s/p 6:37:33 } +2024-07-25 18:29:57,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 58/ 1625], loss: 1.420, 
per_step_time: 1473ms, lr: 1.0523077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:57,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.42769 samples/s/p 6:37:45 } +2024-07-25 18:30:00,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 60/ 1625], loss: 1.523, per_step_time: 1473ms, lr: 1.0892308e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:00,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.42745 samples/s/p 6:37:43 } +2024-07-25 18:30:03,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 62/ 1625], loss: 1.416, per_step_time: 1473ms, lr: 1.1261538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:03,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43024 samples/s/p 6:37:28 } +2024-07-25 18:30:06,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 64/ 1625], loss: 1.257, per_step_time: 1473ms, lr: 1.1630768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:06,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43105 samples/s/p 6:37:22 } +2024-07-25 18:30:09,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 66/ 1625], loss: 1.349, per_step_time: 1472ms, lr: 1.1999999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:09,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43407 samples/s/p 6:37:05 } +2024-07-25 18:30:12,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 68/ 1625], loss: 1.436, per_step_time: 1471ms, lr: 1.236923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:12,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43620 samples/s/p 6:36:53 } +2024-07-25 18:30:15,654 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 70/ 1625], loss: 1.423, per_step_time: 1471ms, lr: 1.2738461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:15,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43776 samples/s/p 6:36:43 } +2024-07-25 18:30:18,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 72/ 1625], loss: 1.402, per_step_time: 1471ms, lr: 1.3107691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:18,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43665 samples/s/p 6:36:45 } +2024-07-25 18:30:21,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 74/ 1625], loss: 1.433, per_step_time: 1475ms, lr: 1.3476922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:21,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.42245 samples/s/p 6:37:45 } +2024-07-25 18:30:24,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 76/ 1625], loss: 1.482, per_step_time: 1472ms, lr: 1.3846154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:24,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.43204 samples/s/p 6:37:00 } +2024-07-25 18:30:27,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 78/ 1625], loss: 1.335, per_step_time: 1473ms, lr: 1.4215384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:27,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.42813 samples/s/p 6:37:14 } +2024-07-25 18:30:30,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 80/ 1625], loss: 1.323, per_step_time: 1474ms, lr: 1.4584615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:30,424 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.42734 samples/s/p 6:37:14 } +2024-07-25 18:30:33,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 82/ 1625], loss: 1.471, per_step_time: 1472ms, lr: 1.4953846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:33,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.43261 samples/s/p 6:36:48 } +2024-07-25 18:30:36,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 84/ 1625], loss: 1.493, per_step_time: 1472ms, lr: 1.5323077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:36,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.43345 samples/s/p 6:36:42 } +2024-07-25 18:30:39,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 86/ 1625], loss: 1.431, per_step_time: 1473ms, lr: 1.5692307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:39,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.42963 samples/s/p 6:36:56 } +2024-07-25 18:30:42,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 88/ 1625], loss: 1.613, per_step_time: 1471ms, lr: 1.6061538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:42,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.43655 samples/s/p 6:36:22 } +2024-07-25 18:30:45,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 90/ 1625], loss: 1.673, per_step_time: 1483ms, lr: 1.6430769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:45,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.39357 samples/s/p 6:39:29 } +2024-07-25 18:30:48,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 92/ 1625], loss: 1.348, 
per_step_time: 1471ms, lr: 1.6799999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:48,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43646 samples/s/p 6:36:17 } +2024-07-25 18:30:51,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 94/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 1.716923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:51,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43676 samples/s/p 6:36:12 } +2024-07-25 18:30:54,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 96/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 1.753846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:54,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43646 samples/s/p 6:36:11 } +2024-07-25 18:30:57,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 98/ 1625], loss: 1.372, per_step_time: 1470ms, lr: 1.7907691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:57,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.44001 samples/s/p 6:35:52 } +2024-07-25 18:30:59,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 100/ 1625], loss: 1.329, per_step_time: 1471ms, lr: 1.8276922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:59,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43830 samples/s/p 6:35:57 } +2024-07-25 18:31:02,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 102/ 1625], loss: 1.413, per_step_time: 1472ms, lr: 1.8646153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:02,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43311 samples/s/p 6:36:17 } +2024-07-25 18:31:05,861 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 104/ 1625], loss: 1.332, per_step_time: 1472ms, lr: 1.9015384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:05,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43197 samples/s/p 6:36:19 } +2024-07-25 18:31:08,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 106/ 1625], loss: 1.178, per_step_time: 1474ms, lr: 1.9384615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:08,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.42665 samples/s/p 6:36:39 } +2024-07-25 18:31:11,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 108/ 1625], loss: 1.504, per_step_time: 1471ms, lr: 1.9753845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:11,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43479 samples/s/p 6:36:00 } +2024-07-25 18:31:14,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 110/ 1625], loss: 1.302, per_step_time: 1471ms, lr: 2.0123075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:14,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43702 samples/s/p 6:35:48 } +2024-07-25 18:31:17,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 112/ 1625], loss: 1.379, per_step_time: 1471ms, lr: 2.0492307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:17,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43745 samples/s/p 6:35:43 } +2024-07-25 18:31:20,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 114/ 1625], loss: 1.391, per_step_time: 1470ms, lr: 2.0861537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:20,616 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43891 samples/s/p 6:35:34 } +2024-07-25 18:31:23,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 116/ 1625], loss: 1.443, per_step_time: 1471ms, lr: 2.1230767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:23,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43652 samples/s/p 6:35:41 } +2024-07-25 18:31:26,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 118/ 1625], loss: 1.047, per_step_time: 1471ms, lr: 2.16e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:26,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43582 samples/s/p 6:35:41 } +2024-07-25 18:31:29,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 120/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.1969229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:29,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43241 samples/s/p 6:35:53 } +2024-07-25 18:31:32,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 122/ 1625], loss: 1.398, per_step_time: 1472ms, lr: 2.233846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:32,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43261 samples/s/p 6:35:49 } +2024-07-25 18:31:35,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 124/ 1625], loss: 1.370, per_step_time: 1472ms, lr: 2.270769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:35,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43452 samples/s/p 6:35:38 } +2024-07-25 18:31:38,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 126/ 1625], loss: 1.199, 
per_step_time: 1475ms, lr: 2.307692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:38,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.42226 samples/s/p 6:36:29 } +2024-07-25 18:31:41,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 128/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.3446153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:41,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43651 samples/s/p 6:35:24 } +2024-07-25 18:31:44,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 130/ 1625], loss: 1.262, per_step_time: 1474ms, lr: 2.3815385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:44,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.42524 samples/s/p 6:36:10 } +2024-07-25 18:31:47,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 132/ 1625], loss: 1.332, per_step_time: 1471ms, lr: 2.4184615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:47,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43551 samples/s/p 6:35:22 } +2024-07-25 18:31:50,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 134/ 1625], loss: 1.484, per_step_time: 1472ms, lr: 2.4553847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:50,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43417 samples/s/p 6:35:25 } +2024-07-25 18:31:53,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 136/ 1625], loss: 1.322, per_step_time: 1473ms, lr: 2.4923077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:53,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.42900 samples/s/p 6:35:45 } +2024-07-25 18:31:56,044 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 138/ 1625], loss: 1.332, per_step_time: 1472ms, lr: 2.5292306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:56,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43439 samples/s/p 6:35:18 } +2024-07-25 18:31:58,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 140/ 1625], loss: 1.388, per_step_time: 1472ms, lr: 2.5661539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:58,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43348 samples/s/p 6:35:19 } +2024-07-25 18:32:01,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 142/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 2.6030768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:01,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43206 samples/s/p 6:35:22 } +2024-07-25 18:32:04,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 144/ 1625], loss: 1.342, per_step_time: 1472ms, lr: 2.6399998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:04,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43309 samples/s/p 6:35:15 } +2024-07-25 18:32:07,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 146/ 1625], loss: 1.334, per_step_time: 1472ms, lr: 2.676923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:07,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43370 samples/s/p 6:35:09 } +2024-07-25 18:32:10,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 148/ 1625], loss: 1.377, per_step_time: 1472ms, lr: 2.713846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:10,805 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43142 samples/s/p 6:35:16 } +2024-07-25 18:32:13,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 150/ 1625], loss: 1.384, per_step_time: 1470ms, lr: 2.7507692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:13,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43989 samples/s/p 6:34:36 } +2024-07-25 18:32:16,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 152/ 1625], loss: 1.442, per_step_time: 1471ms, lr: 2.7876922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:16,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43754 samples/s/p 6:34:44 } +2024-07-25 18:32:19,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 154/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 2.8246152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:19,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43187 samples/s/p 6:35:06 } +2024-07-25 18:32:22,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 156/ 1625], loss: 1.473, per_step_time: 1470ms, lr: 2.8615384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:22,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.44046 samples/s/p 6:34:25 } +2024-07-25 18:32:25,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 158/ 1625], loss: 1.352, per_step_time: 1471ms, lr: 2.8984614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:25,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43533 samples/s/p 6:34:45 } +2024-07-25 18:32:28,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 160/ 1625], loss: 1.335, 
per_step_time: 1473ms, lr: 2.9353844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:28,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.42799 samples/s/p 6:35:14 } +2024-07-25 18:32:31,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 162/ 1625], loss: 1.487, per_step_time: 1472ms, lr: 2.9723076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:31,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43341 samples/s/p 6:34:47 } +2024-07-25 18:32:34,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 164/ 1625], loss: 1.285, per_step_time: 1470ms, lr: 3.0092306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:34,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43889 samples/s/p 6:34:20 } +2024-07-25 18:32:37,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 166/ 1625], loss: 1.387, per_step_time: 1472ms, lr: 3.0461536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:37,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43402 samples/s/p 6:34:38 } +2024-07-25 18:32:40,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 168/ 1625], loss: 1.343, per_step_time: 1471ms, lr: 3.0830768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:40,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43686 samples/s/p 6:34:23 } +2024-07-25 18:32:43,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 170/ 1625], loss: 1.357, per_step_time: 1473ms, lr: 3.1199997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:43,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43064 samples/s/p 6:34:47 } +2024-07-25 18:32:46,217 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 172/ 1625], loss: 1.297, per_step_time: 1472ms, lr: 3.156923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:46,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43352 samples/s/p 6:34:32 } +2024-07-25 18:32:49,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 174/ 1625], loss: 1.353, per_step_time: 1472ms, lr: 3.1938462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:49,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43182 samples/s/p 6:34:36 } +2024-07-25 18:32:52,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 176/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 3.2307692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:52,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43300 samples/s/p 6:34:28 } +2024-07-25 18:32:55,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 178/ 1625], loss: 1.353, per_step_time: 1471ms, lr: 3.2676921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:55,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43491 samples/s/p 6:34:17 } +2024-07-25 18:32:58,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 180/ 1625], loss: 1.463, per_step_time: 1472ms, lr: 3.3046153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:58,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43409 samples/s/p 6:34:18 } +2024-07-25 18:33:00,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 182/ 1625], loss: 1.410, per_step_time: 1473ms, lr: 3.3415383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:00,978 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.42969 samples/s/p 6:34:34 } +2024-07-25 18:33:03,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 184/ 1625], loss: 1.516, per_step_time: 1471ms, lr: 3.3784615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:03,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43809 samples/s/p 6:33:54 } +2024-07-25 18:33:06,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 186/ 1625], loss: 1.353, per_step_time: 1473ms, lr: 3.4153845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:06,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.42863 samples/s/p 6:34:32 } +2024-07-25 18:33:09,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 188/ 1625], loss: 1.366, per_step_time: 1471ms, lr: 3.4523075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:09,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43590 samples/s/p 6:33:58 } +2024-07-25 18:33:12,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 190/ 1625], loss: 1.327, per_step_time: 1472ms, lr: 3.4892307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:12,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43173 samples/s/p 6:34:13 } +2024-07-25 18:33:15,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 192/ 1625], loss: 1.355, per_step_time: 1473ms, lr: 3.5261537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:15,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.42802 samples/s/p 6:34:26 } +2024-07-25 18:33:18,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 194/ 1625], loss: 1.304, 
per_step_time: 1472ms, lr: 3.5630767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:18,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43273 samples/s/p 6:34:03 } +2024-07-25 18:33:21,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 196/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 3.6e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:21,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43469 samples/s/p 6:33:51 } +2024-07-25 18:33:24,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 198/ 1625], loss: 1.411, per_step_time: 1472ms, lr: 3.6369229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:24,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43206 samples/s/p 6:34:00 } +2024-07-25 18:33:27,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 200/ 1625], loss: 1.502, per_step_time: 1472ms, lr: 3.6738459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:27,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43458 samples/s/p 6:33:46 } +2024-07-25 18:33:30,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 202/ 1625], loss: 1.411, per_step_time: 1471ms, lr: 3.710769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:30,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43548 samples/s/p 6:33:39 } +2024-07-25 18:33:33,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 204/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 3.747692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:33,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.43336 samples/s/p 6:33:45 } +2024-07-25 18:33:36,403 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 206/ 1625], loss: 1.352, per_step_time: 1473ms, lr: 3.784615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:36,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.42850 samples/s/p 6:34:04 } +2024-07-25 18:33:39,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 208/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 3.8215385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:39,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.43480 samples/s/p 6:33:33 } +2024-07-25 18:33:42,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 210/ 1625], loss: 1.391, per_step_time: 1473ms, lr: 3.8584612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:42,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.42984 samples/s/p 6:33:52 } +2024-07-25 18:33:45,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 212/ 1625], loss: 1.315, per_step_time: 1470ms, lr: 3.8953845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:45,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.43870 samples/s/p 6:33:10 } +2024-07-25 18:33:48,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 214/ 1625], loss: 1.257, per_step_time: 1474ms, lr: 3.932307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:48,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.42622 samples/s/p 6:34:02 } +2024-07-25 18:33:51,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 216/ 1625], loss: 1.471, per_step_time: 1470ms, lr: 3.969231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:51,162 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.44038 samples/s/p 6:32:57 } +2024-07-25 18:33:54,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 218/ 1625], loss: 1.347, per_step_time: 1473ms, lr: 4.0061536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:54,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.42848 samples/s/p 6:33:46 } +2024-07-25 18:33:57,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 220/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 4.043077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:57,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43715 samples/s/p 6:33:05 } +2024-07-25 18:34:00,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 222/ 1625], loss: 1.240, per_step_time: 1474ms, lr: 4.0799996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:00,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.42606 samples/s/p 6:33:51 } +2024-07-25 18:34:02,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 224/ 1625], loss: 1.427, per_step_time: 1471ms, lr: 4.116923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:02,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43665 samples/s/p 6:33:02 } +2024-07-25 18:34:05,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 226/ 1625], loss: 1.358, per_step_time: 1471ms, lr: 4.153846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:05,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43710 samples/s/p 6:32:57 } +2024-07-25 18:34:08,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 228/ 1625], loss: 1.477, 
per_step_time: 1472ms, lr: 4.1907692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:08,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43448 samples/s/p 6:33:05 } +2024-07-25 18:34:11,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 230/ 1625], loss: 1.229, per_step_time: 1474ms, lr: 4.227692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:11,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.42581 samples/s/p 6:33:40 } +2024-07-25 18:34:14,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 232/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 4.264615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:14,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43151 samples/s/p 6:33:12 } +2024-07-25 18:34:17,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 234/ 1625], loss: 1.391, per_step_time: 1472ms, lr: 4.301538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:17,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43211 samples/s/p 6:33:07 } +2024-07-25 18:34:20,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 236/ 1625], loss: 1.328, per_step_time: 1474ms, lr: 4.338461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:20,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.42451 samples/s/p 6:33:37 } +2024-07-25 18:34:23,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 238/ 1625], loss: 1.468, per_step_time: 1471ms, lr: 4.375385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:23,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43564 samples/s/p 6:32:45 } +2024-07-25 18:34:26,592 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 240/ 1625], loss: 1.321, per_step_time: 1472ms, lr: 4.4123076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:26,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43388 samples/s/p 6:32:50 } +2024-07-25 18:34:29,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 242/ 1625], loss: 1.520, per_step_time: 1475ms, lr: 4.449231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:29,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.42210 samples/s/p 6:33:38 } +2024-07-25 18:34:32,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 244/ 1625], loss: 1.365, per_step_time: 1473ms, lr: 4.4861536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:32,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.42880 samples/s/p 6:33:06 } +2024-07-25 18:34:35,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 246/ 1625], loss: 1.449, per_step_time: 1473ms, lr: 4.5230768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:35,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43019 samples/s/p 6:32:57 } +2024-07-25 18:34:38,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 248/ 1625], loss: 1.269, per_step_time: 1470ms, lr: 4.5599995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:38,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43939 samples/s/p 6:32:14 } +2024-07-25 18:34:41,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 250/ 1625], loss: 1.362, per_step_time: 1473ms, lr: 4.596923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:41,361 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43006 samples/s/p 6:32:52 } +2024-07-25 18:34:44,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 252/ 1625], loss: 1.268, per_step_time: 1471ms, lr: 4.633846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:44,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43563 samples/s/p 6:32:25 } +2024-07-25 18:34:47,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 254/ 1625], loss: 1.380, per_step_time: 1472ms, lr: 4.670769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:47,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43159 samples/s/p 6:32:39 } +2024-07-25 18:34:50,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 256/ 1625], loss: 1.206, per_step_time: 1469ms, lr: 4.707692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:50,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.44303 samples/s/p 6:31:47 } +2024-07-25 18:34:53,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 258/ 1625], loss: 1.435, per_step_time: 1471ms, lr: 4.744615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:53,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43496 samples/s/p 6:32:19 } +2024-07-25 18:34:56,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 260/ 1625], loss: 1.525, per_step_time: 1471ms, lr: 4.7815383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:56,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43694 samples/s/p 6:32:07 } +2024-07-25 18:34:59,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 262/ 1625], loss: 1.477, 
per_step_time: 1472ms, lr: 4.8184615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:59,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43241 samples/s/p 6:32:24 } +2024-07-25 18:35:02,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 264/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 4.8553843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:02,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43129 samples/s/p 6:32:26 } +2024-07-25 18:35:04,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 266/ 1625], loss: 1.357, per_step_time: 1472ms, lr: 4.8923075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:04,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43260 samples/s/p 6:32:17 } +2024-07-25 18:35:07,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 268/ 1625], loss: 1.425, per_step_time: 1472ms, lr: 4.9292303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:07,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43179 samples/s/p 6:32:18 } +2024-07-25 18:35:10,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 270/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 4.9661535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:10,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43533 samples/s/p 6:32:00 } +2024-07-25 18:35:13,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 272/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 5.0030767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:13,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43453 samples/s/p 6:32:00 } +2024-07-25 18:35:16,776 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 274/ 1625], loss: 1.197, per_step_time: 1473ms, lr: 5.04e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:16,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43005 samples/s/p 6:32:17 } +2024-07-25 18:35:19,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 276/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 5.0769227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:19,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43462 samples/s/p 6:31:54 } +2024-07-25 18:35:22,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 278/ 1625], loss: 1.270, per_step_time: 1475ms, lr: 5.113846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:22,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.42369 samples/s/p 6:32:38 } +2024-07-25 18:35:25,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 280/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 5.150769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:25,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43659 samples/s/p 6:31:40 } +2024-07-25 18:35:28,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 282/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 5.187692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:28,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43486 samples/s/p 6:31:44 } +2024-07-25 18:35:31,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 284/ 1625], loss: 1.393, per_step_time: 1472ms, lr: 5.2246155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:31,537 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43457 samples/s/p 6:31:42 } +2024-07-25 18:35:34,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 286/ 1625], loss: 1.344, per_step_time: 1471ms, lr: 5.2615383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:34,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43674 samples/s/p 6:31:30 } +2024-07-25 18:35:37,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 288/ 1625], loss: 1.358, per_step_time: 1472ms, lr: 5.2984615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:37,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43412 samples/s/p 6:31:38 } +2024-07-25 18:35:40,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 290/ 1625], loss: 1.326, per_step_time: 1471ms, lr: 5.3353842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:40,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43756 samples/s/p 6:31:21 } +2024-07-25 18:35:43,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 292/ 1625], loss: 1.333, per_step_time: 1473ms, lr: 5.3723074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:43,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.42791 samples/s/p 6:31:59 } +2024-07-25 18:35:46,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 294/ 1625], loss: 1.196, per_step_time: 1474ms, lr: 5.4092307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:46,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.42632 samples/s/p 6:32:03 } +2024-07-25 18:35:49,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 296/ 1625], loss: 1.371, 
per_step_time: 1471ms, lr: 5.446154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:49,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43499 samples/s/p 6:31:23 } +2024-07-25 18:35:52,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 298/ 1625], loss: 1.318, per_step_time: 1472ms, lr: 5.4830766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:52,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43314 samples/s/p 6:31:28 } +2024-07-25 18:35:55,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 300/ 1625], loss: 1.461, per_step_time: 1473ms, lr: 5.52e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:55,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.42942 samples/s/p 6:31:41 } +2024-07-25 18:35:58,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 302/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 5.5569226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:58,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43799 samples/s/p 6:31:01 } +2024-07-25 18:36:01,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 304/ 1625], loss: 1.507, per_step_time: 1472ms, lr: 5.593846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:01,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43339 samples/s/p 6:31:18 } +2024-07-25 18:36:04,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 306/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 5.630769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:04,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43727 samples/s/p 6:30:58 } +2024-07-25 18:36:06,956 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 308/ 1625], loss: 1.269, per_step_time: 1471ms, lr: 5.667692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:06,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43703 samples/s/p 6:30:56 } +2024-07-25 18:36:09,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 310/ 1625], loss: 1.369, per_step_time: 1471ms, lr: 5.704615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:09,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43615 samples/s/p 6:30:57 } +2024-07-25 18:36:12,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 312/ 1625], loss: 1.359, per_step_time: 1472ms, lr: 5.741538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:12,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43145 samples/s/p 6:31:15 } +2024-07-25 18:36:15,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 314/ 1625], loss: 1.310, per_step_time: 1471ms, lr: 5.778461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:15,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43721 samples/s/p 6:30:47 } +2024-07-25 18:36:18,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 316/ 1625], loss: 1.264, per_step_time: 1471ms, lr: 5.8153846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:18,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43754 samples/s/p 6:30:42 } +2024-07-25 18:36:21,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 318/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 5.8523074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:21,709 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.43715 samples/s/p 6:30:41 } +2024-07-25 18:36:24,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 320/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 5.8892306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:24,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.43231 samples/s/p 6:30:59 } +2024-07-25 18:36:27,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 322/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 5.926154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:27,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.43194 samples/s/p 6:30:58 } +2024-07-25 18:36:30,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 324/ 1625], loss: 1.425, per_step_time: 1470ms, lr: 5.9630765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:30,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.43925 samples/s/p 6:30:23 } +2024-07-25 18:36:33,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 326/ 1625], loss: 1.305, per_step_time: 1470ms, lr: 5.9999998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:33,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.44096 samples/s/p 6:30:13 } +2024-07-25 18:36:36,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 328/ 1625], loss: 1.466, per_step_time: 1472ms, lr: 6.036923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:36,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.43210 samples/s/p 6:30:48 } +2024-07-25 18:36:39,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 330/ 1625], loss: 1.211, 
per_step_time: 1471ms, lr: 6.073846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:39,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.43677 samples/s/p 6:30:25 } +2024-07-25 18:36:42,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 332/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 6.110769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:42,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.43145 samples/s/p 6:30:45 } +2024-07-25 18:36:45,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 334/ 1625], loss: 1.356, per_step_time: 1472ms, lr: 6.147692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:45,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43322 samples/s/p 6:30:35 } +2024-07-25 18:36:48,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 336/ 1625], loss: 1.280, per_step_time: 1472ms, lr: 6.184615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:48,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43209 samples/s/p 6:30:37 } +2024-07-25 18:36:51,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 338/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 6.221538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:51,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43616 samples/s/p 6:30:16 } +2024-07-25 18:36:54,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 340/ 1625], loss: 1.328, per_step_time: 1473ms, lr: 6.2584613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:54,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.42955 samples/s/p 6:30:42 } +2024-07-25 18:36:57,123 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 342/ 1625], loss: 1.366, per_step_time: 1470ms, lr: 6.2953845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:57,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43860 samples/s/p 6:30:00 } +2024-07-25 18:37:00,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 344/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 6.3323073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:00,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43115 samples/s/p 6:30:29 } +2024-07-25 18:37:03,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 346/ 1625], loss: 1.202, per_step_time: 1473ms, lr: 6.3692305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:03,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43074 samples/s/p 6:30:28 } +2024-07-25 18:37:05,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 348/ 1625], loss: 1.302, per_step_time: 1472ms, lr: 6.4061533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:05,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43250 samples/s/p 6:30:17 } +2024-07-25 18:37:08,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 350/ 1625], loss: 1.340, per_step_time: 1471ms, lr: 6.443077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:08,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43738 samples/s/p 6:29:53 } +2024-07-25 18:37:11,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 352/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 6.4799997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:11,883 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43322 samples/s/p 6:30:08 } +2024-07-25 18:37:14,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 354/ 1625], loss: 1.081, per_step_time: 1473ms, lr: 6.516923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:14,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.42760 samples/s/p 6:30:29 } +2024-07-25 18:37:17,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 356/ 1625], loss: 1.244, per_step_time: 1470ms, lr: 6.5538457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:17,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43872 samples/s/p 6:29:39 } +2024-07-25 18:37:20,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 358/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 6.590769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:20,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43373 samples/s/p 6:29:57 } +2024-07-25 18:37:23,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 360/ 1625], loss: 1.308, per_step_time: 1474ms, lr: 6.6276916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:23,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.42613 samples/s/p 6:30:27 } +2024-07-25 18:37:26,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 362/ 1625], loss: 1.228, per_step_time: 1472ms, lr: 6.6646153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:26,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43450 samples/s/p 6:29:48 } +2024-07-25 18:37:29,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 364/ 1625], loss: 
1.370, per_step_time: 1474ms, lr: 6.7015385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:29,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.42671 samples/s/p 6:30:18 } +2024-07-25 18:37:32,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 366/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 6.7384613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:32,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43725 samples/s/p 6:29:30 } +2024-07-25 18:37:35,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 368/ 1625], loss: 1.162, per_step_time: 1473ms, lr: 6.7753845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:35,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43041 samples/s/p 6:29:57 } +2024-07-25 18:37:38,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 370/ 1625], loss: 1.162, per_step_time: 1470ms, lr: 6.812307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:38,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43875 samples/s/p 6:29:18 } +2024-07-25 18:37:41,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 372/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 6.8492304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:41,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43733 samples/s/p 6:29:21 } +2024-07-25 18:37:44,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 374/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 6.8861536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:44,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43612 samples/s/p 6:29:23 } +2024-07-25 
18:37:47,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 376/ 1625], loss: 1.060, per_step_time: 1471ms, lr: 6.923077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:47,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43781 samples/s/p 6:29:13 } +2024-07-25 18:37:50,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 378/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 6.9599996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:50,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43495 samples/s/p 6:29:22 } +2024-07-25 18:37:53,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 380/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 6.996923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:53,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43837 samples/s/p 6:29:05 } +2024-07-25 18:37:56,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 382/ 1625], loss: 1.285, per_step_time: 1473ms, lr: 7.0338456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:56,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.42951 samples/s/p 6:29:40 } +2024-07-25 18:37:59,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 384/ 1625], loss: 1.384, per_step_time: 1473ms, lr: 7.0707692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:59,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.42878 samples/s/p 6:29:40 } +2024-07-25 18:38:02,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 386/ 1625], loss: 1.272, per_step_time: 1474ms, lr: 7.107692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:02,068 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.42419 samples/s/p 6:29:57 } +2024-07-25 18:38:05,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 388/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 7.144615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:05,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.43691 samples/s/p 6:28:59 } +2024-07-25 18:38:07,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 390/ 1625], loss: 1.440, per_step_time: 1471ms, lr: 7.181538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:07,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.43659 samples/s/p 6:28:58 } +2024-07-25 18:38:10,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 392/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 7.218461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:10,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.43770 samples/s/p 6:28:50 } +2024-07-25 18:38:13,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 394/ 1625], loss: 1.288, per_step_time: 1473ms, lr: 7.255384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:13,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.42902 samples/s/p 6:29:24 } +2024-07-25 18:38:16,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 396/ 1625], loss: 1.116, per_step_time: 1473ms, lr: 7.2923076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:16,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.42911 samples/s/p 6:29:21 } +2024-07-25 18:38:19,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 398/ 1625], loss: 
1.331, per_step_time: 1470ms, lr: 7.3292304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:19,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.44065 samples/s/p 6:28:28 } +2024-07-25 18:38:22,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 400/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 7.3661536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:22,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43111 samples/s/p 6:29:06 } +2024-07-25 18:38:25,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 402/ 1625], loss: 1.334, per_step_time: 1474ms, lr: 7.4030763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:25,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.42475 samples/s/p 6:29:31 } +2024-07-25 18:38:28,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 404/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 7.4399995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:28,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43526 samples/s/p 6:28:43 } +2024-07-25 18:38:31,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 406/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 7.4769227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:31,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.44029 samples/s/p 6:28:18 } +2024-07-25 18:38:34,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 408/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 7.5138464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:34,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43284 samples/s/p 6:28:47 } +2024-07-25 
18:38:37,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 410/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 7.5507687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:37,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43469 samples/s/p 6:28:36 } +2024-07-25 18:38:40,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 412/ 1625], loss: 1.337, per_step_time: 1471ms, lr: 7.587692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:40,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43599 samples/s/p 6:28:28 } +2024-07-25 18:38:43,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 414/ 1625], loss: 1.223, per_step_time: 1470ms, lr: 7.624615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:43,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43946 samples/s/p 6:28:10 } +2024-07-25 18:38:46,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 416/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 7.661539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:46,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.43925 samples/s/p 6:28:08 } +2024-07-25 18:38:49,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 418/ 1625], loss: 1.314, per_step_time: 1470ms, lr: 7.698461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:49,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.44165 samples/s/p 6:27:55 } +2024-07-25 18:38:52,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 420/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 7.735384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:52,256 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.43635 samples/s/p 6:28:15 } +2024-07-25 18:38:55,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 422/ 1625], loss: 1.208, per_step_time: 1470ms, lr: 7.772307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:55,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.44065 samples/s/p 6:27:53 } +2024-07-25 18:38:58,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 424/ 1625], loss: 1.187, per_step_time: 1474ms, lr: 7.809231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:58,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.42513 samples/s/p 6:28:57 } +2024-07-25 18:39:01,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 426/ 1625], loss: 1.136, per_step_time: 1477ms, lr: 7.8461535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:01,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.41405 samples/s/p 6:29:42 } +2024-07-25 18:39:04,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 428/ 1625], loss: 1.281, per_step_time: 1473ms, lr: 7.883076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:04,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.43057 samples/s/p 6:28:28 } +2024-07-25 18:39:07,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 430/ 1625], loss: 1.191, per_step_time: 1469ms, lr: 7.92e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:07,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.44292 samples/s/p 6:27:32 } +2024-07-25 18:39:09,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 432/ 1625], loss: 1.374, 
per_step_time: 1472ms, lr: 7.956923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:09,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43121 samples/s/p 6:28:19 } +2024-07-25 18:39:12,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 434/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 7.993845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:12,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43782 samples/s/p 6:27:48 } +2024-07-25 18:39:15,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 436/ 1625], loss: 1.290, per_step_time: 1469ms, lr: 8.030769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:15,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.44243 samples/s/p 6:27:25 } +2024-07-25 18:39:18,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 438/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 8.067692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:18,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43166 samples/s/p 6:28:08 } +2024-07-25 18:39:21,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 440/ 1625], loss: 1.366, per_step_time: 1471ms, lr: 8.1046155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:21,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43613 samples/s/p 6:27:46 } +2024-07-25 18:39:24,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 442/ 1625], loss: 1.638, per_step_time: 1472ms, lr: 8.141537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:24,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43447 samples/s/p 6:27:50 } +2024-07-25 18:39:27,675 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 444/ 1625], loss: 1.360, per_step_time: 1471ms, lr: 8.178461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:27,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43799 samples/s/p 6:27:32 } +2024-07-25 18:39:30,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 446/ 1625], loss: 1.360, per_step_time: 1471ms, lr: 8.215385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:30,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43695 samples/s/p 6:27:34 } +2024-07-25 18:39:33,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 448/ 1625], loss: 1.467, per_step_time: 1472ms, lr: 8.252307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:33,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.43146 samples/s/p 6:27:54 } +2024-07-25 18:39:36,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 450/ 1625], loss: 1.318, per_step_time: 1473ms, lr: 8.289231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:36,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.42924 samples/s/p 6:28:01 } +2024-07-25 18:39:39,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 452/ 1625], loss: 1.272, per_step_time: 1470ms, lr: 8.326153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:39,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.44080 samples/s/p 6:27:08 } +2024-07-25 18:39:42,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 454/ 1625], loss: 1.189, per_step_time: 1481ms, lr: 8.363077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:42,451 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.39846 samples/s/p 6:30:08 } +2024-07-25 18:39:45,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 456/ 1625], loss: 1.150, per_step_time: 1472ms, lr: 8.399999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:45,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.43268 samples/s/p 6:27:37 } +2024-07-25 18:39:48,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 458/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 8.436923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:48,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.42749 samples/s/p 6:27:57 } +2024-07-25 18:39:51,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 460/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 8.473846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:51,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.43538 samples/s/p 6:27:20 } +2024-07-25 18:39:54,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 462/ 1625], loss: 1.141, per_step_time: 1473ms, lr: 8.510769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:54,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.43028 samples/s/p 6:27:39 } +2024-07-25 18:39:57,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 464/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 8.547692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:57,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43757 samples/s/p 6:27:05 } +2024-07-25 18:40:00,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 466/ 1625], loss: 1.266, 
per_step_time: 1471ms, lr: 8.584615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:00,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43685 samples/s/p 6:27:05 } +2024-07-25 18:40:03,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 468/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 8.621538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:03,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43728 samples/s/p 6:27:00 } +2024-07-25 18:40:06,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 470/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 8.658461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:06,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43653 samples/s/p 6:27:00 } +2024-07-25 18:40:09,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 472/ 1625], loss: 1.276, per_step_time: 1472ms, lr: 8.695384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:09,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43429 samples/s/p 6:27:07 } +2024-07-25 18:40:11,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 474/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 8.732308e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:11,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43472 samples/s/p 6:27:02 } +2024-07-25 18:40:14,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 476/ 1625], loss: 1.107, per_step_time: 1475ms, lr: 8.76923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:14,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.42114 samples/s/p 6:27:57 } +2024-07-25 18:40:17,877 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 478/ 1625], loss: 1.351, per_step_time: 1473ms, lr: 8.806153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:17,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.42948 samples/s/p 6:27:19 } +2024-07-25 18:40:20,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 480/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 8.843077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:20,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.44198 samples/s/p 6:26:22 } +2024-07-25 18:40:23,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 482/ 1625], loss: 1.300, per_step_time: 1472ms, lr: 8.88e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:23,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43180 samples/s/p 6:27:03 } +2024-07-25 18:40:26,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 484/ 1625], loss: 1.342, per_step_time: 1477ms, lr: 8.9169225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:26,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.41604 samples/s/p 6:28:07 } +2024-07-25 18:40:29,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 486/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 8.953845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:29,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43805 samples/s/p 6:26:30 } +2024-07-25 18:40:32,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 488/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 8.990769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:32,641 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43138 samples/s/p 6:26:56 } +2024-07-25 18:40:35,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 490/ 1625], loss: 1.332, per_step_time: 1471ms, lr: 9.027692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:35,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43791 samples/s/p 6:26:25 } +2024-07-25 18:40:38,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 492/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 9.064615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:38,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43283 samples/s/p 6:26:44 } +2024-07-25 18:40:41,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 494/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 9.101538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:41,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43455 samples/s/p 6:26:33 } +2024-07-25 18:40:44,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 496/ 1625], loss: 1.359, per_step_time: 1471ms, lr: 9.138461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:44,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43804 samples/s/p 6:26:15 } +2024-07-25 18:40:47,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 498/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 9.175385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:47,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43179 samples/s/p 6:26:39 } +2024-07-25 18:40:50,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 500/ 1625], loss: 1.235, 
per_step_time: 1471ms, lr: 9.212307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:50,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43500 samples/s/p 6:26:23 } +2024-07-25 18:40:53,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 502/ 1625], loss: 1.260, per_step_time: 1473ms, lr: 9.24923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:53,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43105 samples/s/p 6:26:36 } +2024-07-25 18:40:56,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 504/ 1625], loss: 1.320, per_step_time: 1473ms, lr: 9.286154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:56,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43058 samples/s/p 6:26:36 } +2024-07-25 18:40:59,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 506/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 9.3230765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:59,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43283 samples/s/p 6:26:23 } +2024-07-25 18:41:02,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 508/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 9.36e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:02,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43838 samples/s/p 6:25:56 } +2024-07-25 18:41:05,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 510/ 1625], loss: 1.300, per_step_time: 1471ms, lr: 9.396922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:05,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43725 samples/s/p 6:25:58 } +2024-07-25 18:41:08,048 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 512/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 9.433846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:08,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.44195 samples/s/p 6:25:35 } +2024-07-25 18:41:11,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 514/ 1625], loss: 1.214, per_step_time: 1474ms, lr: 9.470769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:11,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.42556 samples/s/p 6:26:42 } +2024-07-25 18:41:13,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 516/ 1625], loss: 1.314, per_step_time: 1480ms, lr: 9.507692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:13,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.40219 samples/s/p 6:28:20 } +2024-07-25 18:41:16,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 518/ 1625], loss: 1.171, per_step_time: 1470ms, lr: 9.544615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:16,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.44155 samples/s/p 6:25:28 } +2024-07-25 18:41:19,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 520/ 1625], loss: 1.191, per_step_time: 1475ms, lr: 9.581538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:19,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.42016 samples/s/p 6:26:57 } +2024-07-25 18:41:22,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 522/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 9.618461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:22,832 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.43410 samples/s/p 6:25:54 } +2024-07-25 18:41:25,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 524/ 1625], loss: 0.990, per_step_time: 1471ms, lr: 9.655385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:25,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.43562 samples/s/p 6:25:45 } +2024-07-25 18:41:28,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 526/ 1625], loss: 1.433, per_step_time: 1472ms, lr: 9.692307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:28,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.43463 samples/s/p 6:25:46 } +2024-07-25 18:41:31,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 528/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 9.72923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:31,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.43936 samples/s/p 6:25:23 } +2024-07-25 18:41:34,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 530/ 1625], loss: 1.409, per_step_time: 1471ms, lr: 9.766153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:34,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43829 samples/s/p 6:25:24 } +2024-07-25 18:41:37,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 532/ 1625], loss: 1.187, per_step_time: 1470ms, lr: 9.803077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:37,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43991 samples/s/p 6:25:15 } +2024-07-25 18:41:40,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 534/ 1625], loss: 1.323, 
per_step_time: 1470ms, lr: 9.839999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:40,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.44082 samples/s/p 6:25:08 } +2024-07-25 18:41:43,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 536/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 9.876922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:43,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43631 samples/s/p 6:25:24 } +2024-07-25 18:41:46,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 538/ 1625], loss: 1.332, per_step_time: 1472ms, lr: 9.913846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:46,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43280 samples/s/p 6:25:36 } +2024-07-25 18:41:49,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 540/ 1625], loss: 1.340, per_step_time: 1471ms, lr: 9.950769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:49,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43833 samples/s/p 6:25:10 } +2024-07-25 18:41:52,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 542/ 1625], loss: 1.315, per_step_time: 1475ms, lr: 9.9876925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:52,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.42105 samples/s/p 6:26:20 } +2024-07-25 18:41:55,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 544/ 1625], loss: 1.386, per_step_time: 1472ms, lr: 1.0024614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:55,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43284 samples/s/p 6:25:27 } +2024-07-25 18:41:58,242 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 546/ 1625], loss: 1.357, per_step_time: 1472ms, lr: 1.0061538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:58,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43288 samples/s/p 6:25:24 } +2024-07-25 18:42:01,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 548/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 1.0098462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:01,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43319 samples/s/p 6:25:20 } +2024-07-25 18:42:04,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 550/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 1.0135384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:04,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43344 samples/s/p 6:25:16 } +2024-07-25 18:42:07,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 552/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 1.0172307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:07,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43621 samples/s/p 6:25:01 } +2024-07-25 18:42:10,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 554/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 1.020923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:10,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43557 samples/s/p 6:25:01 } +2024-07-25 18:42:12,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 556/ 1625], loss: 1.024, per_step_time: 1473ms, lr: 1.0246154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:13,000 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.42987 samples/s/p 6:25:22 } +2024-07-25 18:42:15,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 558/ 1625], loss: 1.404, per_step_time: 1472ms, lr: 1.0283077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:15,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43136 samples/s/p 6:25:13 } +2024-07-25 18:42:18,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 560/ 1625], loss: 1.367, per_step_time: 1472ms, lr: 1.0319999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:18,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43165 samples/s/p 6:25:08 } +2024-07-25 18:42:21,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 562/ 1625], loss: 1.342, per_step_time: 1472ms, lr: 1.0356923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:21,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43371 samples/s/p 6:24:57 } +2024-07-25 18:42:24,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 564/ 1625], loss: 1.162, per_step_time: 1470ms, lr: 1.03938455e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:24,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43995 samples/s/p 6:24:27 } +2024-07-25 18:42:27,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 566/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 1.0430769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:27,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43795 samples/s/p 6:24:33 } +2024-07-25 18:42:30,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 568/ 1625], loss: 
1.177, per_step_time: 1471ms, lr: 1.0467691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:30,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43635 samples/s/p 6:24:37 } +2024-07-25 18:42:33,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 570/ 1625], loss: 1.408, per_step_time: 1472ms, lr: 1.0504615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:33,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43230 samples/s/p 6:24:51 } +2024-07-25 18:42:36,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 572/ 1625], loss: 1.139, per_step_time: 1473ms, lr: 1.0541538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:36,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.42849 samples/s/p 6:25:04 } +2024-07-25 18:42:39,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 574/ 1625], loss: 1.327, per_step_time: 1472ms, lr: 1.0578461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:39,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43189 samples/s/p 6:24:47 } +2024-07-25 18:42:42,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 576/ 1625], loss: 1.260, per_step_time: 1474ms, lr: 1.0615384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:42,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.42714 samples/s/p 6:25:04 } +2024-07-25 18:42:45,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 578/ 1625], loss: 1.248, per_step_time: 1475ms, lr: 1.0652307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:45,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.42055 samples/s/p 6:25:29 } +2024-07-25 
18:42:48,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 580/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.068923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:48,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43404 samples/s/p 6:24:29 } +2024-07-25 18:42:51,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 582/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 1.0726154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:51,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43427 samples/s/p 6:24:25 } +2024-07-25 18:42:54,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 584/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 1.0763077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:54,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43599 samples/s/p 6:24:15 } +2024-07-25 18:42:57,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 586/ 1625], loss: 1.369, per_step_time: 1471ms, lr: 1.07999995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:57,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43786 samples/s/p 6:24:04 } +2024-07-25 18:43:00,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 588/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.0836922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:00,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43627 samples/s/p 6:24:08 } +2024-07-25 18:43:03,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 590/ 1625], loss: 1.279, per_step_time: 1473ms, lr: 1.0873846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:03,185 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43012 samples/s/p 6:24:31 } +2024-07-25 18:43:06,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 592/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 1.091077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:06,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43707 samples/s/p 6:23:58 } +2024-07-25 18:43:09,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 594/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 1.0947691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:09,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43222 samples/s/p 6:24:16 } +2024-07-25 18:43:12,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 596/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 1.0984615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:12,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.42857 samples/s/p 6:24:29 } +2024-07-25 18:43:14,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 598/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 1.1021538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:14,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43462 samples/s/p 6:24:00 } +2024-07-25 18:43:17,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 600/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 1.10584615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:17,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.42948 samples/s/p 6:24:19 } +2024-07-25 18:43:20,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 602/ 1625], loss: 
1.235, per_step_time: 1471ms, lr: 1.1095383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:20,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43677 samples/s/p 6:23:45 } +2024-07-25 18:43:23,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 604/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 1.1132307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:23,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43842 samples/s/p 6:23:35 } +2024-07-25 18:43:26,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 606/ 1625], loss: 1.288, per_step_time: 1471ms, lr: 1.1169231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:26,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43707 samples/s/p 6:23:38 } +2024-07-25 18:43:29,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 608/ 1625], loss: 1.268, per_step_time: 1472ms, lr: 1.1206153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:29,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43474 samples/s/p 6:23:45 } +2024-07-25 18:43:32,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 610/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 1.1243076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:32,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43698 samples/s/p 6:23:32 } +2024-07-25 18:43:35,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 612/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.1279999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:35,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43499 samples/s/p 6:23:38 } +2024-07-25 
18:43:38,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 614/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 1.1316923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:38,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43389 samples/s/p 6:23:39 } +2024-07-25 18:43:41,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 616/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.1353846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:41,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43634 samples/s/p 6:23:26 } +2024-07-25 18:43:44,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 618/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 1.1390768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:44,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43620 samples/s/p 6:23:24 } +2024-07-25 18:43:47,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 620/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 1.1427692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:47,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43255 samples/s/p 6:23:36 } +2024-07-25 18:43:50,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 622/ 1625], loss: 1.363, per_step_time: 1472ms, lr: 1.14646145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:50,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43334 samples/s/p 6:23:30 } +2024-07-25 18:43:53,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 624/ 1625], loss: 1.160, per_step_time: 1475ms, lr: 1.1501538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:53,361 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.42309 samples/s/p 6:24:11 } +2024-07-25 18:43:56,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 626/ 1625], loss: 1.219, per_step_time: 1470ms, lr: 1.1538462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:56,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.44012 samples/s/p 6:22:55 } +2024-07-25 18:43:59,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 628/ 1625], loss: 1.308, per_step_time: 1472ms, lr: 1.1575384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:59,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43472 samples/s/p 6:23:15 } +2024-07-25 18:44:02,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 630/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 1.1612307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:02,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43182 samples/s/p 6:23:25 } +2024-07-25 18:44:05,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 632/ 1625], loss: 1.094, per_step_time: 1476ms, lr: 1.164923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:05,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.41980 samples/s/p 6:24:13 } +2024-07-25 18:44:08,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 634/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 1.1686154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:08,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43464 samples/s/p 6:23:07 } +2024-07-25 18:44:11,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 636/ 1625], loss: 
1.196, per_step_time: 1471ms, lr: 1.1723076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:11,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43485 samples/s/p 6:23:03 } +2024-07-25 18:44:14,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 638/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 1.1759999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:14,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43440 samples/s/p 6:23:02 } +2024-07-25 18:44:16,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 640/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 1.1796923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:16,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.44126 samples/s/p 6:22:30 } +2024-07-25 18:44:19,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 642/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 1.1833846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:19,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.43484 samples/s/p 6:22:54 } +2024-07-25 18:44:22,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 644/ 1625], loss: 1.335, per_step_time: 1472ms, lr: 1.18707685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:22,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.43264 samples/s/p 6:23:01 } +2024-07-25 18:44:25,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 646/ 1625], loss: 1.225, per_step_time: 1470ms, lr: 1.1907691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:25,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.44047 samples/s/p 6:22:25 } +2024-07-25 
18:44:28,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 648/ 1625], loss: 1.067, per_step_time: 1471ms, lr: 1.1944615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:28,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.43690 samples/s/p 6:22:37 } +2024-07-25 18:44:31,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 650/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 1.1981539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:31,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43612 samples/s/p 6:22:37 } +2024-07-25 18:44:34,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 652/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 1.201846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:34,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43038 samples/s/p 6:22:58 } +2024-07-25 18:44:37,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 654/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 1.2055384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:37,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43369 samples/s/p 6:22:41 } +2024-07-25 18:44:40,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 656/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 1.2092307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:40,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43689 samples/s/p 6:22:25 } +2024-07-25 18:44:43,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 658/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 1.21292305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:43,532 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43298 samples/s/p 6:22:39 } +2024-07-25 18:44:46,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 660/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 1.2166153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:46,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43907 samples/s/p 6:22:10 } +2024-07-25 18:44:49,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 662/ 1625], loss: 1.351, per_step_time: 1473ms, lr: 1.2203076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:49,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.42959 samples/s/p 6:22:47 } +2024-07-25 18:44:52,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 664/ 1625], loss: 1.231, per_step_time: 1470ms, lr: 1.224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:52,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.44118 samples/s/p 6:21:55 } +2024-07-25 18:44:55,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 666/ 1625], loss: 1.153, per_step_time: 1474ms, lr: 1.22769225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:55,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.42548 samples/s/p 6:22:58 } +2024-07-25 18:44:58,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 668/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 1.2313846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:58,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43436 samples/s/p 6:22:18 } +2024-07-25 18:45:01,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 670/ 1625], 
loss: 1.173, per_step_time: 1472ms, lr: 1.2350769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:01,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43299 samples/s/p 6:22:21 } +2024-07-25 18:45:04,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 672/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 1.2387692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:04,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43174 samples/s/p 6:22:23 } +2024-07-25 18:45:07,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 674/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 1.2424615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:07,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43581 samples/s/p 6:22:03 } +2024-07-25 18:45:10,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 676/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 1.2461538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:10,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43185 samples/s/p 6:22:17 } +2024-07-25 18:45:13,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 678/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.2498461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:13,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43300 samples/s/p 6:22:09 } +2024-07-25 18:45:16,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 680/ 1625], loss: 1.174, per_step_time: 1481ms, lr: 1.2535384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:16,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.40079 samples/s/p 6:24:23 } 
+2024-07-25 18:45:18,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 682/ 1625], loss: 1.045, per_step_time: 1470ms, lr: 1.2572307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:18,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43893 samples/s/p 6:21:38 } +2024-07-25 18:45:21,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 684/ 1625], loss: 1.305, per_step_time: 1470ms, lr: 1.2609231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:21,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43908 samples/s/p 6:21:35 } +2024-07-25 18:45:24,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 686/ 1625], loss: 1.252, per_step_time: 1470ms, lr: 1.2646153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:24,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43879 samples/s/p 6:21:33 } +2024-07-25 18:45:27,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 688/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 1.2683076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:27,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43585 samples/s/p 6:21:42 } +2024-07-25 18:45:30,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 690/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.2719999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:30,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43524 samples/s/p 6:21:42 } +2024-07-25 18:45:33,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 692/ 1625], loss: 1.014, per_step_time: 1470ms, lr: 1.2756923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
18:45:33,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43891 samples/s/p 6:21:24 } +2024-07-25 18:45:36,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 694/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 1.2793846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:36,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.42891 samples/s/p 6:22:03 } +2024-07-25 18:45:39,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 696/ 1625], loss: 1.387, per_step_time: 1471ms, lr: 1.2830768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:39,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43653 samples/s/p 6:21:28 } +2024-07-25 18:45:42,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 698/ 1625], loss: 1.554, per_step_time: 1473ms, lr: 1.2867692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:42,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.42957 samples/s/p 6:21:54 } +2024-07-25 18:45:45,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 700/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 1.2904615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:45,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43844 samples/s/p 6:21:14 } +2024-07-25 18:45:48,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 702/ 1625], loss: 1.271, per_step_time: 1470ms, lr: 1.29415375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:48,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43984 samples/s/p 6:21:05 } +2024-07-25 18:45:51,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 704/ 1625], loss: 1.303, per_step_time: 1472ms, lr: 1.2978461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:51,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43166 samples/s/p 6:21:36 } +2024-07-25 18:45:54,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 706/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 1.3015384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:54,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43666 samples/s/p 6:21:12 } +2024-07-25 18:45:57,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 708/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 1.3052308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:57,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.42875 samples/s/p 6:21:43 } +2024-07-25 18:46:00,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 710/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 1.308923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:00,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43396 samples/s/p 6:21:18 } +2024-07-25 18:46:03,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 712/ 1625], loss: 1.294, per_step_time: 1472ms, lr: 1.3126153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:03,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43247 samples/s/p 6:21:21 } +2024-07-25 18:46:06,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 714/ 1625], loss: 1.334, per_step_time: 1472ms, lr: 1.3163076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:06,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43114 samples/s/p 
6:21:24 } +2024-07-25 18:46:09,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 716/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.32e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:09,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43718 samples/s/p 6:20:55 } +2024-07-25 18:46:12,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 718/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.3236923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:12,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43652 samples/s/p 6:20:55 } +2024-07-25 18:46:15,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 720/ 1625], loss: 1.106, per_step_time: 1474ms, lr: 1.3273845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:15,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.42718 samples/s/p 6:21:32 } +2024-07-25 18:46:17,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 722/ 1625], loss: 1.184, per_step_time: 1473ms, lr: 1.3310769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:17,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.42843 samples/s/p 6:21:23 } +2024-07-25 18:46:20,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 724/ 1625], loss: 1.268, per_step_time: 1473ms, lr: 1.33476915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:20,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.42765 samples/s/p 6:21:24 } +2024-07-25 18:46:23,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 726/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 1.3384615e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 18:46:23,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43677 samples/s/p 6:20:42 } +2024-07-25 18:46:26,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 728/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 1.3421538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:26,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43860 samples/s/p 6:20:32 } +2024-07-25 18:46:29,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 730/ 1625], loss: 1.048, per_step_time: 1470ms, lr: 1.3458461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:29,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43882 samples/s/p 6:20:28 } +2024-07-25 18:46:32,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 732/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 1.3495384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:32,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.42888 samples/s/p 6:21:07 } +2024-07-25 18:46:35,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 734/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.3532307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:35,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43510 samples/s/p 6:20:38 } +2024-07-25 18:46:38,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 736/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 1.356923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:38,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43674 samples/s/p 6:20:28 } +2024-07-25 18:46:41,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 
10], step:[ 738/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 1.36061535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:41,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43295 samples/s/p 6:20:41 } +2024-07-25 18:46:44,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 740/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 1.3643076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:44,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.42982 samples/s/p 6:20:51 } +2024-07-25 18:46:47,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 742/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 1.368e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:47,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43799 samples/s/p 6:20:14 } +2024-07-25 18:46:50,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 744/ 1625], loss: 1.380, per_step_time: 1472ms, lr: 1.3716922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:50,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43173 samples/s/p 6:20:37 } +2024-07-25 18:46:53,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 746/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 1.3753845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:53,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.44188 samples/s/p 6:19:52 } +2024-07-25 18:46:56,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 748/ 1625], loss: 1.283, per_step_time: 1472ms, lr: 1.3790768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:56,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43408 
samples/s/p 6:20:21 } +2024-07-25 18:46:59,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 750/ 1625], loss: 1.363, per_step_time: 1471ms, lr: 1.3827692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:59,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43506 samples/s/p 6:20:14 } +2024-07-25 18:47:02,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 752/ 1625], loss: 0.935, per_step_time: 1470ms, lr: 1.38646155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:02,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43869 samples/s/p 6:19:56 } +2024-07-25 18:47:05,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 754/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 1.3901537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:05,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43780 samples/s/p 6:19:57 } +2024-07-25 18:47:08,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 756/ 1625], loss: 1.103, per_step_time: 1471ms, lr: 1.3938461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:08,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43704 samples/s/p 6:19:57 } +2024-07-25 18:47:11,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 758/ 1625], loss: 1.241, per_step_time: 1480ms, lr: 1.3975384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:11,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.40279 samples/s/p 6:22:19 } +2024-07-25 18:47:14,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 760/ 1625], loss: 1.270, per_step_time: 1470ms, lr: 1.40123075e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 18:47:14,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.44094 samples/s/p 6:19:35 } +2024-07-25 18:47:17,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 762/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 1.404923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:17,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43279 samples/s/p 6:20:06 } +2024-07-25 18:47:19,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 764/ 1625], loss: 1.331, per_step_time: 1471ms, lr: 1.4086153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:19,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43552 samples/s/p 6:19:52 } +2024-07-25 18:47:22,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 766/ 1625], loss: 1.412, per_step_time: 1472ms, lr: 1.4123077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:22,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43391 samples/s/p 6:19:56 } +2024-07-25 18:47:25,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 768/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.4159999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:25,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43194 samples/s/p 6:20:01 } +2024-07-25 18:47:28,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 770/ 1625], loss: 1.398, per_step_time: 1473ms, lr: 1.4196922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:28,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.42757 samples/s/p 6:20:16 } +2024-07-25 18:47:31,790 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 1/ 10], step:[ 772/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.4233846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:31,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43238 samples/s/p 6:19:53 } +2024-07-25 18:47:34,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 774/ 1625], loss: 1.239, per_step_time: 1472ms, lr: 1.4270769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:34,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43328 samples/s/p 6:19:46 } +2024-07-25 18:47:37,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 776/ 1625], loss: 1.196, per_step_time: 1474ms, lr: 1.4307692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:37,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.42463 samples/s/p 6:20:20 } +2024-07-25 18:47:40,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 778/ 1625], loss: 1.310, per_step_time: 1472ms, lr: 1.4344614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:40,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43432 samples/s/p 6:19:36 } +2024-07-25 18:47:43,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 780/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 1.4381538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:43,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43805 samples/s/p 6:19:18 } +2024-07-25 18:47:46,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 782/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 1.44184605e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:46,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% 
|██ | 5.43388 samples/s/p 6:19:32 } +2024-07-25 18:47:49,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 784/ 1625], loss: 1.322, per_step_time: 1471ms, lr: 1.4455384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:49,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43542 samples/s/p 6:19:23 } +2024-07-25 18:47:52,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 786/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.4492307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:52,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43178 samples/s/p 6:19:35 } +2024-07-25 18:47:55,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 788/ 1625], loss: 1.232, per_step_time: 1477ms, lr: 1.452923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:55,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.41401 samples/s/p 6:20:47 } +2024-07-25 18:47:58,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 790/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 1.4566153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:58,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43221 samples/s/p 6:19:27 } +2024-07-25 18:48:01,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 792/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.4603076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:01,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43468 samples/s/p 6:19:14 } +2024-07-25 18:48:04,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 794/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 1.464e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:48:04,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.44132 samples/s/p 6:18:43 } +2024-07-25 18:48:07,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 796/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 1.4676923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:07,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43271 samples/s/p 6:19:16 } +2024-07-25 18:48:10,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 798/ 1625], loss: 1.349, per_step_time: 1473ms, lr: 1.4713845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:10,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43023 samples/s/p 6:19:24 } +2024-07-25 18:48:13,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 800/ 1625], loss: 1.090, per_step_time: 1470ms, lr: 1.4750769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:13,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.44187 samples/s/p 6:18:32 } +2024-07-25 18:48:16,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 802/ 1625], loss: 1.266, per_step_time: 1473ms, lr: 1.4787692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:16,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43099 samples/s/p 6:19:15 } +2024-07-25 18:48:19,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 804/ 1625], loss: 1.271, per_step_time: 1473ms, lr: 1.48246145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:19,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.42773 samples/s/p 6:19:26 } +2024-07-25 18:48:21,977 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 806/ 1625], loss: 1.011, per_step_time: 1470ms, lr: 1.4861538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:21,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43919 samples/s/p 6:18:35 } +2024-07-25 18:48:24,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 808/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.4898461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:24,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43475 samples/s/p 6:18:50 } +2024-07-25 18:48:27,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 810/ 1625], loss: 1.356, per_step_time: 1472ms, lr: 1.4935385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:27,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43296 samples/s/p 6:18:55 } +2024-07-25 18:48:30,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 812/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.4972306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:30,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43512 samples/s/p 6:18:43 } +2024-07-25 18:48:33,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 814/ 1625], loss: 1.210, per_step_time: 1471ms, lr: 1.500923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:33,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43672 samples/s/p 6:18:33 } +2024-07-25 18:48:36,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 816/ 1625], loss: 1.139, per_step_time: 1470ms, lr: 1.5046153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:36,730 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.44063 samples/s/p 6:18:14 } +2024-07-25 18:48:39,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 818/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 1.50830765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:39,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.42843 samples/s/p 6:19:02 } +2024-07-25 18:48:42,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 820/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 1.512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:42,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.42792 samples/s/p 6:19:01 } +2024-07-25 18:48:45,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 822/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.5156923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:45,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43489 samples/s/p 6:18:29 } +2024-07-25 18:48:48,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 824/ 1625], loss: 1.263, per_step_time: 1473ms, lr: 1.5193845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:48,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.42979 samples/s/p 6:18:47 } +2024-07-25 18:48:51,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 826/ 1625], loss: 1.060, per_step_time: 1470ms, lr: 1.52307675e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:51,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.44057 samples/s/p 6:17:59 } +2024-07-25 18:48:54,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 828/ 1625], 
loss: 1.136, per_step_time: 1473ms, lr: 1.5267691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:54,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43092 samples/s/p 6:18:37 } +2024-07-25 18:48:57,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 830/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.5304615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:57,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43431 samples/s/p 6:18:20 } +2024-07-25 18:49:00,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 832/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 1.5341539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:00,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43195 samples/s/p 6:18:27 } +2024-07-25 18:49:03,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 834/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 1.537846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:03,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43798 samples/s/p 6:17:59 } +2024-07-25 18:49:06,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 836/ 1625], loss: 1.266, per_step_time: 1473ms, lr: 1.5415384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:06,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.42962 samples/s/p 6:18:30 } +2024-07-25 18:49:09,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 838/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 1.5452308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:09,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43651 samples/s/p 6:17:59 } 
+2024-07-25 18:49:12,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 840/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 1.5489231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:12,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43290 samples/s/p 6:18:11 } +2024-07-25 18:49:15,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 842/ 1625], loss: 1.164, per_step_time: 1470ms, lr: 1.5526153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:15,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43853 samples/s/p 6:17:44 } +2024-07-25 18:49:18,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 844/ 1625], loss: 1.305, per_step_time: 1471ms, lr: 1.5563075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:18,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43653 samples/s/p 6:17:50 } +2024-07-25 18:49:21,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 846/ 1625], loss: 1.285, per_step_time: 1471ms, lr: 1.5599999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:21,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43761 samples/s/p 6:17:42 } +2024-07-25 18:49:23,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 848/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 1.5636922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:23,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43585 samples/s/p 6:17:47 } +2024-07-25 18:49:26,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 850/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 1.5673846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
18:49:26,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43470 samples/s/p 6:17:49 } +2024-07-25 18:49:29,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 852/ 1625], loss: 1.398, per_step_time: 1470ms, lr: 1.571077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:29,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43996 samples/s/p 6:17:24 } +2024-07-25 18:49:32,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 854/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 1.5747692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:32,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.43181 samples/s/p 6:17:55 } +2024-07-25 18:49:35,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 856/ 1625], loss: 1.182, per_step_time: 1473ms, lr: 1.5784615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:35,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.42794 samples/s/p 6:18:08 } +2024-07-25 18:49:38,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 858/ 1625], loss: 1.099, per_step_time: 1470ms, lr: 1.5821537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:38,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.44155 samples/s/p 6:17:08 } +2024-07-25 18:49:41,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 860/ 1625], loss: 1.126, per_step_time: 1469ms, lr: 1.585846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:41,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.44532 samples/s/p 6:16:50 } +2024-07-25 18:49:44,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
862/ 1625], loss: 1.296, per_step_time: 1479ms, lr: 1.5895384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:44,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.40553 samples/s/p 6:19:33 } +2024-07-25 18:49:47,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 864/ 1625], loss: 1.288, per_step_time: 1473ms, lr: 1.5932306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:47,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.42858 samples/s/p 6:17:54 } +2024-07-25 18:49:50,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 866/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 1.596923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:50,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.43264 samples/s/p 6:17:34 } +2024-07-25 18:49:53,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 868/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.6006154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:53,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.43613 samples/s/p 6:17:16 } +2024-07-25 18:49:56,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 870/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 1.6043077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:56,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43944 samples/s/p 6:16:59 } +2024-07-25 18:49:59,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 872/ 1625], loss: 1.030, per_step_time: 1472ms, lr: 1.608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:59,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43386 samples/s/p 6:17:20 } 
+2024-07-25 18:50:02,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 874/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.6116921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:02,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43393 samples/s/p 6:17:17 } +2024-07-25 18:50:05,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 876/ 1625], loss: 1.141, per_step_time: 1469ms, lr: 1.6153845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:05,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.44223 samples/s/p 6:16:39 } +2024-07-25 18:50:08,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 878/ 1625], loss: 1.306, per_step_time: 1473ms, lr: 1.6190768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:08,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.42803 samples/s/p 6:17:35 } +2024-07-25 18:50:11,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 880/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 1.6227692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:11,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43105 samples/s/p 6:17:20 } +2024-07-25 18:50:14,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 882/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 1.6264614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:14,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.44025 samples/s/p 6:16:38 } +2024-07-25 18:50:17,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 884/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 1.6301537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
18:50:17,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43285 samples/s/p 6:17:06 } +2024-07-25 18:50:20,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 886/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 1.6338461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:20,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.44137 samples/s/p 6:16:28 } +2024-07-25 18:50:22,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 888/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 1.6375385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:22,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.42898 samples/s/p 6:17:17 } +2024-07-25 18:50:25,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 890/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 1.6412308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:25,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43492 samples/s/p 6:16:49 } +2024-07-25 18:50:28,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 892/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 1.6449228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:28,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43756 samples/s/p 6:16:35 } +2024-07-25 18:50:31,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 894/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 1.6486152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:31,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43196 samples/s/p 6:16:55 } +2024-07-25 18:50:34,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 896/ 1625], loss: 1.447, per_step_time: 1474ms, lr: 1.6523076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:34,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.42425 samples/s/p 6:17:24 } +2024-07-25 18:50:37,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 898/ 1625], loss: 1.452, per_step_time: 1472ms, lr: 1.656e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:37,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43475 samples/s/p 6:16:38 } +2024-07-25 18:50:40,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 900/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 1.6596923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:40,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43479 samples/s/p 6:16:35 } +2024-07-25 18:50:43,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 902/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 1.6633845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:43,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43376 samples/s/p 6:16:36 } +2024-07-25 18:50:46,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 904/ 1625], loss: 1.327, per_step_time: 1470ms, lr: 1.6670769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:46,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43943 samples/s/p 6:16:10 } +2024-07-25 18:50:49,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 906/ 1625], loss: 1.376, per_step_time: 1470ms, lr: 1.6707692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:49,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43960 samples/s/p 
6:16:06 } +2024-07-25 18:50:52,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 908/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.6744614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:52,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43845 samples/s/p 6:16:08 } +2024-07-25 18:50:55,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 910/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.6781538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:55,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43345 samples/s/p 6:16:26 } +2024-07-25 18:50:58,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 912/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 1.681846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:58,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43565 samples/s/p 6:16:13 } +2024-07-25 18:51:01,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 914/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 1.6855383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:01,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43894 samples/s/p 6:15:57 } +2024-07-25 18:51:04,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 916/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 1.6892307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:04,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43166 samples/s/p 6:16:24 } +2024-07-25 18:51:07,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 918/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 1.692923e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 18:51:07,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43603 samples/s/p 6:16:03 } +2024-07-25 18:51:10,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 920/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 1.6966154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:10,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43148 samples/s/p 6:16:19 } +2024-07-25 18:51:13,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 922/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 1.7003076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:13,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43614 samples/s/p 6:15:57 } +2024-07-25 18:51:16,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 924/ 1625], loss: 1.219, per_step_time: 1473ms, lr: 1.704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:16,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43051 samples/s/p 6:16:17 } +2024-07-25 18:51:19,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 926/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 1.7076922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:19,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43786 samples/s/p 6:15:44 } +2024-07-25 18:51:22,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 928/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 1.7113845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:22,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43562 samples/s/p 6:15:50 } +2024-07-25 18:51:24,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 
10], step:[ 930/ 1625], loss: 1.207, per_step_time: 1470ms, lr: 1.7150769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:24,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43975 samples/s/p 6:15:30 } +2024-07-25 18:51:27,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 932/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 1.718769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:27,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43855 samples/s/p 6:15:32 } +2024-07-25 18:51:30,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 934/ 1625], loss: 1.250, per_step_time: 1471ms, lr: 1.7224615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:30,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43678 samples/s/p 6:15:36 } +2024-07-25 18:51:33,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 936/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 1.7261538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:33,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43372 samples/s/p 6:15:46 } +2024-07-25 18:51:36,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 938/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.7298462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:36,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43148 samples/s/p 6:15:52 } +2024-07-25 18:51:39,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 940/ 1625], loss: 1.385, per_step_time: 1471ms, lr: 1.7335384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:39,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43508 
samples/s/p 6:15:35 } +2024-07-25 18:51:42,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 942/ 1625], loss: 1.062, per_step_time: 1470ms, lr: 1.7372306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:42,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43860 samples/s/p 6:15:17 } +2024-07-25 18:51:45,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 944/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 1.740923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:45,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43565 samples/s/p 6:15:26 } +2024-07-25 18:51:48,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 946/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 1.7446153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:48,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43444 samples/s/p 6:15:28 } +2024-07-25 18:51:51,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 948/ 1625], loss: 1.122, per_step_time: 1473ms, lr: 1.7483077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:51,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.42880 samples/s/p 6:15:49 } +2024-07-25 18:51:54,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 950/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 1.7519998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:54,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.42899 samples/s/p 6:15:45 } +2024-07-25 18:51:57,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 952/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 1.7556922e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 18:51:57,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.44111 samples/s/p 6:14:52 } +2024-07-25 18:52:00,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 954/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.7593846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:00,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43247 samples/s/p 6:15:25 } +2024-07-25 18:52:03,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 956/ 1625], loss: 1.166, per_step_time: 1470ms, lr: 1.763077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:03,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43858 samples/s/p 6:14:57 } +2024-07-25 18:52:06,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 958/ 1625], loss: 1.321, per_step_time: 1471ms, lr: 1.7667691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:06,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43484 samples/s/p 6:15:09 } +2024-07-25 18:52:09,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 960/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 1.7704613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:09,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43007 samples/s/p 6:15:26 } +2024-07-25 18:52:12,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 962/ 1625], loss: 0.985, per_step_time: 1471ms, lr: 1.7741537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:12,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43792 samples/s/p 6:14:50 } +2024-07-25 18:52:15,122 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 1/ 10], step:[ 964/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 1.777846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:15,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43314 samples/s/p 6:15:07 } +2024-07-25 18:52:18,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 966/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.7815384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:18,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43444 samples/s/p 6:14:59 } +2024-07-25 18:52:21,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 968/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 1.7852308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:21,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.43659 samples/s/p 6:14:47 } +2024-07-25 18:52:23,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 970/ 1625], loss: 1.283, per_step_time: 1472ms, lr: 1.788923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:23,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.43241 samples/s/p 6:15:01 } +2024-07-25 18:52:26,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 972/ 1625], loss: 1.208, per_step_time: 1473ms, lr: 1.7926153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:26,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.42968 samples/s/p 6:15:10 } +2024-07-25 18:52:29,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 974/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 1.7963077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:29,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ 
| 5.43057 samples/s/p 6:15:03 } +2024-07-25 18:52:32,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 976/ 1625], loss: 1.237, per_step_time: 1473ms, lr: 1.7999999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:32,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.43078 samples/s/p 6:14:59 } +2024-07-25 18:52:35,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 978/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 1.8036922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:35,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.44138 samples/s/p 6:14:13 } +2024-07-25 18:52:38,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 980/ 1625], loss: 1.142, per_step_time: 1482ms, lr: 1.8073844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:38,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.39639 samples/s/p 6:17:17 } +2024-07-25 18:52:41,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 982/ 1625], loss: 1.345, per_step_time: 1473ms, lr: 1.8110768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:41,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.43019 samples/s/p 6:14:53 } +2024-07-25 18:52:44,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 984/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 1.8147692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:44,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43552 samples/s/p 6:14:28 } +2024-07-25 18:52:47,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 986/ 1625], loss: 1.310, per_step_time: 1470ms, lr: 1.8184615e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:52:47,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43972 samples/s/p 6:14:08 } +2024-07-25 18:52:50,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 988/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 1.8221539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:50,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43488 samples/s/p 6:14:25 } +2024-07-25 18:52:53,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 990/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 1.825846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:53,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43344 samples/s/p 6:14:28 } +2024-07-25 18:52:56,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 992/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 1.8295383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:56,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43313 samples/s/p 6:14:26 } +2024-07-25 18:52:59,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 994/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.8332306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:59,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43736 samples/s/p 6:14:06 } +2024-07-25 18:53:02,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 996/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 1.836923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:02,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43010 samples/s/p 6:14:33 } +2024-07-25 18:53:05,317 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 998/ 1625], loss: 1.314, per_step_time: 1471ms, lr: 1.8406154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:05,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43707 samples/s/p 6:14:01 } +2024-07-25 18:53:08,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1000/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 1.8443076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:08,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43874 samples/s/p 6:13:51 } +2024-07-25 18:53:11,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1002/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 1.848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:11,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43327 samples/s/p 6:14:11 } +2024-07-25 18:53:14,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1004/ 1625], loss: 1.311, per_step_time: 1474ms, lr: 1.8516923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:14,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.42697 samples/s/p 6:14:34 } +2024-07-25 18:53:17,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1006/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 1.8553847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:17,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43210 samples/s/p 6:14:10 } +2024-07-25 18:53:20,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1008/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 1.859077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:20,077 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43338 samples/s/p 6:14:02 } +2024-07-25 18:53:23,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1010/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 1.862769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:23,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43542 samples/s/p 6:13:50 } +2024-07-25 18:53:25,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1012/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 1.8664614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:25,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43966 samples/s/p 6:13:30 } +2024-07-25 18:53:28,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1014/ 1625], loss: 1.070, per_step_time: 1469ms, lr: 1.8701538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:28,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.44272 samples/s/p 6:13:14 } +2024-07-25 18:53:31,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1016/ 1625], loss: 1.289, per_step_time: 1471ms, lr: 1.8738461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:31,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43836 samples/s/p 6:13:29 } +2024-07-25 18:53:34,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1018/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 1.8775383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:34,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43075 samples/s/p 6:13:58 } +2024-07-25 18:53:37,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1020/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 1.8812307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:37,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43691 samples/s/p 6:13:29 } +2024-07-25 18:53:40,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1022/ 1625], loss: 1.230, per_step_time: 1473ms, lr: 1.884923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:40,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43015 samples/s/p 6:13:54 } +2024-07-25 18:53:43,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1024/ 1625], loss: 1.329, per_step_time: 1473ms, lr: 1.8886154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:43,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43092 samples/s/p 6:13:48 } +2024-07-25 18:53:46,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1026/ 1625], loss: 1.394, per_step_time: 1470ms, lr: 1.8923076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:46,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.44001 samples/s/p 6:13:08 } +2024-07-25 18:53:49,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1028/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 1.8959998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:49,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43859 samples/s/p 6:13:11 } +2024-07-25 18:53:52,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1030/ 1625], loss: 1.047, per_step_time: 1471ms, lr: 1.8996921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:52,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43643 
samples/s/p 6:13:17 } +2024-07-25 18:53:55,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1032/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.9033845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:55,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.43500 samples/s/p 6:13:19 } +2024-07-25 18:53:58,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1034/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 1.9070769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:58,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.43688 samples/s/p 6:13:09 } +2024-07-25 18:54:01,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1036/ 1625], loss: 1.235, per_step_time: 1477ms, lr: 1.9107692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:01,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.41592 samples/s/p 6:14:33 } +2024-07-25 18:54:04,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1038/ 1625], loss: 1.303, per_step_time: 1474ms, lr: 1.9144614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:04,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.42396 samples/s/p 6:13:56 } +2024-07-25 18:54:07,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1040/ 1625], loss: 1.367, per_step_time: 1473ms, lr: 1.9181538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:07,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.42955 samples/s/p 6:13:30 } +2024-07-25 18:54:10,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1042/ 1625], loss: 1.212, per_step_time: 1472ms, lr: 1.921846e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:54:10,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.43159 samples/s/p 6:13:19 } +2024-07-25 18:54:13,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1044/ 1625], loss: 1.122, per_step_time: 1474ms, lr: 1.9255383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:13,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.42689 samples/s/p 6:13:35 } +2024-07-25 18:54:16,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1046/ 1625], loss: 1.060, per_step_time: 1473ms, lr: 1.9292307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:16,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.42992 samples/s/p 6:13:20 } +2024-07-25 18:54:19,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1048/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.9329229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:19,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.43601 samples/s/p 6:12:52 } +2024-07-25 18:54:22,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1050/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 1.9366153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:22,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.43669 samples/s/p 6:12:46 } +2024-07-25 18:54:25,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1052/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.9403076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:25,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.43536 samples/s/p 6:12:49 } +2024-07-25 18:54:27,969 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1054/ 1625], loss: 1.456, per_step_time: 1473ms, lr: 1.944e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:27,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.43064 samples/s/p 6:13:05 } +2024-07-25 18:54:30,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1056/ 1625], loss: 0.973, per_step_time: 1473ms, lr: 1.9476924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:30,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.42781 samples/s/p 6:13:14 } +2024-07-25 18:54:33,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1058/ 1625], loss: 1.146, per_step_time: 1470ms, lr: 1.9513845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:33,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.44186 samples/s/p 6:12:13 } +2024-07-25 18:54:36,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1060/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 1.9550767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.44097 samples/s/p 6:12:14 } +2024-07-25 18:54:39,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1062/ 1625], loss: 1.185, per_step_time: 1474ms, lr: 1.9587691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:39,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.42494 samples/s/p 6:13:17 } +2024-07-25 18:54:42,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1064/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 1.9624615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:42,726 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.43527 samples/s/p 6:12:31 } +2024-07-25 18:54:45,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1066/ 1625], loss: 1.312, per_step_time: 1470ms, lr: 1.9661538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:45,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43908 samples/s/p 6:12:13 } +2024-07-25 18:54:48,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1068/ 1625], loss: 1.103, per_step_time: 1473ms, lr: 1.969846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:48,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.42934 samples/s/p 6:12:50 } +2024-07-25 18:54:51,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1070/ 1625], loss: 1.237, per_step_time: 1470ms, lr: 1.9735384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:51,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.44004 samples/s/p 6:12:03 } +2024-07-25 18:54:54,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1072/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 1.9772307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:54,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43415 samples/s/p 6:12:24 } +2024-07-25 18:54:57,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1074/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.9809231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:57,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43655 samples/s/p 6:12:11 } +2024-07-25 18:55:00,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1076/ 1625], loss: 1.013, per_step_time: 1471ms, lr: 1.9846153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:00,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43645 samples/s/p 6:12:09 } +2024-07-25 18:55:03,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1078/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 1.9883075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:03,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43108 samples/s/p 6:12:28 } +2024-07-25 18:55:06,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1080/ 1625], loss: 1.101, per_step_time: 1472ms, lr: 1.9919999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:06,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43403 samples/s/p 6:12:13 } +2024-07-25 18:55:09,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1082/ 1625], loss: 1.403, per_step_time: 1472ms, lr: 1.9956922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:09,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43239 samples/s/p 6:12:17 } +2024-07-25 18:55:12,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1084/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 1.9993846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:12,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43337 samples/s/p 6:12:10 } +2024-07-25 18:55:15,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1086/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 2.0030768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:15,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.42838 
samples/s/p 6:12:27 } +2024-07-25 18:55:18,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1088/ 1625], loss: 1.225, per_step_time: 1474ms, lr: 2.0067691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:18,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.42596 samples/s/p 6:12:34 } +2024-07-25 18:55:21,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1090/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 2.0104615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:21,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43014 samples/s/p 6:12:14 } +2024-07-25 18:55:24,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1092/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 2.0141539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:24,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43771 samples/s/p 6:11:40 } +2024-07-25 18:55:27,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1094/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 2.017846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:27,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43030 samples/s/p 6:12:08 } +2024-07-25 18:55:29,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1096/ 1625], loss: 1.179, per_step_time: 1474ms, lr: 2.0215382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:29,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.42671 samples/s/p 6:12:19 } +2024-07-25 18:55:32,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1098/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.0252306e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:55:32,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43643 samples/s/p 6:11:36 } +2024-07-25 18:55:35,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1100/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 2.028923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:35,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43275 samples/s/p 6:11:49 } +2024-07-25 18:55:38,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1102/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.0326153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:38,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43439 samples/s/p 6:11:39 } +2024-07-25 18:55:41,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1104/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 2.0363077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:41,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.44082 samples/s/p 6:11:10 } +2024-07-25 18:55:44,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1106/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 2.0399999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:44,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43321 samples/s/p 6:11:38 } +2024-07-25 18:55:47,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1108/ 1625], loss: 1.259, per_step_time: 1477ms, lr: 2.0436923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:47,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.41526 samples/s/p 6:12:49 } +2024-07-25 18:55:50,626 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1110/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 2.0473844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:50,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43281 samples/s/p 6:11:34 } +2024-07-25 18:55:53,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1112/ 1625], loss: 1.234, per_step_time: 1473ms, lr: 2.0510768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:53,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43045 samples/s/p 6:11:40 } +2024-07-25 18:55:56,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1114/ 1625], loss: 1.048, per_step_time: 1473ms, lr: 2.0547692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:56,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.42766 samples/s/p 6:11:49 } +2024-07-25 18:55:59,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1116/ 1625], loss: 1.025, per_step_time: 1472ms, lr: 2.0584614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:59,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.43342 samples/s/p 6:11:22 } +2024-07-25 18:56:02,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1118/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.0621537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:02,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.43325 samples/s/p 6:11:20 } +2024-07-25 18:56:05,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1120/ 1625], loss: 1.177, per_step_time: 1474ms, lr: 2.0658461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:05,394 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.42708 samples/s/p 6:11:42 } +2024-07-25 18:56:08,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1122/ 1625], loss: 1.272, per_step_time: 1475ms, lr: 2.0695385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:08,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.42137 samples/s/p 6:12:03 } +2024-07-25 18:56:11,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1124/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.0732308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:11,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.43729 samples/s/p 6:10:55 } +2024-07-25 18:56:14,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1126/ 1625], loss: 1.313, per_step_time: 1471ms, lr: 2.0769228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:14,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.43588 samples/s/p 6:10:58 } +2024-07-25 18:56:17,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1128/ 1625], loss: 1.227, per_step_time: 1473ms, lr: 2.0806152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:17,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.42940 samples/s/p 6:11:21 } +2024-07-25 18:56:20,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1130/ 1625], loss: 1.084, per_step_time: 1470ms, lr: 2.0843076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:20,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43924 samples/s/p 6:10:38 } +2024-07-25 18:56:23,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1132/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 2.088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:23,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43597 samples/s/p 6:10:48 } +2024-07-25 18:56:26,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1134/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.0916923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:26,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43486 samples/s/p 6:10:50 } +2024-07-25 18:56:29,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1136/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 2.0953845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:29,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43227 samples/s/p 6:10:58 } +2024-07-25 18:56:31,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1138/ 1625], loss: 1.278, per_step_time: 1473ms, lr: 2.0990768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:31,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43061 samples/s/p 6:11:01 } +2024-07-25 18:56:34,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1140/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 2.1027692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:34,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43534 samples/s/p 6:10:39 } +2024-07-25 18:56:37,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1142/ 1625], loss: 1.185, per_step_time: 1473ms, lr: 2.1064616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:37,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.42766 samples/s/p 
6:11:08 } +2024-07-25 18:56:40,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1144/ 1625], loss: 1.341, per_step_time: 1474ms, lr: 2.1101538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:40,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.42595 samples/s/p 6:11:12 } +2024-07-25 18:56:43,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1146/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 2.113846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:43,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43435 samples/s/p 6:10:34 } +2024-07-25 18:56:46,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1148/ 1625], loss: 1.299, per_step_time: 1473ms, lr: 2.1175383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:46,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.42862 samples/s/p 6:10:55 } +2024-07-25 18:56:49,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1150/ 1625], loss: 1.231, per_step_time: 1473ms, lr: 2.1212307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:49,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.42966 samples/s/p 6:10:48 } +2024-07-25 18:56:52,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1152/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.124923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:52,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43283 samples/s/p 6:10:32 } +2024-07-25 18:56:55,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1154/ 1625], loss: 0.892, per_step_time: 1471ms, lr: 2.1286154e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 18:56:55,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43764 samples/s/p 6:10:09 } +2024-07-25 18:56:58,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1156/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 2.1323076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:58,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43286 samples/s/p 6:10:26 } +2024-07-25 18:57:01,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1158/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:01,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43197 samples/s/p 6:10:26 } +2024-07-25 18:57:04,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1160/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 2.1396922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:04,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43289 samples/s/p 6:10:20 } +2024-07-25 18:57:07,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1162/ 1625], loss: 1.084, per_step_time: 1469ms, lr: 2.1433845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:07,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.44465 samples/s/p 6:09:29 } +2024-07-25 18:57:10,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1164/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 2.1470767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:10,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43708 samples/s/p 6:09:57 } +2024-07-25 18:57:13,287 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1166/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.150769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:13,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43204 samples/s/p 6:10:14 } +2024-07-25 18:57:16,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1168/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 2.1544614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:16,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43561 samples/s/p 6:09:57 } +2024-07-25 18:57:19,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1170/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.1581538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:19,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43538 samples/s/p 6:09:55 } +2024-07-25 18:57:22,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1172/ 1625], loss: 1.240, per_step_time: 1476ms, lr: 2.1618462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:22,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.41793 samples/s/p 6:11:03 } +2024-07-25 18:57:25,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1174/ 1625], loss: 1.450, per_step_time: 1471ms, lr: 2.1655384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:25,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43832 samples/s/p 6:09:37 } +2024-07-25 18:57:28,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1176/ 1625], loss: 1.208, per_step_time: 1473ms, lr: 2.1692307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:28,052 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.42977 samples/s/p 6:10:09 } +2024-07-25 18:57:31,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1178/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 2.1729229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:31,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43566 samples/s/p 6:09:42 } +2024-07-25 18:57:33,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1180/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 2.1766153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:33,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.43353 samples/s/p 6:09:48 } +2024-07-25 18:57:36,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1182/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.1803076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:36,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.43763 samples/s/p 6:09:28 } +2024-07-25 18:57:39,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1184/ 1625], loss: 1.212, per_step_time: 1473ms, lr: 2.1839998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:39,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.42748 samples/s/p 6:10:06 } +2024-07-25 18:57:42,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1186/ 1625], loss: 1.256, per_step_time: 1473ms, lr: 2.1876922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:42,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.43069 samples/s/p 6:09:50 } +2024-07-25 18:57:45,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1188/ 1625], loss: 1.028, per_step_time: 1475ms, lr: 2.1913846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:45,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.42189 samples/s/p 6:10:23 } +2024-07-25 18:57:48,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1190/ 1625], loss: 1.326, per_step_time: 1470ms, lr: 2.195077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:48,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.44111 samples/s/p 6:09:02 } +2024-07-25 18:57:51,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1192/ 1625], loss: 1.019, per_step_time: 1474ms, lr: 2.1987693e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:51,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.42524 samples/s/p 6:10:04 } +2024-07-25 18:57:54,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1194/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 2.2024613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:54,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.43366 samples/s/p 6:09:27 } +2024-07-25 18:57:57,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1196/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 2.2061537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:57,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43730 samples/s/p 6:09:09 } +2024-07-25 18:58:00,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1198/ 1625], loss: 0.908, per_step_time: 1471ms, lr: 2.209846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:00,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43755 
samples/s/p 6:09:05 } +2024-07-25 18:58:03,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1200/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 2.2135384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:03,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43613 samples/s/p 6:09:08 } +2024-07-25 18:58:06,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1202/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 2.2172308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:06,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43130 samples/s/p 6:09:24 } +2024-07-25 18:58:09,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1204/ 1625], loss: 0.968, per_step_time: 1473ms, lr: 2.220923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:09,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.42956 samples/s/p 6:09:28 } +2024-07-25 18:58:12,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1206/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 2.2246153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:12,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43503 samples/s/p 6:09:03 } +2024-07-25 18:58:15,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1208/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.2283077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:15,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43263 samples/s/p 6:09:10 } +2024-07-25 18:58:18,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1210/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 2.2319999e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:58:18,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43329 samples/s/p 6:09:04 } +2024-07-25 18:58:21,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1212/ 1625], loss: 1.206, per_step_time: 1470ms, lr: 2.2356922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:21,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.44107 samples/s/p 6:08:30 } +2024-07-25 18:58:24,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1214/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 2.2393844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:24,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43331 samples/s/p 6:08:59 } +2024-07-25 18:58:27,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1216/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 2.2430768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:27,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43847 samples/s/p 6:08:35 } +2024-07-25 18:58:30,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1218/ 1625], loss: 1.323, per_step_time: 1472ms, lr: 2.2467691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:30,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43425 samples/s/p 6:08:49 } +2024-07-25 18:58:32,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1220/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 2.2504615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:32,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43816 samples/s/p 6:08:30 } +2024-07-25 18:58:35,935 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1222/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 2.2541539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:35,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43513 samples/s/p 6:08:39 } +2024-07-25 18:58:38,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1224/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 2.257846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:38,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.42923 samples/s/p 6:09:00 } +2024-07-25 18:58:41,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1226/ 1625], loss: 1.000, per_step_time: 1471ms, lr: 2.2615384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:41,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43616 samples/s/p 6:08:29 } +2024-07-25 18:58:44,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1228/ 1625], loss: 0.934, per_step_time: 1471ms, lr: 2.2652306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:44,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43517 samples/s/p 6:08:30 } +2024-07-25 18:58:47,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1230/ 1625], loss: 1.198, per_step_time: 1474ms, lr: 2.268923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:47,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.42546 samples/s/p 6:09:07 } +2024-07-25 18:58:50,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1232/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 2.2726152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:50,698 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43337 samples/s/p 6:08:32 } +2024-07-25 18:58:53,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1234/ 1625], loss: 1.409, per_step_time: 1472ms, lr: 2.2763075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:53,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43477 samples/s/p 6:08:23 } +2024-07-25 18:58:56,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1236/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.2799999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:56,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43817 samples/s/p 6:08:06 } +2024-07-25 18:58:59,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1238/ 1625], loss: 1.015, per_step_time: 1471ms, lr: 2.2836923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:59,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43560 samples/s/p 6:08:14 } +2024-07-25 18:59:02,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1240/ 1625], loss: 1.335, per_step_time: 1470ms, lr: 2.2873846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:02,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43853 samples/s/p 6:07:59 } +2024-07-25 18:59:05,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1242/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.2910768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:05,448 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43667 samples/s/p 6:08:04 } +2024-07-25 18:59:08,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1244/ 1625], loss: 1.240, per_step_time: 1470ms, lr: 2.294769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:08,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.44105 samples/s/p 6:07:43 } +2024-07-25 18:59:11,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1246/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.2984614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:11,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.42906 samples/s/p 6:08:29 } +2024-07-25 18:59:14,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1248/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 2.3021537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:14,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43338 samples/s/p 6:08:08 } +2024-07-25 18:59:17,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1250/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.3058461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:17,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43569 samples/s/p 6:07:56 } +2024-07-25 18:59:20,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1252/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.3095383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:20,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43465 samples/s/p 6:07:57 } +2024-07-25 18:59:23,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1254/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 2.3132307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:23,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43607 
samples/s/p 6:07:48 } +2024-07-25 18:59:26,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1256/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 2.316923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:26,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43226 samples/s/p 6:08:01 } +2024-07-25 18:59:29,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1258/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.3206154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:29,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43512 samples/s/p 6:07:46 } +2024-07-25 18:59:32,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1260/ 1625], loss: 1.298, per_step_time: 1474ms, lr: 2.3243078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:32,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.42572 samples/s/p 6:08:22 } +2024-07-25 18:59:34,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1262/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.3279998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:34,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.42901 samples/s/p 6:08:05 } +2024-07-25 18:59:37,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1264/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.3316921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:37,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43604 samples/s/p 6:07:34 } +2024-07-25 18:59:40,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1266/ 1625], loss: 1.196, per_step_time: 1470ms, lr: 2.3353845e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:59:40,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43958 samples/s/p 6:07:16 } +2024-07-25 18:59:43,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1268/ 1625], loss: 1.083, per_step_time: 1470ms, lr: 2.3390769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:43,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43870 samples/s/p 6:07:17 } +2024-07-25 18:59:46,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1270/ 1625], loss: 1.068, per_step_time: 1472ms, lr: 2.3427692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:46,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43428 samples/s/p 6:07:32 } +2024-07-25 18:59:49,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1272/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.3464614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:49,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43534 samples/s/p 6:07:25 } +2024-07-25 18:59:52,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1274/ 1625], loss: 1.147, per_step_time: 1473ms, lr: 2.3501538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:52,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.42954 samples/s/p 6:07:45 } +2024-07-25 18:59:55,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1276/ 1625], loss: 1.259, per_step_time: 1475ms, lr: 2.3538461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:55,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.42209 samples/s/p 6:08:13 } +2024-07-25 18:59:58,576 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1278/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 2.3575383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:58,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.44071 samples/s/p 6:06:54 } +2024-07-25 19:00:01,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1280/ 1625], loss: 1.207, per_step_time: 1470ms, lr: 2.3612307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:01,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.44040 samples/s/p 6:06:53 } +2024-07-25 19:00:04,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1282/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 2.3649229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:04,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.43195 samples/s/p 6:07:24 } +2024-07-25 19:00:07,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1284/ 1625], loss: 0.973, per_step_time: 1470ms, lr: 2.3686152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:07,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.43849 samples/s/p 6:06:54 } +2024-07-25 19:00:10,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1286/ 1625], loss: 0.877, per_step_time: 1471ms, lr: 2.3723076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:10,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.43560 samples/s/p 6:07:03 } +2024-07-25 19:00:13,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1288/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 2.376e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:13,327 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.43599 samples/s/p 6:06:59 } +2024-07-25 19:00:16,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1290/ 1625], loss: 1.248, per_step_time: 1473ms, lr: 2.3796923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:16,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.42933 samples/s/p 6:07:23 } +2024-07-25 19:00:19,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1292/ 1625], loss: 1.250, per_step_time: 1473ms, lr: 2.3833845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:19,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.43035 samples/s/p 6:07:16 } +2024-07-25 19:00:22,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1294/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 2.3870767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:22,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.43137 samples/s/p 6:07:09 } +2024-07-25 19:00:25,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1296/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 2.390769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:25,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.43790 samples/s/p 6:06:39 } +2024-07-25 19:00:28,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1298/ 1625], loss: 1.293, per_step_time: 1471ms, lr: 2.3944614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:28,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.43750 samples/s/p 6:06:38 } +2024-07-25 19:00:31,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1300/ 1625], loss: 1.028, per_step_time: 1469ms, lr: 2.3981538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:31,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.44437 samples/s/p 6:06:07 } +2024-07-25 19:00:33,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1302/ 1625], loss: 1.347, per_step_time: 1473ms, lr: 2.401846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:33,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.43104 samples/s/p 6:06:58 } +2024-07-25 19:00:36,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1304/ 1625], loss: 1.201, per_step_time: 1475ms, lr: 2.4055384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:36,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.42348 samples/s/p 6:07:26 } +2024-07-25 19:00:39,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1306/ 1625], loss: 1.377, per_step_time: 1472ms, lr: 2.4092307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:39,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.43233 samples/s/p 6:06:47 } +2024-07-25 19:00:42,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1308/ 1625], loss: 0.997, per_step_time: 1471ms, lr: 2.4129231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:42,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.43713 samples/s/p 6:06:25 } +2024-07-25 19:00:45,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1310/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 2.4166153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:45,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.42893 
samples/s/p 6:06:55 } +2024-07-25 19:00:48,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1312/ 1625], loss: 1.032, per_step_time: 1470ms, lr: 2.4203075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:48,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.44184 samples/s/p 6:06:00 } +2024-07-25 19:00:51,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1314/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 2.4239998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:51,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.44217 samples/s/p 6:05:55 } +2024-07-25 19:00:54,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1316/ 1625], loss: 1.249, per_step_time: 1471ms, lr: 2.4276922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:54,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.43497 samples/s/p 6:06:22 } +2024-07-25 19:00:57,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1318/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 2.4313846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:57,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.43378 samples/s/p 6:06:23 } +2024-07-25 19:01:00,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1320/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 2.4350767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:00,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.43473 samples/s/p 6:06:17 } +2024-07-25 19:01:03,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1322/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 2.4387691e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 19:01:03,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.43379 samples/s/p 6:06:18 } +2024-07-25 19:01:06,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1324/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 2.4424615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:06,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.42957 samples/s/p 6:06:32 } +2024-07-25 19:01:09,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1326/ 1625], loss: 1.435, per_step_time: 1472ms, lr: 2.4461538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:09,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43235 samples/s/p 6:06:17 } +2024-07-25 19:01:12,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1328/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 2.449846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:12,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43511 samples/s/p 6:06:03 } +2024-07-25 19:01:15,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1330/ 1625], loss: 1.146, per_step_time: 1470ms, lr: 2.4535382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:15,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.44175 samples/s/p 6:05:34 } +2024-07-25 19:01:18,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1332/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.4572306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:18,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43740 samples/s/p 6:05:48 } +2024-07-25 19:01:21,204 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1334/ 1625], loss: 1.334, per_step_time: 1472ms, lr: 2.460923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:21,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43186 samples/s/p 6:06:08 } +2024-07-25 19:01:24,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1336/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.4646153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:24,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43704 samples/s/p 6:05:44 } +2024-07-25 19:01:27,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1338/ 1625], loss: 1.316, per_step_time: 1470ms, lr: 2.4683077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:27,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.44060 samples/s/p 6:05:26 } +2024-07-25 19:01:30,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1340/ 1625], loss: 1.336, per_step_time: 1472ms, lr: 2.4719999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:30,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43445 samples/s/p 6:05:48 } +2024-07-25 19:01:33,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1342/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 2.4756922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:33,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43368 samples/s/p 6:05:49 } +2024-07-25 19:01:35,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1344/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 2.4793844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:35,957 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43235 samples/s/p 6:05:51 } +2024-07-25 19:01:38,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1346/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.4830768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:38,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43505 samples/s/p 6:05:37 } +2024-07-25 19:01:41,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1348/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 2.4867692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:41,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43404 samples/s/p 6:05:38 } +2024-07-25 19:01:44,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1350/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 2.4904613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:44,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43677 samples/s/p 6:05:24 } +2024-07-25 19:01:47,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1352/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.4941537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:47,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43362 samples/s/p 6:05:34 } +2024-07-25 19:01:50,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1354/ 1625], loss: 1.318, per_step_time: 1471ms, lr: 2.497846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:50,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43785 samples/s/p 6:05:14 } +2024-07-25 19:01:53,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 1356/ 1625], loss: 1.040, per_step_time: 1471ms, lr: 2.5015384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:53,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43507 samples/s/p 6:05:22 } +2024-07-25 19:01:56,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1358/ 1625], loss: 1.326, per_step_time: 1472ms, lr: 2.5052308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:56,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43440 samples/s/p 6:05:22 } +2024-07-25 19:01:59,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1360/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 2.508923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:59,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43340 samples/s/p 6:05:23 } +2024-07-25 19:02:02,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1362/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.5126152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:02,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43193 samples/s/p 6:05:26 } +2024-07-25 19:02:05,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1364/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.5163075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:05,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43757 samples/s/p 6:05:00 } +2024-07-25 19:02:08,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1366/ 1625], loss: 1.220, per_step_time: 1474ms, lr: 2.5199999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:08,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 
5.42650 samples/s/p 6:05:42 } +2024-07-25 19:02:11,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1368/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.5236923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:11,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43476 samples/s/p 6:05:06 } +2024-07-25 19:02:14,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1370/ 1625], loss: 1.032, per_step_time: 1471ms, lr: 2.5273845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:14,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43744 samples/s/p 6:04:52 } +2024-07-25 19:02:17,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1372/ 1625], loss: 1.337, per_step_time: 1470ms, lr: 2.5310768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:17,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43866 samples/s/p 6:04:44 } +2024-07-25 19:02:20,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1374/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 2.5347692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:20,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.43301 samples/s/p 6:05:04 } +2024-07-25 19:02:23,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1376/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.5384616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:23,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.43794 samples/s/p 6:04:41 } +2024-07-25 19:02:26,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1378/ 1625], loss: 1.107, per_step_time: 1473ms, lr: 2.5421536e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:26,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.42836 samples/s/p 6:05:17 } +2024-07-25 19:02:29,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1380/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.545846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:29,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.43527 samples/s/p 6:04:46 } +2024-07-25 19:02:32,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1382/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 2.5495383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:32,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.43501 samples/s/p 6:04:44 } +2024-07-25 19:02:34,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1384/ 1625], loss: 1.138, per_step_time: 1473ms, lr: 2.5532307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:34,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.42810 samples/s/p 6:05:09 } +2024-07-25 19:02:37,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1386/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 2.556923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:37,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.42895 samples/s/p 6:05:03 } +2024-07-25 19:02:40,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1388/ 1625], loss: 1.102, per_step_time: 1474ms, lr: 2.5606152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:40,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.42554 samples/s/p 6:05:14 } +2024-07-25 19:02:43,843 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1390/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 2.5643076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:43,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43743 samples/s/p 6:04:23 } +2024-07-25 19:02:46,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1392/ 1625], loss: 1.372, per_step_time: 1471ms, lr: 2.568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:46,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43508 samples/s/p 6:04:29 } +2024-07-25 19:02:49,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1394/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 2.5716923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:49,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43682 samples/s/p 6:04:19 } +2024-07-25 19:02:52,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1396/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 2.5753845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:52,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43781 samples/s/p 6:04:12 } +2024-07-25 19:02:55,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1398/ 1625], loss: 1.091, per_step_time: 1470ms, lr: 2.5790767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:55,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.44085 samples/s/p 6:03:57 } +2024-07-25 19:02:58,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1400/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.582769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:58,592 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43622 samples/s/p 6:04:13 } +2024-07-25 19:02:58,592 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-25 19:03:35,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1402/ 1625], loss: 1.293, per_step_time: 3240ms, lr: 2.5864614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:35,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 2.46910 samples/s/p 13:21:48 } +2024-07-25 19:03:38,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1404/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.5901538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:38,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43329 samples/s/p 6:04:19 } +2024-07-25 19:03:41,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1406/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 2.5938461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:41,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43517 samples/s/p 6:04:08 } +2024-07-25 19:03:44,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1408/ 1625], loss: 1.193, per_step_time: 1470ms, lr: 2.5975383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:44,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43894 samples/s/p 6:03:50 } +2024-07-25 19:03:47,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1410/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 2.6012307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:47,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43790 samples/s/p 
6:03:51 } +2024-07-25 19:03:50,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1412/ 1625], loss: 1.320, per_step_time: 1471ms, lr: 2.6049229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:50,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43511 samples/s/p 6:04:00 } +2024-07-25 19:03:53,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1414/ 1625], loss: 1.199, per_step_time: 1473ms, lr: 2.6086153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:53,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.42992 samples/s/p 6:04:18 } +2024-07-25 19:03:56,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1416/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 2.6123076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:56,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43925 samples/s/p 6:03:37 } +2024-07-25 19:03:59,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1418/ 1625], loss: 1.287, per_step_time: 1473ms, lr: 2.6159998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:59,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43056 samples/s/p 6:04:09 } +2024-07-25 19:04:01,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1420/ 1625], loss: 1.193, per_step_time: 1473ms, lr: 2.6196922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:01,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.42944 samples/s/p 6:04:11 } +2024-07-25 19:04:04,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1422/ 1625], loss: 1.294, per_step_time: 1472ms, lr: 2.6233845e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:04:04,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.43428 samples/s/p 6:03:48 } +2024-07-25 19:04:07,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1424/ 1625], loss: 1.296, per_step_time: 1472ms, lr: 2.6270769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:07,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.43229 samples/s/p 6:03:53 } +2024-07-25 19:04:10,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1426/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 2.6307693e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:10,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.42989 samples/s/p 6:04:00 } +2024-07-25 19:04:13,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1428/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 2.6344613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:13,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.43788 samples/s/p 6:03:25 } +2024-07-25 19:04:16,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1430/ 1625], loss: 1.287, per_step_time: 1469ms, lr: 2.6381536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:16,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.44247 samples/s/p 6:03:04 } +2024-07-25 19:04:19,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1432/ 1625], loss: 1.201, per_step_time: 1470ms, lr: 2.641846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:19,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.44118 samples/s/p 6:03:06 } +2024-07-25 19:04:22,639 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1434/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.6455384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:22,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.43139 samples/s/p 6:03:42 } +2024-07-25 19:04:25,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1436/ 1625], loss: 1.027, per_step_time: 1470ms, lr: 2.6492307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:25,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.43899 samples/s/p 6:03:09 } +2024-07-25 19:04:28,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1438/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 2.652923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:28,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.44025 samples/s/p 6:03:01 } +2024-07-25 19:04:31,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1440/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 2.6566153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:31,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43455 samples/s/p 6:03:21 } +2024-07-25 19:04:34,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1442/ 1625], loss: 1.485, per_step_time: 1471ms, lr: 2.6603077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:34,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43646 samples/s/p 6:03:10 } +2024-07-25 19:04:37,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1444/ 1625], loss: 1.317, per_step_time: 1472ms, lr: 2.664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:37,390 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43158 samples/s/p 6:03:27 } +2024-07-25 19:04:40,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1446/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 2.6676922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:40,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43227 samples/s/p 6:03:21 } +2024-07-25 19:04:43,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1448/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.6713844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:43,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43180 samples/s/p 6:03:20 } +2024-07-25 19:04:46,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1450/ 1625], loss: 1.250, per_step_time: 1471ms, lr: 2.6750768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:46,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43809 samples/s/p 6:02:52 } +2024-07-25 19:04:49,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1452/ 1625], loss: 1.091, per_step_time: 1473ms, lr: 2.6787691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:49,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.42970 samples/s/p 6:03:23 } +2024-07-25 19:04:52,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1454/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 2.6824615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:52,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43388 samples/s/p 6:03:03 } +2024-07-25 19:04:55,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 1456/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 2.6861537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:55,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43176 samples/s/p 6:03:08 } +2024-07-25 19:04:58,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1458/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 2.689846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:58,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43058 samples/s/p 6:03:10 } +2024-07-25 19:05:01,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1460/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.6935384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:01,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43716 samples/s/p 6:02:41 } +2024-07-25 19:05:03,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1462/ 1625], loss: 1.251, per_step_time: 1470ms, lr: 2.6972306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:03,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.44181 samples/s/p 6:02:19 } +2024-07-25 19:05:06,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1464/ 1625], loss: 1.139, per_step_time: 1470ms, lr: 2.700923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:06,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.44091 samples/s/p 6:02:20 } +2024-07-25 19:05:09,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1466/ 1625], loss: 1.238, per_step_time: 1470ms, lr: 2.7046151e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:09,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 
5.43920 samples/s/p 6:02:24 } +2024-07-25 19:05:12,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1468/ 1625], loss: 1.059, per_step_time: 1472ms, lr: 2.7083075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:12,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43165 samples/s/p 6:02:51 } +2024-07-25 19:05:15,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1470/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 2.7119999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:15,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43526 samples/s/p 6:02:34 } +2024-07-25 19:05:18,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1472/ 1625], loss: 1.116, per_step_time: 1473ms, lr: 2.7156922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:18,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.43039 samples/s/p 6:02:50 } +2024-07-25 19:05:21,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1474/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 2.7193846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:21,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.43157 samples/s/p 6:02:43 } +2024-07-25 19:05:24,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1476/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 2.7230768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:24,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.43673 samples/s/p 6:02:19 } +2024-07-25 19:05:27,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1478/ 1625], loss: 1.244, per_step_time: 1474ms, lr: 2.7267692e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:27,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.42494 samples/s/p 6:03:03 } +2024-07-25 19:05:30,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1480/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 2.7304613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:30,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.43457 samples/s/p 6:02:22 } +2024-07-25 19:05:33,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1482/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 2.7341537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:33,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.43455 samples/s/p 6:02:19 } +2024-07-25 19:05:36,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1484/ 1625], loss: 1.093, per_step_time: 1473ms, lr: 2.737846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:36,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.42876 samples/s/p 6:02:39 } +2024-07-25 19:05:39,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1486/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 2.7415383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:39,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.42870 samples/s/p 6:02:36 } +2024-07-25 19:05:42,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1488/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 2.7452306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:42,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43306 samples/s/p 6:02:16 } +2024-07-25 19:05:45,277 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1490/ 1625], loss: 1.343, per_step_time: 1471ms, lr: 2.748923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:45,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43586 samples/s/p 6:02:02 } +2024-07-25 19:05:48,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1492/ 1625], loss: 1.239, per_step_time: 1472ms, lr: 2.7526154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:48,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43281 samples/s/p 6:02:11 } +2024-07-25 19:05:51,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1494/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.7563077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:51,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43507 samples/s/p 6:01:59 } +2024-07-25 19:05:54,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1496/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 2.7599997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:54,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43385 samples/s/p 6:02:01 } +2024-07-25 19:05:57,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1498/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.7636921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:57,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43244 samples/s/p 6:02:04 } +2024-07-25 19:06:00,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1500/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 2.7673845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:00,036 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43431 samples/s/p 6:01:53 } +2024-07-25 19:06:02,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1502/ 1625], loss: 1.313, per_step_time: 1472ms, lr: 2.7710768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:02,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43374 samples/s/p 6:01:53 } +2024-07-25 19:06:05,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1504/ 1625], loss: 1.168, per_step_time: 1474ms, lr: 2.7747692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:05,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.42615 samples/s/p 6:02:20 } +2024-07-25 19:06:08,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1506/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 2.7784614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:08,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43747 samples/s/p 6:01:32 } +2024-07-25 19:06:11,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1508/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 2.7821538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:11,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43390 samples/s/p 6:01:43 } +2024-07-25 19:06:14,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1510/ 1625], loss: 1.420, per_step_time: 1472ms, lr: 2.7858461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:14,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43143 samples/s/p 6:01:50 } +2024-07-25 19:06:17,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 1512/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.7895383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:17,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43353 samples/s/p 6:01:39 } +2024-07-25 19:06:20,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1514/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.7932307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:20,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43256 samples/s/p 6:01:40 } +2024-07-25 19:06:23,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1516/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 2.7969229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:23,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.42814 samples/s/p 6:01:54 } +2024-07-25 19:06:26,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1518/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.8006152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:26,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43991 samples/s/p 6:01:05 } +2024-07-25 19:06:29,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1520/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.8043076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:29,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43392 samples/s/p 6:01:26 } +2024-07-25 19:06:32,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1522/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 2.808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:32,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 
5.43285 samples/s/p 6:01:27 } +2024-07-25 19:06:35,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1524/ 1625], loss: 1.341, per_step_time: 1472ms, lr: 2.8116921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:35,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43385 samples/s/p 6:01:20 } +2024-07-25 19:06:38,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1526/ 1625], loss: 1.165, per_step_time: 1474ms, lr: 2.8153845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:38,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.42727 samples/s/p 6:01:43 } +2024-07-25 19:06:41,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1528/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 2.8190769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:41,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43367 samples/s/p 6:01:15 } +2024-07-25 19:06:44,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1530/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.822769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:44,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43814 samples/s/p 6:00:54 } +2024-07-25 19:06:47,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1532/ 1625], loss: 1.023, per_step_time: 1473ms, lr: 2.8264614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:47,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.42965 samples/s/p 6:01:25 } +2024-07-25 19:06:50,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1534/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.8301536e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:50,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43559 samples/s/p 6:00:58 } +2024-07-25 19:06:53,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1536/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 2.833846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:53,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43896 samples/s/p 6:00:42 } +2024-07-25 19:06:56,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1538/ 1625], loss: 1.208, per_step_time: 1470ms, lr: 2.8375383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:56,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.44047 samples/s/p 6:00:33 } +2024-07-25 19:06:59,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1540/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.8412307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:59,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43384 samples/s/p 6:00:56 } +2024-07-25 19:07:02,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1542/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.844923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:02,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43274 samples/s/p 6:00:58 } +2024-07-25 19:07:04,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1544/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.8486153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:04,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43165 samples/s/p 6:00:59 } +2024-07-25 19:07:07,931 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1546/ 1625], loss: 0.967, per_step_time: 1474ms, lr: 2.8523074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:07,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.42375 samples/s/p 6:01:28 } +2024-07-25 19:07:10,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1548/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 2.8559998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:10,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43180 samples/s/p 6:00:53 } +2024-07-25 19:07:13,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1550/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 2.8596922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:13,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43094 samples/s/p 6:00:53 } +2024-07-25 19:07:16,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1552/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 2.8633845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:16,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43707 samples/s/p 6:00:26 } +2024-07-25 19:07:19,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1554/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 2.8670767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:19,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43167 samples/s/p 6:00:44 } +2024-07-25 19:07:22,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1556/ 1625], loss: 1.209, per_step_time: 1473ms, lr: 2.8707691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:22,693 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.42748 samples/s/p 6:00:58 } +2024-07-25 19:07:25,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1558/ 1625], loss: 1.307, per_step_time: 1472ms, lr: 2.8744615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:25,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43340 samples/s/p 6:00:32 } +2024-07-25 19:07:28,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1560/ 1625], loss: 1.240, per_step_time: 1470ms, lr: 2.8781538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:28,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43928 samples/s/p 6:00:05 } +2024-07-25 19:07:31,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1562/ 1625], loss: 1.203, per_step_time: 1473ms, lr: 2.8818462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:31,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43101 samples/s/p 6:00:35 } +2024-07-25 19:07:34,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1564/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 2.8855382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:34,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43620 samples/s/p 6:00:12 } +2024-07-25 19:07:37,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1566/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 2.8892306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:37,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.42793 samples/s/p 6:00:42 } +2024-07-25 19:07:40,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 1568/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 2.892923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:40,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43126 samples/s/p 6:00:25 } +2024-07-25 19:07:43,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1570/ 1625], loss: 1.160, per_step_time: 1474ms, lr: 2.8966153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:43,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.42573 samples/s/p 6:00:44 } +2024-07-25 19:07:46,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1572/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 2.9003077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:46,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43111 samples/s/p 6:00:20 } +2024-07-25 19:07:49,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1574/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 2.9039998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:49,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43720 samples/s/p 5:59:53 } +2024-07-25 19:07:52,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1576/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.9076922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:52,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43304 samples/s/p 6:00:07 } +2024-07-25 19:07:55,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1578/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 2.9113846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:55,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 
5.43339 samples/s/p 6:00:02 } +2024-07-25 19:07:58,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1580/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 2.9150768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:58,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43901 samples/s/p 5:59:37 } +2024-07-25 19:08:01,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1582/ 1625], loss: 1.286, per_step_time: 1471ms, lr: 2.9187691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:01,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43761 samples/s/p 5:59:40 } +2024-07-25 19:08:04,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1584/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.9224613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:04,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43561 samples/s/p 5:59:45 } +2024-07-25 19:08:06,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1586/ 1625], loss: 1.325, per_step_time: 1471ms, lr: 2.9261537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:06,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43752 samples/s/p 5:59:34 } +2024-07-25 19:08:09,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1588/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 2.929846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:09,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43670 samples/s/p 5:59:34 } +2024-07-25 19:08:12,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1590/ 1625], loss: 1.431, per_step_time: 1471ms, lr: 2.9335384e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:12,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43627 samples/s/p 5:59:33 } +2024-07-25 19:08:15,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1592/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 2.9372306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:15,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43260 samples/s/p 5:59:45 } +2024-07-25 19:08:18,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1594/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.940923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:18,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43576 samples/s/p 5:59:29 } +2024-07-25 19:08:21,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1596/ 1625], loss: 1.151, per_step_time: 1475ms, lr: 2.9446152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:21,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.42031 samples/s/p 6:00:28 } +2024-07-25 19:08:24,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1598/ 1625], loss: 1.191, per_step_time: 1470ms, lr: 2.9483075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:24,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.44072 samples/s/p 5:59:04 } +2024-07-25 19:08:27,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1600/ 1625], loss: 1.003, per_step_time: 1471ms, lr: 2.9519999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:27,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43785 samples/s/p 5:59:12 } +2024-07-25 19:08:30,582 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1602/ 1625], loss: 1.086, per_step_time: 1473ms, lr: 2.955692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:30,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43102 samples/s/p 5:59:36 } +2024-07-25 19:08:33,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1604/ 1625], loss: 1.128, per_step_time: 1474ms, lr: 2.9593844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:33,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.42531 samples/s/p 5:59:56 } +2024-07-25 19:08:36,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1606/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 2.9630768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:36,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43471 samples/s/p 5:59:16 } +2024-07-25 19:08:39,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1608/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 2.9667692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:39,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43322 samples/s/p 5:59:19 } +2024-07-25 19:08:42,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1610/ 1625], loss: 1.243, per_step_time: 1474ms, lr: 2.9704615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:42,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.42402 samples/s/p 5:59:52 } +2024-07-25 19:08:45,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1612/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.9741537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:45,349 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43780 samples/s/p 5:58:55 } +2024-07-25 19:08:48,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1614/ 1625], loss: 1.043, per_step_time: 1472ms, lr: 2.9778459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:48,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43421 samples/s/p 5:59:06 } +2024-07-25 19:08:51,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1616/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 2.9815383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:51,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43157 samples/s/p 5:59:13 } +2024-07-25 19:08:54,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1618/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 2.9852306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:54,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.44125 samples/s/p 5:58:32 } +2024-07-25 19:08:57,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1620/ 1625], loss: 1.004, per_step_time: 1472ms, lr: 2.988923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:57,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.43113 samples/s/p 5:59:09 } +2024-07-25 19:09:00,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1622/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 2.9926152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:00,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.43730 samples/s/p 5:58:42 } +2024-07-25 19:09:03,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 1624/ 1625], loss: 1.311, per_step_time: 1473ms, lr: 2.9963076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:03,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.43085 samples/s/p 5:59:05 } +2024-07-25 19:09:06,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1/ 1625], loss: 1.243, per_step_time: 1477ms, lr: 3e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:06,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.41469 samples/s/p 6:00:06 } +2024-07-25 19:09:08,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 3/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 2.9999997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:08,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.43797 samples/s/p 5:58:30 } +2024-07-25 19:09:11,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 5/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 2.9999994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:11,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.43434 samples/s/p 5:58:42 } +2024-07-25 19:09:14,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 7/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.9999987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:14,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.43334 samples/s/p 5:58:43 } +2024-07-25 19:09:17,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 9/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 2.999998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:17,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43540 
samples/s/p 5:58:32 } +2024-07-25 19:09:20,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 11/ 1625], loss: 1.291, per_step_time: 1473ms, lr: 2.9999967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:20,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43063 samples/s/p 5:58:48 } +2024-07-25 19:09:23,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 13/ 1625], loss: 1.141, per_step_time: 1474ms, lr: 2.9999952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:23,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.42698 samples/s/p 5:58:59 } +2024-07-25 19:09:26,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 15/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.9999934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:26,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43538 samples/s/p 5:58:23 } +2024-07-25 19:09:29,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 17/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.9999912e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:29,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43476 samples/s/p 5:58:23 } +2024-07-25 19:09:32,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 19/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 2.999989e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:32,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43533 samples/s/p 5:58:17 } +2024-07-25 19:09:35,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 21/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 2.9999865e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 19:09:35,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43416 samples/s/p 5:58:19 } +2024-07-25 19:09:38,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 23/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 2.9999837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:38,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43994 samples/s/p 5:57:53 } +2024-07-25 19:09:41,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 25/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.9999806e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:41,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43807 samples/s/p 5:57:58 } +2024-07-25 19:09:44,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 27/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.9999774e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:44,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43655 samples/s/p 5:58:01 } +2024-07-25 19:09:47,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 29/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 2.9999737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:47,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43724 samples/s/p 5:57:55 } +2024-07-25 19:09:50,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 31/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 2.99997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:50,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43831 samples/s/p 5:57:48 } +2024-07-25 19:09:53,234 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 33/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.9999657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:53,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43483 samples/s/p 5:57:59 } +2024-07-25 19:09:56,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 35/ 1625], loss: 1.368, per_step_time: 1470ms, lr: 2.9999612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:56,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43860 samples/s/p 5:57:41 } +2024-07-25 19:09:59,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 37/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 2.9999566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:59,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43857 samples/s/p 5:57:38 } +2024-07-25 19:10:02,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 39/ 1625], loss: 1.130, per_step_time: 1470ms, lr: 2.9999517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:02,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43995 samples/s/p 5:57:30 } +2024-07-25 19:10:05,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 41/ 1625], loss: 1.074, per_step_time: 1470ms, lr: 2.9999464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:05,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.43894 samples/s/p 5:57:31 } +2024-07-25 19:10:07,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 43/ 1625], loss: 1.150, per_step_time: 1473ms, lr: 2.9999408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:07,983 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.43083 samples/s/p 5:58:00 } +2024-07-25 19:10:10,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 45/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 2.9999354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:10,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.44000 samples/s/p 5:57:21 } +2024-07-25 19:10:13,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 47/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.999929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:13,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.43531 samples/s/p 5:57:36 } +2024-07-25 19:10:16,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 49/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.9999228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:16,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.43662 samples/s/p 5:57:28 } +2024-07-25 19:10:19,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 51/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.9999163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:19,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.43539 samples/s/p 5:57:30 } +2024-07-25 19:10:22,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 53/ 1625], loss: 1.074, per_step_time: 1474ms, lr: 2.9999095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:22,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.42392 samples/s/p 5:58:12 } +2024-07-25 19:10:25,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], 
step:[ 55/ 1625], loss: 1.008, per_step_time: 1469ms, lr: 2.9999024e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:25,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.44369 samples/s/p 5:56:51 } +2024-07-25 19:10:28,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 57/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 2.999895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:28,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43166 samples/s/p 5:57:36 } +2024-07-25 19:10:31,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 59/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.9998875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:31,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43836 samples/s/p 5:57:07 } +2024-07-25 19:10:34,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 61/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 2.9998797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:34,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.42960 samples/s/p 5:57:38 } +2024-07-25 19:10:37,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 63/ 1625], loss: 1.290, per_step_time: 1472ms, lr: 2.9998713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:37,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43250 samples/s/p 5:57:24 } +2024-07-25 19:10:40,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 65/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 2.999863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:40,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 
5.42848 samples/s/p 5:57:37 } +2024-07-25 19:10:43,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 67/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 2.9998542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:43,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43120 samples/s/p 5:57:23 } +2024-07-25 19:10:46,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 69/ 1625], loss: 1.280, per_step_time: 1473ms, lr: 2.9998453e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:46,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.42896 samples/s/p 5:57:29 } +2024-07-25 19:10:49,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 71/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.999836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:49,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43660 samples/s/p 5:56:56 } +2024-07-25 19:10:52,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 73/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.9998266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:52,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43463 samples/s/p 5:57:01 } +2024-07-25 19:10:55,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 75/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 2.9998168e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:55,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43968 samples/s/p 5:56:38 } +2024-07-25 19:10:58,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 77/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.9998067e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 19:10:58,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43616 samples/s/p 5:56:49 } +2024-07-25 19:11:01,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 79/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 2.9997964e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:01,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43678 samples/s/p 5:56:43 } +2024-07-25 19:11:04,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 81/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.9997858e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:04,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43572 samples/s/p 5:56:45 } +2024-07-25 19:11:07,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 83/ 1625], loss: 1.178, per_step_time: 1474ms, lr: 2.999775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:07,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.42668 samples/s/p 5:57:17 } +2024-07-25 19:11:09,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 85/ 1625], loss: 1.437, per_step_time: 1471ms, lr: 2.9997638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:09,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43545 samples/s/p 5:56:40 } +2024-07-25 19:11:12,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 87/ 1625], loss: 1.165, per_step_time: 1474ms, lr: 2.9997524e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:12,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.42714 samples/s/p 5:57:10 } +2024-07-25 19:11:15,871 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 89/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.9997409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:15,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43626 samples/s/p 5:56:31 } +2024-07-25 19:11:18,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 91/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 2.9997289e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:18,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43464 samples/s/p 5:56:34 } +2024-07-25 19:11:21,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 93/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.9997167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:21,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43227 samples/s/p 5:56:40 } +2024-07-25 19:11:24,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 95/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 2.9997043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:24,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43218 samples/s/p 5:56:38 } +2024-07-25 19:11:27,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 97/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 2.9996916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:27,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43329 samples/s/p 5:56:31 } +2024-07-25 19:11:30,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 99/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.9996787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:30,632 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43298 samples/s/p 5:56:29 } +2024-07-25 19:11:33,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 101/ 1625], loss: 1.156, per_step_time: 1469ms, lr: 2.9996652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:33,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.44310 samples/s/p 5:55:46 } +2024-07-25 19:11:36,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 103/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 2.9996518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:36,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43191 samples/s/p 5:56:27 } +2024-07-25 19:11:39,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 105/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 2.9996381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:39,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43734 samples/s/p 5:56:03 } +2024-07-25 19:11:42,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 107/ 1625], loss: 1.100, per_step_time: 1474ms, lr: 2.9996241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:42,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.42392 samples/s/p 5:56:53 } +2024-07-25 19:11:45,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 109/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 2.9996096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:45,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43761 samples/s/p 5:55:56 } +2024-07-25 19:11:48,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 
10], step:[ 111/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 2.999595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:48,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43529 samples/s/p 5:56:02 } +2024-07-25 19:11:51,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 113/ 1625], loss: 1.277, per_step_time: 1473ms, lr: 2.9995803e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:51,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43073 samples/s/p 5:56:17 } +2024-07-25 19:11:54,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 115/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 2.9995652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:54,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43644 samples/s/p 5:55:52 } +2024-07-25 19:11:57,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 117/ 1625], loss: 1.277, per_step_time: 1472ms, lr: 2.9995497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:57,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43292 samples/s/p 5:56:03 } +2024-07-25 19:12:00,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 119/ 1625], loss: 1.249, per_step_time: 1473ms, lr: 2.9995343e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:00,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43078 samples/s/p 5:56:08 } +2024-07-25 19:12:03,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 121/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 2.9995184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:03,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% 
|█████ | 5.42900 samples/s/p 5:56:12 } +2024-07-25 19:12:06,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 123/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 2.999502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:06,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43104 samples/s/p 5:56:01 } +2024-07-25 19:12:09,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 125/ 1625], loss: 0.999, per_step_time: 1470ms, lr: 2.9994857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:09,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.44162 samples/s/p 5:55:17 } +2024-07-25 19:12:11,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 127/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 2.9994688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:11,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43377 samples/s/p 5:55:45 } +2024-07-25 19:12:14,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 129/ 1625], loss: 1.293, per_step_time: 1473ms, lr: 2.999452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:14,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.42921 samples/s/p 5:56:00 } +2024-07-25 19:12:17,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 131/ 1625], loss: 1.050, per_step_time: 1470ms, lr: 2.9994346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:17,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43861 samples/s/p 5:55:20 } +2024-07-25 19:12:20,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 133/ 1625], loss: 1.331, per_step_time: 1470ms, lr: 
2.9994171e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:20,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43923 samples/s/p 5:55:14 } +2024-07-25 19:12:23,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 135/ 1625], loss: 1.199, per_step_time: 1473ms, lr: 2.9993993e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:23,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.42871 samples/s/p 5:55:53 } +2024-07-25 19:12:26,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 137/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 2.9993813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:26,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43233 samples/s/p 5:55:35 } +2024-07-25 19:12:29,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 139/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 2.9993627e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:29,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43233 samples/s/p 5:55:33 } +2024-07-25 19:12:32,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 141/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 2.9993444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:32,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43394 samples/s/p 5:55:23 } +2024-07-25 19:12:35,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 143/ 1625], loss: 1.100, per_step_time: 1473ms, lr: 2.9993254e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:35,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.42941 samples/s/p 5:55:38 } +2024-07-25 19:12:38,524 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 145/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 2.9993065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:38,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43130 samples/s/p 5:55:28 } +2024-07-25 19:12:41,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 147/ 1625], loss: 1.284, per_step_time: 1469ms, lr: 2.9992867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:41,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.44376 samples/s/p 5:54:36 } +2024-07-25 19:12:44,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 149/ 1625], loss: 1.372, per_step_time: 1473ms, lr: 2.9992674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:44,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.42805 samples/s/p 5:55:35 } +2024-07-25 19:12:47,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 151/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 2.9992474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:47,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43572 samples/s/p 5:55:02 } +2024-07-25 19:12:50,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 153/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 2.9992269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:50,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43205 samples/s/p 5:55:13 } +2024-07-25 19:12:53,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 155/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 2.9992065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:12:53,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43430 samples/s/p 5:55:01 } +2024-07-25 19:12:56,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 157/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 2.9991857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:56,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43226 samples/s/p 5:55:06 } +2024-07-25 19:12:59,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 159/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 2.9991646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:59,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43389 samples/s/p 5:54:57 } +2024-07-25 19:13:02,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 161/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.9991435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:02,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43629 samples/s/p 5:54:45 } +2024-07-25 19:13:05,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 163/ 1625], loss: 1.258, per_step_time: 1471ms, lr: 2.9991223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:05,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43556 samples/s/p 5:54:45 } +2024-07-25 19:13:08,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 165/ 1625], loss: 1.290, per_step_time: 1472ms, lr: 2.9991003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:08,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43214 samples/s/p 5:54:55 } +2024-07-25 19:13:10,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 2/ 10], step:[ 167/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 2.999078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:10,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43153 samples/s/p 5:54:54 } +2024-07-25 19:13:13,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 169/ 1625], loss: 1.446, per_step_time: 1471ms, lr: 2.9990559e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:13,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43832 samples/s/p 5:54:25 } +2024-07-25 19:13:16,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 171/ 1625], loss: 1.354, per_step_time: 1472ms, lr: 2.9990333e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:16,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.43213 samples/s/p 5:54:46 } +2024-07-25 19:13:19,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 173/ 1625], loss: 1.360, per_step_time: 1473ms, lr: 2.9990104e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:19,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.42999 samples/s/p 5:54:52 } +2024-07-25 19:13:22,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 175/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.9989871e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:22,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.43478 samples/s/p 5:54:30 } +2024-07-25 19:13:25,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 177/ 1625], loss: 0.964, per_step_time: 1473ms, lr: 2.9989636e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:25,754 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 11.1% |█████ | 5.42772 samples/s/p 5:54:55 } +2024-07-25 19:13:28,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 179/ 1625], loss: 1.317, per_step_time: 1473ms, lr: 2.99894e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:28,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.42896 samples/s/p 5:54:47 } +2024-07-25 19:13:31,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 181/ 1625], loss: 1.043, per_step_time: 1471ms, lr: 2.9989162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:31,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.43844 samples/s/p 5:54:07 } +2024-07-25 19:13:34,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 183/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 2.998892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:34,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.44080 samples/s/p 5:53:55 } +2024-07-25 19:13:37,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 185/ 1625], loss: 1.213, per_step_time: 1473ms, lr: 2.9988674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:37,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.43087 samples/s/p 5:54:31 } +2024-07-25 19:13:40,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 187/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.9988425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:40,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43618 samples/s/p 5:54:07 } +2024-07-25 19:13:43,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 189/ 1625], loss: 1.393, per_step_time: 1472ms, 
lr: 2.9988176e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:43,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43179 samples/s/p 5:54:21 } +2024-07-25 19:13:46,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 191/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.9987923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:46,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43133 samples/s/p 5:54:20 } +2024-07-25 19:13:49,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 193/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 2.9987668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:49,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43464 samples/s/p 5:54:04 } +2024-07-25 19:13:52,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 195/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.9987412e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:52,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43124 samples/s/p 5:54:14 } +2024-07-25 19:13:55,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 197/ 1625], loss: 1.166, per_step_time: 1469ms, lr: 2.998715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:55,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.44250 samples/s/p 5:53:27 } +2024-07-25 19:13:58,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 199/ 1625], loss: 1.143, per_step_time: 1473ms, lr: 2.9986886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:58,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43010 samples/s/p 5:54:13 } +2024-07-25 
19:14:01,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 201/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 2.9986619e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:01,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43667 samples/s/p 5:53:44 } +2024-07-25 19:14:04,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 203/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.9986351e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:04,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43363 samples/s/p 5:53:53 } +2024-07-25 19:14:07,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 205/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 2.9986079e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:07,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43774 samples/s/p 5:53:34 } +2024-07-25 19:14:10,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 207/ 1625], loss: 1.261, per_step_time: 1474ms, lr: 2.9985804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:10,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.42704 samples/s/p 5:54:13 } +2024-07-25 19:14:12,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 209/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.9985527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:12,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43341 samples/s/p 5:53:45 } +2024-07-25 19:14:15,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 211/ 1625], loss: 1.136, per_step_time: 1474ms, lr: 2.9985247e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:14:15,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.42638 samples/s/p 5:54:10 } +2024-07-25 19:14:18,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 213/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 2.9984965e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:18,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43525 samples/s/p 5:53:32 } +2024-07-25 19:14:21,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 215/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 2.9984682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:21,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43301 samples/s/p 5:53:38 } +2024-07-25 19:14:24,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 217/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 2.9984394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:24,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43653 samples/s/p 5:53:21 } +2024-07-25 19:14:27,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 219/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.9984103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:27,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43274 samples/s/p 5:53:33 } +2024-07-25 19:14:30,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 221/ 1625], loss: 1.368, per_step_time: 1471ms, lr: 2.998381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:30,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43695 samples/s/p 5:53:14 } +2024-07-25 19:14:33,642 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 223/ 1625], loss: 1.312, per_step_time: 1472ms, lr: 2.9983512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:33,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43304 samples/s/p 5:53:26 } +2024-07-25 19:14:36,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 225/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 2.9983215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:36,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43409 samples/s/p 5:53:19 } +2024-07-25 19:14:39,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 227/ 1625], loss: 1.310, per_step_time: 1472ms, lr: 2.9982915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:39,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43252 samples/s/p 5:53:22 } +2024-07-25 19:14:42,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 229/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 2.9982612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:42,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43842 samples/s/p 5:52:56 } +2024-07-25 19:14:45,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 231/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 2.9982306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:45,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.42843 samples/s/p 5:53:32 } +2024-07-25 19:14:48,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 233/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 2.9981999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:14:48,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43351 samples/s/p 5:53:09 } +2024-07-25 19:14:51,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 235/ 1625], loss: 1.063, per_step_time: 1473ms, lr: 2.9981686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:51,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.42833 samples/s/p 5:53:27 } +2024-07-25 19:14:54,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 237/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 2.998137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:54,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.43677 samples/s/p 5:52:51 } +2024-07-25 19:14:57,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 239/ 1625], loss: 1.256, per_step_time: 1470ms, lr: 2.9981054e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:57,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.44085 samples/s/p 5:52:32 } +2024-07-25 19:15:00,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 241/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 2.9980733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:00,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.43790 samples/s/p 5:52:41 } +2024-07-25 19:15:03,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 243/ 1625], loss: 1.040, per_step_time: 1473ms, lr: 2.9980412e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:03,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.42767 samples/s/p 5:53:18 } +2024-07-25 19:15:06,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 2/ 10], step:[ 245/ 1625], loss: 1.279, per_step_time: 1474ms, lr: 2.9980087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:06,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.42728 samples/s/p 5:53:16 } +2024-07-25 19:15:09,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 247/ 1625], loss: 1.204, per_step_time: 1473ms, lr: 2.997976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:09,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.42790 samples/s/p 5:53:11 } +2024-07-25 19:15:12,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 249/ 1625], loss: 1.375, per_step_time: 1472ms, lr: 2.9979428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:12,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.43344 samples/s/p 5:52:46 } +2024-07-25 19:15:14,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 251/ 1625], loss: 1.068, per_step_time: 1472ms, lr: 2.9979094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:14,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.43273 samples/s/p 5:52:46 } +2024-07-25 19:15:17,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 253/ 1625], loss: 1.250, per_step_time: 1470ms, lr: 2.9978759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:17,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43977 samples/s/p 5:52:16 } +2024-07-25 19:15:20,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 255/ 1625], loss: 1.137, per_step_time: 1469ms, lr: 2.997842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:20,868 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 11.6% |█████ | 5.44232 samples/s/p 5:52:03 } +2024-07-25 19:15:23,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 257/ 1625], loss: 1.338, per_step_time: 1472ms, lr: 2.9978082e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:23,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43275 samples/s/p 5:52:37 } +2024-07-25 19:15:26,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 259/ 1625], loss: 0.979, per_step_time: 1471ms, lr: 2.9977735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:26,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43767 samples/s/p 5:52:15 } +2024-07-25 19:15:29,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 261/ 1625], loss: 1.060, per_step_time: 1470ms, lr: 2.997739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:29,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43881 samples/s/p 5:52:08 } +2024-07-25 19:15:32,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 263/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 2.997704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:32,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43917 samples/s/p 5:52:03 } +2024-07-25 19:15:35,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 265/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.9976689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:35,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43506 samples/s/p 5:52:16 } +2024-07-25 19:15:38,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 267/ 1625], loss: 1.371, per_step_time: 1471ms, 
lr: 2.9976336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:38,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43627 samples/s/p 5:52:09 } +2024-07-25 19:15:41,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 269/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 2.9975978e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:41,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43429 samples/s/p 5:52:13 } +2024-07-25 19:15:44,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 271/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 2.9975616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:44,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43910 samples/s/p 5:51:52 } +2024-07-25 19:15:47,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 273/ 1625], loss: 1.109, per_step_time: 1471ms, lr: 2.9975256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:47,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43614 samples/s/p 5:52:00 } +2024-07-25 19:15:50,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 275/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.997489e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:50,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43510 samples/s/p 5:52:01 } +2024-07-25 19:15:53,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 277/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 2.997452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:53,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43296 samples/s/p 5:52:07 } +2024-07-25 
19:15:56,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 279/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 2.9974155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:56,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43252 samples/s/p 5:52:06 } +2024-07-25 19:15:59,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 281/ 1625], loss: 1.244, per_step_time: 1471ms, lr: 2.9973779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:59,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43795 samples/s/p 5:51:42 } +2024-07-25 19:16:02,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 283/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 2.9973404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:02,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43659 samples/s/p 5:51:44 } +2024-07-25 19:16:05,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 285/ 1625], loss: 1.124, per_step_time: 1470ms, lr: 2.9973024e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:05,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.44049 samples/s/p 5:51:26 } +2024-07-25 19:16:08,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 287/ 1625], loss: 1.245, per_step_time: 1471ms, lr: 2.9972643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:08,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43515 samples/s/p 5:51:44 } +2024-07-25 19:16:11,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 289/ 1625], loss: 1.221, per_step_time: 1473ms, lr: 2.997226e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:16:11,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.42799 samples/s/p 5:52:08 } +2024-07-25 19:16:13,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 291/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.9971872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:13,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43153 samples/s/p 5:51:52 } +2024-07-25 19:16:16,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 293/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.9971485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:16,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43312 samples/s/p 5:51:43 } +2024-07-25 19:16:19,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 295/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 2.9971094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:19,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43183 samples/s/p 5:51:45 } +2024-07-25 19:16:22,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 297/ 1625], loss: 0.980, per_step_time: 1471ms, lr: 2.9970697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:22,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43828 samples/s/p 5:51:17 } +2024-07-25 19:16:25,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 299/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 2.9970299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:25,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43860 samples/s/p 5:51:13 } +2024-07-25 19:16:28,736 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 301/ 1625], loss: 1.029, per_step_time: 1473ms, lr: 2.9969902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:28,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.42983 samples/s/p 5:51:44 } +2024-07-25 19:16:31,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 303/ 1625], loss: 1.262, per_step_time: 1474ms, lr: 2.99695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:31,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.42679 samples/s/p 5:51:53 } +2024-07-25 19:16:34,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 305/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.9969093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:34,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.43579 samples/s/p 5:51:15 } +2024-07-25 19:16:37,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 307/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 2.9968685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:37,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.43935 samples/s/p 5:50:58 } +2024-07-25 19:16:40,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 309/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 2.9968276e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:40,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.43308 samples/s/p 5:51:19 } +2024-07-25 19:16:43,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 311/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 2.9967863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:16:43,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.43859 samples/s/p 5:50:55 } +2024-07-25 19:16:46,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 313/ 1625], loss: 1.109, per_step_time: 1473ms, lr: 2.9967445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:46,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.43094 samples/s/p 5:51:22 } +2024-07-25 19:16:49,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 315/ 1625], loss: 1.219, per_step_time: 1469ms, lr: 2.9967028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:49,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.44345 samples/s/p 5:50:30 } +2024-07-25 19:16:52,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 317/ 1625], loss: 1.065, per_step_time: 1473ms, lr: 2.9966604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:52,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.42827 samples/s/p 5:51:26 } +2024-07-25 19:16:55,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 319/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 2.9966182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:55,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.43446 samples/s/p 5:50:59 } +2024-07-25 19:16:58,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 321/ 1625], loss: 1.310, per_step_time: 1472ms, lr: 2.9965757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:58,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.43314 samples/s/p 5:51:01 } +2024-07-25 19:17:01,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 2/ 10], step:[ 323/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.9965326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:01,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.42989 samples/s/p 5:51:11 } +2024-07-25 19:17:04,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 325/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 2.9964896e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:04,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.44057 samples/s/p 5:50:27 } +2024-07-25 19:17:07,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 327/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.996446e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:07,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.42741 samples/s/p 5:51:15 } +2024-07-25 19:17:10,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 329/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.9964021e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:10,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.43743 samples/s/p 5:50:33 } +2024-07-25 19:17:13,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 331/ 1625], loss: 0.962, per_step_time: 1471ms, lr: 2.9963583e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:13,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.43490 samples/s/p 5:50:40 } +2024-07-25 19:17:15,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 333/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 2.996314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:15,957 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 12.0% |██████ | 5.43476 samples/s/p 5:50:37 } +2024-07-25 19:17:18,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 335/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 2.9962694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:18,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43451 samples/s/p 5:50:35 } +2024-07-25 19:17:21,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 337/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 2.9962248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:21,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43084 samples/s/p 5:50:47 } +2024-07-25 19:17:24,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 339/ 1625], loss: 1.010, per_step_time: 1470ms, lr: 2.9961797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:24,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43908 samples/s/p 5:50:12 } +2024-07-25 19:17:27,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 341/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 2.9961344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:27,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43969 samples/s/p 5:50:07 } +2024-07-25 19:17:30,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 343/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.9960887e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:30,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43352 samples/s/p 5:50:28 } +2024-07-25 19:17:33,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 345/ 1625], loss: 1.233, 
per_step_time: 1471ms, lr: 2.9960429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:33,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43750 samples/s/p 5:50:09 } +2024-07-25 19:17:36,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 347/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.9959969e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:36,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43270 samples/s/p 5:50:25 } +2024-07-25 19:17:39,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 349/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 2.9959503e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:39,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43398 samples/s/p 5:50:17 } +2024-07-25 19:17:42,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 351/ 1625], loss: 1.294, per_step_time: 1470ms, lr: 2.9959036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:42,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43887 samples/s/p 5:49:55 } +2024-07-25 19:17:45,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 353/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.995857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:45,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43228 samples/s/p 5:50:18 } +2024-07-25 19:17:48,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 355/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 2.9958097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:48,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43516 samples/s/p 
5:50:03 } +2024-07-25 19:17:51,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 357/ 1625], loss: 1.099, per_step_time: 1470ms, lr: 2.9957622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:51,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43940 samples/s/p 5:49:44 } +2024-07-25 19:17:54,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 359/ 1625], loss: 1.313, per_step_time: 1472ms, lr: 2.9957146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:54,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43142 samples/s/p 5:50:12 } +2024-07-25 19:17:57,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 361/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 2.9956665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:57,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43881 samples/s/p 5:49:41 } +2024-07-25 19:18:00,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 363/ 1625], loss: 1.339, per_step_time: 1471ms, lr: 2.9956182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:00,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43485 samples/s/p 5:49:53 } +2024-07-25 19:18:03,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 365/ 1625], loss: 1.378, per_step_time: 1472ms, lr: 2.9955698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:03,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43174 samples/s/p 5:50:02 } +2024-07-25 19:18:06,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 367/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.995521e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 19:18:06,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43666 samples/s/p 5:49:40 } +2024-07-25 19:18:09,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 369/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.995472e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:09,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43302 samples/s/p 5:49:51 } +2024-07-25 19:18:12,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 371/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 2.9954224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:12,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43317 samples/s/p 5:49:48 } +2024-07-25 19:18:14,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 373/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 2.9953728e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:14,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43244 samples/s/p 5:49:47 } +2024-07-25 19:18:17,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 375/ 1625], loss: 1.020, per_step_time: 1473ms, lr: 2.995323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:17,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43109 samples/s/p 5:49:50 } +2024-07-25 19:18:20,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 377/ 1625], loss: 1.340, per_step_time: 1472ms, lr: 2.9952727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:20,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43252 samples/s/p 5:49:41 } +2024-07-25 19:18:23,832 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 379/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 2.9952223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:23,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43197 samples/s/p 5:49:40 } +2024-07-25 19:18:26,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 381/ 1625], loss: 1.076, per_step_time: 1469ms, lr: 2.9951718e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:26,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.44341 samples/s/p 5:48:53 } +2024-07-25 19:18:29,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 383/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 2.995121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:29,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.43501 samples/s/p 5:49:23 } +2024-07-25 19:18:32,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 385/ 1625], loss: 1.209, per_step_time: 1473ms, lr: 2.9950697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:32,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.42869 samples/s/p 5:49:44 } +2024-07-25 19:18:35,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 387/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 2.9950183e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:35,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.43845 samples/s/p 5:49:04 } +2024-07-25 19:18:38,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 389/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 2.9949666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:18:38,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.43173 samples/s/p 5:49:27 } +2024-07-25 19:18:41,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 391/ 1625], loss: 0.983, per_step_time: 1472ms, lr: 2.9949146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:41,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.43157 samples/s/p 5:49:24 } +2024-07-25 19:18:44,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 393/ 1625], loss: 1.274, per_step_time: 1473ms, lr: 2.9948624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:44,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.42779 samples/s/p 5:49:36 } +2024-07-25 19:18:47,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 395/ 1625], loss: 1.141, per_step_time: 1469ms, lr: 2.9948098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:47,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.44232 samples/s/p 5:48:37 } +2024-07-25 19:18:50,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 397/ 1625], loss: 1.052, per_step_time: 1474ms, lr: 2.9947569e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:50,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.42736 samples/s/p 5:49:32 } +2024-07-25 19:18:53,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 399/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.9947041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:53,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43563 samples/s/p 5:48:57 } +2024-07-25 19:18:56,295 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 401/ 1625], loss: 1.027, per_step_time: 1471ms, lr: 2.9946505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:56,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43543 samples/s/p 5:48:55 } +2024-07-25 19:18:59,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 403/ 1625], loss: 1.221, per_step_time: 1470ms, lr: 2.994597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:59,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.44007 samples/s/p 5:48:34 } +2024-07-25 19:19:02,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 405/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.994543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:02,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.42753 samples/s/p 5:49:19 } +2024-07-25 19:19:05,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 407/ 1625], loss: 1.243, per_step_time: 1470ms, lr: 2.994489e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:05,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43880 samples/s/p 5:48:33 } +2024-07-25 19:19:08,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 409/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 2.9944347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:08,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43351 samples/s/p 5:48:50 } +2024-07-25 19:19:11,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 411/ 1625], loss: 1.018, per_step_time: 1470ms, lr: 2.9943802e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:11,048 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43932 samples/s/p 5:48:25 } +2024-07-25 19:19:14,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 413/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 2.9943252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:14,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43343 samples/s/p 5:48:45 } +2024-07-25 19:19:16,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 415/ 1625], loss: 1.167, per_step_time: 1470ms, lr: 2.9942697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:16,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.43951 samples/s/p 5:48:18 } +2024-07-25 19:19:19,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 417/ 1625], loss: 0.937, per_step_time: 1471ms, lr: 2.994214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:19,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.43598 samples/s/p 5:48:29 } +2024-07-25 19:19:22,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 419/ 1625], loss: 1.222, per_step_time: 1474ms, lr: 2.9941586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:22,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.42547 samples/s/p 5:49:07 } +2024-07-25 19:19:25,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 421/ 1625], loss: 1.013, per_step_time: 1470ms, lr: 2.9941026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:25,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.44005 samples/s/p 5:48:08 } +2024-07-25 19:19:28,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
2/ 10], step:[ 423/ 1625], loss: 1.266, per_step_time: 1469ms, lr: 2.9940466e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:28,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.44402 samples/s/p 5:47:49 } +2024-07-25 19:19:31,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 425/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.9939898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:31,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.43792 samples/s/p 5:48:10 } +2024-07-25 19:19:34,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 427/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 2.9939329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:34,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.42920 samples/s/p 5:48:40 } +2024-07-25 19:19:37,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 429/ 1625], loss: 1.238, per_step_time: 1473ms, lr: 2.9938761e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:37,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.42956 samples/s/p 5:48:36 } +2024-07-25 19:19:40,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 431/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 2.9938186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:40,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43534 samples/s/p 5:48:11 } +2024-07-25 19:19:43,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 433/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.9937613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:43,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 12.7% |██████ | 5.43825 samples/s/p 5:47:57 } +2024-07-25 19:19:46,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 435/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 2.9937031e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:46,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43327 samples/s/p 5:48:13 } +2024-07-25 19:19:49,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 437/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.9936451e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:49,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43564 samples/s/p 5:48:01 } +2024-07-25 19:19:52,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 439/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 2.9935867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:52,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43572 samples/s/p 5:47:58 } +2024-07-25 19:19:55,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 441/ 1625], loss: 1.141, per_step_time: 1469ms, lr: 2.993528e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:55,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.44229 samples/s/p 5:47:30 } +2024-07-25 19:19:58,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 443/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 2.9934692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:58,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43351 samples/s/p 5:48:00 } +2024-07-25 19:20:01,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 445/ 1625], loss: 1.217, per_step_time: 
1472ms, lr: 2.9934099e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:01,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43457 samples/s/p 5:47:53 } +2024-07-25 19:20:04,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 447/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 2.9933506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:04,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43135 samples/s/p 5:48:03 } +2024-07-25 19:20:07,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 449/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 2.9932908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:07,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43351 samples/s/p 5:47:51 } +2024-07-25 19:20:10,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 451/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 2.9932306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:10,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43335 samples/s/p 5:47:49 } +2024-07-25 19:20:13,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 453/ 1625], loss: 1.096, per_step_time: 1473ms, lr: 2.9931705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:13,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43092 samples/s/p 5:47:56 } +2024-07-25 19:20:15,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 455/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.99311e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:15,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43179 samples/s/p 5:47:49 } 
+2024-07-25 19:20:18,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 457/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 2.9930492e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:18,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43633 samples/s/p 5:47:29 } +2024-07-25 19:20:21,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 459/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 2.992988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:21,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43215 samples/s/p 5:47:42 } +2024-07-25 19:20:24,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 461/ 1625], loss: 1.073, per_step_time: 1474ms, lr: 2.9929268e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:24,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.42475 samples/s/p 5:48:07 } +2024-07-25 19:20:27,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 463/ 1625], loss: 1.391, per_step_time: 1470ms, lr: 2.9928653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:27,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.44074 samples/s/p 5:47:03 } +2024-07-25 19:20:30,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 465/ 1625], loss: 1.084, per_step_time: 1473ms, lr: 2.9928033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:30,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.42892 samples/s/p 5:47:46 } +2024-07-25 19:20:33,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 467/ 1625], loss: 1.345, per_step_time: 1472ms, lr: 2.9927412e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:20:33,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43461 samples/s/p 5:47:21 } +2024-07-25 19:20:36,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 469/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.9926789e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:36,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43489 samples/s/p 5:47:17 } +2024-07-25 19:20:39,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 471/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 2.9926163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:39,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43499 samples/s/p 5:47:13 } +2024-07-25 19:20:42,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 473/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 2.9925533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:42,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43772 samples/s/p 5:47:00 } +2024-07-25 19:20:45,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 475/ 1625], loss: 1.206, per_step_time: 1469ms, lr: 2.99249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:45,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.44479 samples/s/p 5:46:30 } +2024-07-25 19:20:48,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 477/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.9924267e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:48,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43701 samples/s/p 5:46:57 } +2024-07-25 19:20:51,382 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 479/ 1625], loss: 1.109, per_step_time: 1471ms, lr: 2.9923629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:51,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43799 samples/s/p 5:46:50 } +2024-07-25 19:20:54,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 481/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 2.9922989e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:54,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43214 samples/s/p 5:47:10 } +2024-07-25 19:20:57,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 483/ 1625], loss: 1.255, per_step_time: 1472ms, lr: 2.9922347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:57,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43265 samples/s/p 5:47:05 } +2024-07-25 19:21:00,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 485/ 1625], loss: 1.120, per_step_time: 1470ms, lr: 2.9921703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:00,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.44005 samples/s/p 5:46:33 } +2024-07-25 19:21:03,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 487/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 2.9921053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:03,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43096 samples/s/p 5:47:05 } +2024-07-25 19:21:06,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 489/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 2.9920404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:21:06,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43111 samples/s/p 5:47:02 } +2024-07-25 19:21:09,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 491/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 2.991975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:09,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43536 samples/s/p 5:46:43 } +2024-07-25 19:21:12,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 493/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 2.9919096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:12,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.44160 samples/s/p 5:46:16 } +2024-07-25 19:21:14,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 495/ 1625], loss: 1.365, per_step_time: 1473ms, lr: 2.9918436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:14,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43103 samples/s/p 5:46:53 } +2024-07-25 19:21:17,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 497/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 2.9917775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:17,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43824 samples/s/p 5:46:23 } +2024-07-25 19:21:20,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 499/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 2.9917113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:20,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43626 samples/s/p 5:46:27 } +2024-07-25 19:21:23,841 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 501/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 2.9916446e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:23,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43721 samples/s/p 5:46:21 } +2024-07-25 19:21:26,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 503/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 2.9915775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:26,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43310 samples/s/p 5:46:34 } +2024-07-25 19:21:29,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 505/ 1625], loss: 1.269, per_step_time: 1471ms, lr: 2.9915103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:29,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43550 samples/s/p 5:46:21 } +2024-07-25 19:21:32,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 507/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 2.991443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:32,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43154 samples/s/p 5:46:34 } +2024-07-25 19:21:35,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 509/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.9913752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:35,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43664 samples/s/p 5:46:11 } +2024-07-25 19:21:38,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 511/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.9913072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:38,598 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43579 samples/s/p 5:46:11 } +2024-07-25 19:21:41,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 513/ 1625], loss: 1.351, per_step_time: 1472ms, lr: 2.991239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:41,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43379 samples/s/p 5:46:16 } +2024-07-25 19:21:44,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 515/ 1625], loss: 1.298, per_step_time: 1471ms, lr: 2.9911704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:44,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43838 samples/s/p 5:45:56 } +2024-07-25 19:21:47,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 517/ 1625], loss: 1.050, per_step_time: 1473ms, lr: 2.9911018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:47,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.42827 samples/s/p 5:46:31 } +2024-07-25 19:21:50,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 519/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.9910327e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:50,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43614 samples/s/p 5:45:58 } +2024-07-25 19:21:53,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 521/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 2.9909634e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:53,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43241 samples/s/p 5:46:10 } +2024-07-25 19:21:56,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
2/ 10], step:[ 523/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 2.9908939e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:56,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43103 samples/s/p 5:46:12 } +2024-07-25 19:21:59,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 525/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.9908242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:59,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43661 samples/s/p 5:45:48 } +2024-07-25 19:22:02,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 527/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 2.9907538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:02,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.44087 samples/s/p 5:45:29 } +2024-07-25 19:22:05,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 529/ 1625], loss: 1.207, per_step_time: 1473ms, lr: 2.9906834e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:05,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43087 samples/s/p 5:46:04 } +2024-07-25 19:22:08,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 531/ 1625], loss: 1.259, per_step_time: 1472ms, lr: 2.9906128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:08,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43460 samples/s/p 5:45:47 } +2024-07-25 19:22:11,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 533/ 1625], loss: 1.311, per_step_time: 1473ms, lr: 2.990542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:11,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
13.3% |██████ | 5.42878 samples/s/p 5:46:06 } +2024-07-25 19:22:14,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 535/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 2.9904708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:14,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43282 samples/s/p 5:45:47 } +2024-07-25 19:22:16,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 537/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 2.9903993e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:16,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43627 samples/s/p 5:45:31 } +2024-07-25 19:22:19,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 539/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 2.9903278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:19,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43339 samples/s/p 5:45:39 } +2024-07-25 19:22:22,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 541/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 2.9902556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:22,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43382 samples/s/p 5:45:35 } +2024-07-25 19:22:25,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 543/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 2.9901834e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:25,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43507 samples/s/p 5:45:27 } +2024-07-25 19:22:28,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 545/ 1625], loss: 1.101, per_step_time: 1470ms, 
lr: 2.990111e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:28,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.44156 samples/s/p 5:44:59 } +2024-07-25 19:22:31,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 547/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 2.990038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:31,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43225 samples/s/p 5:45:32 } +2024-07-25 19:22:34,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 549/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 2.9899651e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:34,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43447 samples/s/p 5:45:21 } +2024-07-25 19:22:37,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 551/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 2.9898918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:37,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43116 samples/s/p 5:45:30 } +2024-07-25 19:22:40,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 553/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 2.9898185e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:40,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43818 samples/s/p 5:45:01 } +2024-07-25 19:22:43,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 555/ 1625], loss: 1.062, per_step_time: 1470ms, lr: 2.9897445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:43,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.44031 samples/s/p 5:44:49 } +2024-07-25 
19:22:46,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 557/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 2.9896704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:46,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43113 samples/s/p 5:45:22 } +2024-07-25 19:22:49,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 559/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 2.9895962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:49,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.42829 samples/s/p 5:45:29 } +2024-07-25 19:22:52,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 561/ 1625], loss: 1.331, per_step_time: 1471ms, lr: 2.9895215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:52,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43605 samples/s/p 5:44:57 } +2024-07-25 19:22:55,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 563/ 1625], loss: 1.104, per_step_time: 1470ms, lr: 2.9894465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:55,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.44037 samples/s/p 5:44:38 } +2024-07-25 19:22:58,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 565/ 1625], loss: 1.060, per_step_time: 1473ms, lr: 2.9893716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:58,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43045 samples/s/p 5:45:12 } +2024-07-25 19:23:01,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 567/ 1625], loss: 1.273, per_step_time: 1471ms, lr: 2.9892959e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:23:01,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43606 samples/s/p 5:44:48 } +2024-07-25 19:23:04,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 569/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 2.9892202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:04,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43526 samples/s/p 5:44:48 } +2024-07-25 19:23:07,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 571/ 1625], loss: 0.978, per_step_time: 1471ms, lr: 2.9891444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:07,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43555 samples/s/p 5:44:44 } +2024-07-25 19:23:10,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 573/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.9890682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:10,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43792 samples/s/p 5:44:32 } +2024-07-25 19:23:13,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 575/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 2.9889916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:13,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43402 samples/s/p 5:44:44 } +2024-07-25 19:23:15,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 577/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 2.9889148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:15,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43119 samples/s/p 5:44:52 } +2024-07-25 19:23:18,938 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 579/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 2.9888379e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:18,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.44054 samples/s/p 5:44:13 } +2024-07-25 19:23:21,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 581/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.9887606e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:21,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43382 samples/s/p 5:44:36 } +2024-07-25 19:23:24,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 583/ 1625], loss: 1.335, per_step_time: 1471ms, lr: 2.988683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:24,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43529 samples/s/p 5:44:27 } +2024-07-25 19:23:27,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 585/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 2.9886052e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:27,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43670 samples/s/p 5:44:19 } +2024-07-25 19:23:30,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 587/ 1625], loss: 1.113, per_step_time: 1473ms, lr: 2.9885274e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:30,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.42989 samples/s/p 5:44:42 } +2024-07-25 19:23:33,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 589/ 1625], loss: 1.420, per_step_time: 1472ms, lr: 2.9884488e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:23:33,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43287 samples/s/p 5:44:28 } +2024-07-25 19:23:36,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 591/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 2.9883704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:36,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43396 samples/s/p 5:44:21 } +2024-07-25 19:23:39,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 593/ 1625], loss: 1.284, per_step_time: 1474ms, lr: 2.988291e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:39,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.42686 samples/s/p 5:44:45 } +2024-07-25 19:23:42,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 595/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 2.988212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:42,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43748 samples/s/p 5:44:01 } +2024-07-25 19:23:45,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 597/ 1625], loss: 1.282, per_step_time: 1473ms, lr: 2.9881328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:45,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43087 samples/s/p 5:44:24 } +2024-07-25 19:23:48,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 599/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 2.9880532e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:48,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.44002 samples/s/p 5:43:46 } +2024-07-25 19:23:51,406 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 601/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 2.9879731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:51,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43482 samples/s/p 5:44:03 } +2024-07-25 19:23:54,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 603/ 1625], loss: 1.055, per_step_time: 1471ms, lr: 2.9878931e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:54,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43672 samples/s/p 5:43:53 } +2024-07-25 19:23:57,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 605/ 1625], loss: 1.333, per_step_time: 1472ms, lr: 2.9878125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:57,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43401 samples/s/p 5:44:00 } +2024-07-25 19:24:00,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 607/ 1625], loss: 1.182, per_step_time: 1473ms, lr: 2.9877318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:00,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.42986 samples/s/p 5:44:13 } +2024-07-25 19:24:03,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 609/ 1625], loss: 1.312, per_step_time: 1472ms, lr: 2.987651e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:03,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43215 samples/s/p 5:44:01 } +2024-07-25 19:24:06,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 611/ 1625], loss: 1.324, per_step_time: 1473ms, lr: 2.9875695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:06,167 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43106 samples/s/p 5:44:02 } +2024-07-25 19:24:09,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 613/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 2.9874882e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:09,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43643 samples/s/p 5:43:39 } +2024-07-25 19:24:12,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 615/ 1625], loss: 1.271, per_step_time: 1474ms, lr: 2.9874062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:12,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.42644 samples/s/p 5:44:14 } +2024-07-25 19:24:15,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 617/ 1625], loss: 1.331, per_step_time: 1471ms, lr: 2.9873243e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:15,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43547 samples/s/p 5:43:37 } +2024-07-25 19:24:17,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 619/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 2.9872419e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:17,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43604 samples/s/p 5:43:32 } +2024-07-25 19:24:20,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 621/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 2.9871593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:20,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43586 samples/s/p 5:43:29 } +2024-07-25 19:24:23,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 2/ 10], step:[ 623/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.9870764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:23,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43329 samples/s/p 5:43:36 } +2024-07-25 19:24:26,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 625/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 2.9869934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:26,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43214 samples/s/p 5:43:38 } +2024-07-25 19:24:29,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 627/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.9869097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:29,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43308 samples/s/p 5:43:31 } +2024-07-25 19:24:32,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 629/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.986826e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:32,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43483 samples/s/p 5:43:21 } +2024-07-25 19:24:35,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 631/ 1625], loss: 1.349, per_step_time: 1473ms, lr: 2.9867424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:35,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.42936 samples/s/p 5:43:39 } +2024-07-25 19:24:38,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 633/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.986658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:38,636 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 13.9% |██████ | 5.43490 samples/s/p 5:43:15 } +2024-07-25 19:24:41,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 635/ 1625], loss: 1.105, per_step_time: 1470ms, lr: 2.9865738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:41,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43902 samples/s/p 5:42:57 } +2024-07-25 19:24:44,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 637/ 1625], loss: 1.286, per_step_time: 1471ms, lr: 2.986489e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:44,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43683 samples/s/p 5:43:02 } +2024-07-25 19:24:47,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 639/ 1625], loss: 1.244, per_step_time: 1470ms, lr: 2.9864039e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:47,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.44095 samples/s/p 5:42:44 } +2024-07-25 19:24:50,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 641/ 1625], loss: 1.287, per_step_time: 1474ms, lr: 2.9863188e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:50,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.42464 samples/s/p 5:43:42 } +2024-07-25 19:24:53,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 643/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.9862333e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:53,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.43213 samples/s/p 5:43:11 } +2024-07-25 19:24:56,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 645/ 1625], loss: 1.095, per_step_time: 
1471ms, lr: 2.9861474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:56,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.43525 samples/s/p 5:42:56 } +2024-07-25 19:24:59,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 647/ 1625], loss: 1.180, per_step_time: 1470ms, lr: 2.9860614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:59,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.44150 samples/s/p 5:42:30 } +2024-07-25 19:25:02,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 649/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 2.9859752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:02,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.43573 samples/s/p 5:42:49 } +2024-07-25 19:25:05,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 651/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.9858886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:05,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.43501 samples/s/p 5:42:48 } +2024-07-25 19:25:08,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 653/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 2.9858018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:08,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.43435 samples/s/p 5:42:48 } +2024-07-25 19:25:11,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 655/ 1625], loss: 1.277, per_step_time: 1471ms, lr: 2.9857147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:11,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.43744 samples/s/p 5:42:33 } 
+2024-07-25 19:25:14,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 657/ 1625], loss: 1.191, per_step_time: 1476ms, lr: 2.9856272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:14,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.41983 samples/s/p 5:43:37 } +2024-07-25 19:25:17,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 659/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.9855397e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:17,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43624 samples/s/p 5:42:32 } +2024-07-25 19:25:19,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 661/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 2.9854516e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:19,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43438 samples/s/p 5:42:36 } +2024-07-25 19:25:22,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 663/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 2.9853638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:22,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.42837 samples/s/p 5:42:56 } +2024-07-25 19:25:25,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 665/ 1625], loss: 1.203, per_step_time: 1473ms, lr: 2.9852752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:25,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.42976 samples/s/p 5:42:48 } +2024-07-25 19:25:28,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 667/ 1625], loss: 1.036, per_step_time: 1471ms, lr: 2.9851866e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:25:28,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43586 samples/s/p 5:42:22 } +2024-07-25 19:25:31,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 669/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 2.9850975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:31,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43195 samples/s/p 5:42:33 } +2024-07-25 19:25:34,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 671/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 2.9850084e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:34,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43827 samples/s/p 5:42:07 } +2024-07-25 19:25:37,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 673/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.984919e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:37,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43263 samples/s/p 5:42:25 } +2024-07-25 19:25:40,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 675/ 1625], loss: 1.031, per_step_time: 1472ms, lr: 2.9848292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:40,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43405 samples/s/p 5:42:17 } +2024-07-25 19:25:43,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 677/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 2.984739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:43,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43110 samples/s/p 5:42:25 } +2024-07-25 19:25:46,522 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 679/ 1625], loss: 1.279, per_step_time: 1472ms, lr: 2.9846487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:46,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43432 samples/s/p 5:42:10 } +2024-07-25 19:25:49,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 681/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 2.9845582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:49,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.42922 samples/s/p 5:42:26 } +2024-07-25 19:25:52,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 683/ 1625], loss: 1.056, per_step_time: 1472ms, lr: 2.9844676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:52,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43227 samples/s/p 5:42:12 } +2024-07-25 19:25:55,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 685/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 2.9843766e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:55,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43761 samples/s/p 5:41:49 } +2024-07-25 19:25:58,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 687/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 2.9842851e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:58,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43806 samples/s/p 5:41:44 } +2024-07-25 19:26:01,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 689/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 2.9841935e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:26:01,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43200 samples/s/p 5:42:04 } +2024-07-25 19:26:04,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 691/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 2.9841016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:04,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43104 samples/s/p 5:42:05 } +2024-07-25 19:26:07,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 693/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 2.9840096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:07,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43476 samples/s/p 5:41:47 } +2024-07-25 19:26:10,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 695/ 1625], loss: 1.242, per_step_time: 1473ms, lr: 2.9839173e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:10,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.42873 samples/s/p 5:42:07 } +2024-07-25 19:26:13,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 697/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 2.9838244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:13,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43309 samples/s/p 5:41:48 } +2024-07-25 19:26:16,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 699/ 1625], loss: 1.255, per_step_time: 1473ms, lr: 2.9837316e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:16,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.42864 samples/s/p 5:42:02 } +2024-07-25 19:26:18,995 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 701/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 2.9836385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:18,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43718 samples/s/p 5:41:27 } +2024-07-25 19:26:21,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 703/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 2.9835448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:21,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.44132 samples/s/p 5:41:08 } +2024-07-25 19:26:24,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 705/ 1625], loss: 1.054, per_step_time: 1472ms, lr: 2.9834513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:24,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43312 samples/s/p 5:41:36 } +2024-07-25 19:26:27,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 707/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 2.9833573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:27,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43331 samples/s/p 5:41:32 } +2024-07-25 19:26:30,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 709/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 2.9832629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:30,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.42998 samples/s/p 5:41:42 } +2024-07-25 19:26:33,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 711/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 2.9831685e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:26:33,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43123 samples/s/p 5:41:34 } +2024-07-25 19:26:36,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 713/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.9830737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:36,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43313 samples/s/p 5:41:24 } +2024-07-25 19:26:39,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 715/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 2.9829787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:39,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43520 samples/s/p 5:41:13 } +2024-07-25 19:26:42,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 717/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 2.9828832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:42,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43354 samples/s/p 5:41:17 } +2024-07-25 19:26:45,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 719/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 2.982788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:45,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43530 samples/s/p 5:41:07 } +2024-07-25 19:26:48,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 721/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.982692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:48,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43170 samples/s/p 5:41:18 } +2024-07-25 19:26:51,464 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 723/ 1625], loss: 1.023, per_step_time: 1472ms, lr: 2.982596e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:51,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43187 samples/s/p 5:41:14 } +2024-07-25 19:26:54,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 725/ 1625], loss: 1.047, per_step_time: 1473ms, lr: 2.9824996e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:54,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43107 samples/s/p 5:41:14 } +2024-07-25 19:26:57,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 727/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 2.9824028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:57,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43157 samples/s/p 5:41:09 } +2024-07-25 19:27:00,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 729/ 1625], loss: 1.359, per_step_time: 1474ms, lr: 2.9823059e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:00,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.42722 samples/s/p 5:41:23 } +2024-07-25 19:27:03,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 731/ 1625], loss: 1.351, per_step_time: 1471ms, lr: 2.9822088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:03,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43518 samples/s/p 5:40:50 } +2024-07-25 19:27:06,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 733/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.9821114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:27:06,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43376 samples/s/p 5:40:52 } +2024-07-25 19:27:09,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 735/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 2.9820138e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:09,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43799 samples/s/p 5:40:34 } +2024-07-25 19:27:12,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 737/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 2.9819159e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:12,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43378 samples/s/p 5:40:46 } +2024-07-25 19:27:15,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 739/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 2.9818177e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:15,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.42963 samples/s/p 5:40:59 } +2024-07-25 19:27:18,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 741/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.9817189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:18,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.43141 samples/s/p 5:40:49 } +2024-07-25 19:27:20,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 743/ 1625], loss: 1.389, per_step_time: 1472ms, lr: 2.9816205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:20,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.43354 samples/s/p 5:40:38 } +2024-07-25 19:27:23,935 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 745/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 2.9815214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:23,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.44119 samples/s/p 5:40:07 } +2024-07-25 19:27:26,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 747/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.9814222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:26,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.43333 samples/s/p 5:40:33 } +2024-07-25 19:27:29,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 749/ 1625], loss: 1.235, per_step_time: 1474ms, lr: 2.9813224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:29,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.42677 samples/s/p 5:40:55 } +2024-07-25 19:27:32,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 751/ 1625], loss: 1.108, per_step_time: 1474ms, lr: 2.9812229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:32,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.42497 samples/s/p 5:40:59 } +2024-07-25 19:27:35,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 753/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.9811226e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:35,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.43253 samples/s/p 5:40:28 } +2024-07-25 19:27:38,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 755/ 1625], loss: 1.218, per_step_time: 1481ms, lr: 2.9810224e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:27:38,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.39900 samples/s/p 5:42:31 } +2024-07-25 19:27:41,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 757/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 2.9809218e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:41,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43083 samples/s/p 5:40:28 } +2024-07-25 19:27:44,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 759/ 1625], loss: 1.345, per_step_time: 1473ms, lr: 2.9808209e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:44,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43012 samples/s/p 5:40:28 } +2024-07-25 19:27:47,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 761/ 1625], loss: 1.106, per_step_time: 1473ms, lr: 2.98072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:47,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43096 samples/s/p 5:40:22 } +2024-07-25 19:27:50,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 763/ 1625], loss: 1.238, per_step_time: 1473ms, lr: 2.9806186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:50,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43005 samples/s/p 5:40:22 } +2024-07-25 19:27:53,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 765/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 2.9805167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:53,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43532 samples/s/p 5:39:59 } +2024-07-25 19:27:56,439 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 767/ 1625], loss: 1.042, per_step_time: 1472ms, lr: 2.9804149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:56,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43297 samples/s/p 5:40:05 } +2024-07-25 19:27:59,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 769/ 1625], loss: 1.125, per_step_time: 1473ms, lr: 2.9803128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:59,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.42830 samples/s/p 5:40:20 } +2024-07-25 19:28:02,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 771/ 1625], loss: 1.234, per_step_time: 1473ms, lr: 2.9802102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:02,347 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43050 samples/s/p 5:40:09 } +2024-07-25 19:28:05,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 773/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 2.9801076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:05,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.43359 samples/s/p 5:39:54 } +2024-07-25 19:28:08,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 775/ 1625], loss: 1.220, per_step_time: 1469ms, lr: 2.9800045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:08,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.44296 samples/s/p 5:39:16 } +2024-07-25 19:28:11,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 777/ 1625], loss: 1.292, per_step_time: 1474ms, lr: 2.9799015e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:28:11,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.42620 samples/s/p 5:40:16 } +2024-07-25 19:28:14,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 779/ 1625], loss: 1.054, per_step_time: 1470ms, lr: 2.9797979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:14,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.44157 samples/s/p 5:39:15 } +2024-07-25 19:28:17,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 781/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 2.9796942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:17,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.43482 samples/s/p 5:39:38 } +2024-07-25 19:28:20,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 783/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 2.9795901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:20,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.42934 samples/s/p 5:39:55 } +2024-07-25 19:28:23,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 785/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.9794859e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:23,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.43444 samples/s/p 5:39:33 } +2024-07-25 19:28:25,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 787/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.9793813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:25,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.42860 samples/s/p 5:39:52 } +2024-07-25 19:28:28,910 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 789/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 2.9792765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:28,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43636 samples/s/p 5:39:20 } +2024-07-25 19:28:31,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 791/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 2.9791714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:31,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43272 samples/s/p 5:39:31 } +2024-07-25 19:28:34,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 793/ 1625], loss: 0.885, per_step_time: 1469ms, lr: 2.979066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:34,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.44261 samples/s/p 5:38:51 } +2024-07-25 19:28:37,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 795/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 2.9789604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:37,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43683 samples/s/p 5:39:10 } +2024-07-25 19:28:40,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 797/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 2.9788547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:40,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43426 samples/s/p 5:39:16 } +2024-07-25 19:28:43,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 799/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 2.9787485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:28:43,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43562 samples/s/p 5:39:08 } +2024-07-25 19:28:46,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 801/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 2.978642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:46,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43354 samples/s/p 5:39:13 } +2024-07-25 19:28:49,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 803/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 2.9785355e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:49,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43886 samples/s/p 5:38:50 } +2024-07-25 19:28:52,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 805/ 1625], loss: 1.279, per_step_time: 1471ms, lr: 2.9784285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:52,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43739 samples/s/p 5:38:53 } +2024-07-25 19:28:55,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 807/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 2.9783214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:55,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43666 samples/s/p 5:38:53 } +2024-07-25 19:28:58,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 809/ 1625], loss: 1.312, per_step_time: 1472ms, lr: 2.9782139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:58,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43443 samples/s/p 5:38:58 } +2024-07-25 19:29:01,363 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 811/ 1625], loss: 1.009, per_step_time: 1471ms, lr: 2.9781062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:01,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43753 samples/s/p 5:38:43 } +2024-07-25 19:29:04,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 813/ 1625], loss: 1.174, per_step_time: 1473ms, lr: 2.9779982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:04,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.42854 samples/s/p 5:39:14 } +2024-07-25 19:29:07,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 815/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 2.97789e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:07,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43472 samples/s/p 5:38:48 } +2024-07-25 19:29:10,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 817/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 2.9777813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:10,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43154 samples/s/p 5:38:57 } +2024-07-25 19:29:13,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 819/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 2.9776727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:13,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43424 samples/s/p 5:38:44 } +2024-07-25 19:29:16,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 821/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 2.9775636e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:29:16,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43423 samples/s/p 5:38:41 } +2024-07-25 19:29:19,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 823/ 1625], loss: 1.268, per_step_time: 1470ms, lr: 2.9774543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:19,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43850 samples/s/p 5:38:22 } +2024-07-25 19:29:22,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 825/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 2.9773448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:22,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.44149 samples/s/p 5:38:08 } +2024-07-25 19:29:24,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 827/ 1625], loss: 1.146, per_step_time: 1477ms, lr: 2.977235e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:24,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.41458 samples/s/p 5:39:46 } +2024-07-25 19:29:27,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 829/ 1625], loss: 1.279, per_step_time: 1470ms, lr: 2.9771249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:27,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43912 samples/s/p 5:38:11 } +2024-07-25 19:29:30,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 831/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 2.9770146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:30,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43587 samples/s/p 5:38:20 } +2024-07-25 19:29:33,835 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 833/ 1625], loss: 1.014, per_step_time: 1473ms, lr: 2.9769039e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:33,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.42992 samples/s/p 5:38:39 } +2024-07-25 19:29:36,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 835/ 1625], loss: 1.198, per_step_time: 1470ms, lr: 2.9767929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:36,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43871 samples/s/p 5:38:04 } +2024-07-25 19:29:39,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 837/ 1625], loss: 1.070, per_step_time: 1473ms, lr: 2.976682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:39,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.42903 samples/s/p 5:38:37 } +2024-07-25 19:29:42,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 839/ 1625], loss: 1.367, per_step_time: 1471ms, lr: 2.9765704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:42,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43573 samples/s/p 5:38:09 } +2024-07-25 19:29:45,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 841/ 1625], loss: 0.965, per_step_time: 1472ms, lr: 2.9764587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:45,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43285 samples/s/p 5:38:17 } +2024-07-25 19:29:48,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 843/ 1625], loss: 1.341, per_step_time: 1470ms, lr: 2.976347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:29:48,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.44055 samples/s/p 5:37:45 } +2024-07-25 19:29:51,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 845/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 2.9762348e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:51,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43036 samples/s/p 5:38:20 } +2024-07-25 19:29:54,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 847/ 1625], loss: 1.444, per_step_time: 1471ms, lr: 2.9761222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:54,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43538 samples/s/p 5:37:59 } +2024-07-25 19:29:57,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 849/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 2.9760096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:57,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43278 samples/s/p 5:38:05 } +2024-07-25 19:30:00,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 851/ 1625], loss: 1.169, per_step_time: 1472ms, lr: 2.9758965e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:00,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43413 samples/s/p 5:37:57 } +2024-07-25 19:30:03,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 853/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 2.9757832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:03,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.42971 samples/s/p 5:38:11 } +2024-07-25 19:30:06,303 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 855/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 2.9756698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:06,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43646 samples/s/p 5:37:43 } +2024-07-25 19:30:09,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 857/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.975556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:09,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43408 samples/s/p 5:37:49 } +2024-07-25 19:30:12,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 859/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.975442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:12,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43609 samples/s/p 5:37:38 } +2024-07-25 19:30:15,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 861/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 2.9753279e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:15,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43405 samples/s/p 5:37:43 } +2024-07-25 19:30:18,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 863/ 1625], loss: 1.096, per_step_time: 1473ms, lr: 2.9752133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:18,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.42901 samples/s/p 5:37:59 } +2024-07-25 19:30:21,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 865/ 1625], loss: 1.202, per_step_time: 1474ms, lr: 2.9750983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:30:21,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.42582 samples/s/p 5:38:08 } +2024-07-25 19:30:24,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 867/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 2.9749832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:24,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43702 samples/s/p 5:37:23 } +2024-07-25 19:30:26,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 869/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 2.9748679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:26,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43566 samples/s/p 5:37:25 } +2024-07-25 19:30:29,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 871/ 1625], loss: 1.134, per_step_time: 1470ms, lr: 2.9747522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:29,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.44182 samples/s/p 5:36:59 } +2024-07-25 19:30:32,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 873/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 2.9746365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:32,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43611 samples/s/p 5:37:18 } +2024-07-25 19:30:35,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 875/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 2.9745202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:35,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43930 samples/s/p 5:37:03 } +2024-07-25 19:30:38,765 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 877/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 2.9744038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:38,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43444 samples/s/p 5:37:18 } +2024-07-25 19:30:41,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 879/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.9742872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:41,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43405 samples/s/p 5:37:16 } +2024-07-25 19:30:44,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 881/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 2.9741705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:44,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43621 samples/s/p 5:37:05 } +2024-07-25 19:30:47,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 883/ 1625], loss: 1.387, per_step_time: 1471ms, lr: 2.9740533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:47,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43634 samples/s/p 5:37:02 } +2024-07-25 19:30:50,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 885/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 2.9739356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:50,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.44157 samples/s/p 5:36:40 } +2024-07-25 19:30:53,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 887/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 2.9738178e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:30:53,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.43506 samples/s/p 5:37:01 } +2024-07-25 19:30:56,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 889/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 2.9736999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:56,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.43749 samples/s/p 5:36:49 } +2024-07-25 19:30:59,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 891/ 1625], loss: 1.335, per_step_time: 1473ms, lr: 2.9735816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:59,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.43100 samples/s/p 5:37:10 } +2024-07-25 19:31:02,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 893/ 1625], loss: 1.258, per_step_time: 1474ms, lr: 2.973463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:02,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.42662 samples/s/p 5:37:23 } +2024-07-25 19:31:05,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 895/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 2.9733445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:05,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.43785 samples/s/p 5:36:39 } +2024-07-25 19:31:08,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 897/ 1625], loss: 1.307, per_step_time: 1470ms, lr: 2.9732257e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:08,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.44047 samples/s/p 5:36:26 } +2024-07-25 19:31:11,224 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 899/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 2.973106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:11,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.43150 samples/s/p 5:36:56 } +2024-07-25 19:31:14,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 901/ 1625], loss: 1.169, per_step_time: 1473ms, lr: 2.9729865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:14,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.42893 samples/s/p 5:37:03 } +2024-07-25 19:31:17,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 903/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 2.9728668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:17,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43540 samples/s/p 5:36:36 } +2024-07-25 19:31:20,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 905/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 2.9727466e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:20,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43535 samples/s/p 5:36:33 } +2024-07-25 19:31:23,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 907/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.9726263e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:23,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43615 samples/s/p 5:36:27 } +2024-07-25 19:31:25,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 909/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.9725057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:31:25,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43238 samples/s/p 5:36:38 } +2024-07-25 19:31:28,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 911/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 2.972385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:28,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43930 samples/s/p 5:36:10 } +2024-07-25 19:31:31,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 913/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.9722638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:31,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43553 samples/s/p 5:36:21 } +2024-07-25 19:31:34,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 915/ 1625], loss: 1.150, per_step_time: 1473ms, lr: 2.9721425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:34,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.42950 samples/s/p 5:36:40 } +2024-07-25 19:31:37,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 917/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 2.9720208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:37,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43717 samples/s/p 5:36:09 } +2024-07-25 19:31:40,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 919/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 2.9718987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:40,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.44076 samples/s/p 5:35:53 } +2024-07-25 19:31:43,683 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 921/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 2.9717767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:43,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43614 samples/s/p 5:36:07 } +2024-07-25 19:31:46,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 923/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.9716544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:46,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43347 samples/s/p 5:36:14 } +2024-07-25 19:31:49,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 925/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 2.9715315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:49,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43229 samples/s/p 5:36:15 } +2024-07-25 19:31:52,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 927/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.9714083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:52,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43565 samples/s/p 5:36:00 } +2024-07-25 19:31:55,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 929/ 1625], loss: 1.329, per_step_time: 1472ms, lr: 2.9712852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:55,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43327 samples/s/p 5:36:06 } +2024-07-25 19:31:58,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 931/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 2.9711617e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:31:58,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43426 samples/s/p 5:35:59 } +2024-07-25 19:32:01,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 933/ 1625], loss: 1.436, per_step_time: 1474ms, lr: 2.971038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:01,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.42684 samples/s/p 5:36:24 } +2024-07-25 19:32:04,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 935/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 2.9709141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:04,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.42984 samples/s/p 5:36:10 } +2024-07-25 19:32:07,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 937/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 2.9707897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:07,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43674 samples/s/p 5:35:41 } +2024-07-25 19:32:10,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 939/ 1625], loss: 1.044, per_step_time: 1481ms, lr: 2.9706653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:10,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.39927 samples/s/p 5:37:58 } +2024-07-25 19:32:13,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 941/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.9705405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:13,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43751 samples/s/p 5:35:32 } +2024-07-25 19:32:16,171 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 943/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 2.9704153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:16,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43273 samples/s/p 5:35:47 } +2024-07-25 19:32:19,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 945/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.9702898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:19,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43626 samples/s/p 5:35:31 } +2024-07-25 19:32:22,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 947/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 2.9701643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:22,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43827 samples/s/p 5:35:21 } +2024-07-25 19:32:25,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 949/ 1625], loss: 0.999, per_step_time: 1472ms, lr: 2.9700386e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:25,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43435 samples/s/p 5:35:32 } +2024-07-25 19:32:27,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 951/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.9699124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:27,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43179 samples/s/p 5:35:39 } +2024-07-25 19:32:30,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 953/ 1625], loss: 1.263, per_step_time: 1474ms, lr: 2.9697861e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:32:30,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.42713 samples/s/p 5:35:53 } +2024-07-25 19:32:33,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 955/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.9696595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:33,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43658 samples/s/p 5:35:15 } +2024-07-25 19:32:36,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 957/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 2.9695326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:36,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.42902 samples/s/p 5:35:40 } +2024-07-25 19:32:39,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 959/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 2.9694054e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:39,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43225 samples/s/p 5:35:25 } +2024-07-25 19:32:42,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 961/ 1625], loss: 1.044, per_step_time: 1473ms, lr: 2.969278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:42,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43030 samples/s/p 5:35:29 } +2024-07-25 19:32:45,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 963/ 1625], loss: 1.204, per_step_time: 1473ms, lr: 2.9691504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:45,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43018 samples/s/p 5:35:27 } +2024-07-25 19:32:48,669 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 965/ 1625], loss: 1.397, per_step_time: 1483ms, lr: 2.9690224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:48,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.39162 samples/s/p 5:37:48 } +2024-07-25 19:32:51,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 967/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.9688941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:51,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.43518 samples/s/p 5:35:03 } +2024-07-25 19:32:54,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 969/ 1625], loss: 0.999, per_step_time: 1471ms, lr: 2.9687657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:54,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.43576 samples/s/p 5:34:58 } +2024-07-25 19:32:57,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 971/ 1625], loss: 1.005, per_step_time: 1472ms, lr: 2.9686367e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:57,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.43292 samples/s/p 5:35:05 } +2024-07-25 19:33:00,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 973/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.9685078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:00,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.43305 samples/s/p 5:35:02 } +2024-07-25 19:33:03,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 975/ 1625], loss: 1.261, per_step_time: 1470ms, lr: 2.9683788e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:33:03,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.43859 samples/s/p 5:34:38 } +2024-07-25 19:33:06,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 977/ 1625], loss: 1.140, per_step_time: 1474ms, lr: 2.9682491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:06,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.42614 samples/s/p 5:35:21 } +2024-07-25 19:33:09,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 979/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 2.9681194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:09,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.43756 samples/s/p 5:34:36 } +2024-07-25 19:33:12,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 981/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 2.9679892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:12,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.43776 samples/s/p 5:34:32 } +2024-07-25 19:33:15,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 983/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.967859e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:15,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.43151 samples/s/p 5:34:53 } +2024-07-25 19:33:18,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 985/ 1625], loss: 0.980, per_step_time: 1472ms, lr: 2.9677285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:18,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43276 samples/s/p 5:34:45 } +2024-07-25 19:33:21,134 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 987/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 2.9675975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:21,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43275 samples/s/p 5:34:42 } +2024-07-25 19:33:24,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 989/ 1625], loss: 1.337, per_step_time: 1472ms, lr: 2.9674666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:24,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43377 samples/s/p 5:34:35 } +2024-07-25 19:33:27,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 991/ 1625], loss: 1.347, per_step_time: 1471ms, lr: 2.967335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:27,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43726 samples/s/p 5:34:20 } +2024-07-25 19:33:29,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 993/ 1625], loss: 1.390, per_step_time: 1472ms, lr: 2.9672035e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:29,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43477 samples/s/p 5:34:26 } +2024-07-25 19:33:32,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 995/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 2.9670717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:32,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43872 samples/s/p 5:34:08 } +2024-07-25 19:33:35,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 997/ 1625], loss: 1.206, per_step_time: 1472ms, lr: 2.9669396e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:33:35,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43304 samples/s/p 5:34:26 } +2024-07-25 19:33:38,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 999/ 1625], loss: 1.359, per_step_time: 1471ms, lr: 2.9668072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:38,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43723 samples/s/p 5:34:08 } +2024-07-25 19:33:41,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1001/ 1625], loss: 0.931, per_step_time: 1471ms, lr: 2.9666744e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:41,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43603 samples/s/p 5:34:09 } +2024-07-25 19:33:44,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1003/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.9665418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:44,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43574 samples/s/p 5:34:08 } +2024-07-25 19:33:47,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1005/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 2.9664083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:47,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.42873 samples/s/p 5:34:30 } +2024-07-25 19:33:50,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1007/ 1625], loss: 1.099, per_step_time: 1469ms, lr: 2.966275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:50,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.44390 samples/s/p 5:33:32 } +2024-07-25 19:33:53,591 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1009/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.9661414e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:53,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43497 samples/s/p 5:34:02 } +2024-07-25 19:33:56,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1011/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.9660072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:56,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43556 samples/s/p 5:33:56 } +2024-07-25 19:33:59,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1013/ 1625], loss: 1.163, per_step_time: 1473ms, lr: 2.9658731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:59,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.42864 samples/s/p 5:34:19 } +2024-07-25 19:34:02,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1015/ 1625], loss: 1.301, per_step_time: 1473ms, lr: 2.9657387e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:02,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.42832 samples/s/p 5:34:17 } +2024-07-25 19:34:05,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1017/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.9656037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:05,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43304 samples/s/p 5:33:57 } +2024-07-25 19:34:08,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1019/ 1625], loss: 1.044, per_step_time: 1470ms, lr: 2.9654688e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:34:08,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.44039 samples/s/p 5:33:27 } +2024-07-25 19:34:11,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1021/ 1625], loss: 1.207, per_step_time: 1473ms, lr: 2.9653334e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:11,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43017 samples/s/p 5:34:02 } +2024-07-25 19:34:14,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1023/ 1625], loss: 1.089, per_step_time: 1473ms, lr: 2.9651981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:14,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43095 samples/s/p 5:33:56 } +2024-07-25 19:34:17,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1025/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.965062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:17,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43385 samples/s/p 5:33:42 } +2024-07-25 19:34:20,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1027/ 1625], loss: 1.127, per_step_time: 1473ms, lr: 2.964926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:20,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43085 samples/s/p 5:33:50 } +2024-07-25 19:34:23,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1029/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 2.9647897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:23,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43349 samples/s/p 5:33:38 } +2024-07-25 19:34:26,066 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1031/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.9646533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:26,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43164 samples/s/p 5:33:41 } +2024-07-25 19:34:29,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1033/ 1625], loss: 1.294, per_step_time: 1472ms, lr: 2.9645162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:29,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43295 samples/s/p 5:33:34 } +2024-07-25 19:34:31,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1035/ 1625], loss: 1.417, per_step_time: 1473ms, lr: 2.9643794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:31,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.42920 samples/s/p 5:33:45 } +2024-07-25 19:34:34,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1037/ 1625], loss: 1.258, per_step_time: 1471ms, lr: 2.964242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:34,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43494 samples/s/p 5:33:20 } +2024-07-25 19:34:37,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1039/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 2.9641044e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:37,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43201 samples/s/p 5:33:28 } +2024-07-25 19:34:40,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1041/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.9639665e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:34:40,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43260 samples/s/p 5:33:23 } +2024-07-25 19:34:43,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1043/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 2.9638284e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:43,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43533 samples/s/p 5:33:10 } +2024-07-25 19:34:46,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1045/ 1625], loss: 1.303, per_step_time: 1473ms, lr: 2.96369e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:46,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.42905 samples/s/p 5:33:30 } +2024-07-25 19:34:49,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1047/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.9635514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:49,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43492 samples/s/p 5:33:06 } +2024-07-25 19:34:52,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1049/ 1625], loss: 0.921, per_step_time: 1471ms, lr: 2.9634124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:52,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43799 samples/s/p 5:32:52 } +2024-07-25 19:34:55,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1051/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 2.963273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:55,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43437 samples/s/p 5:33:02 } +2024-07-25 19:34:58,533 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1053/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 2.9631337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:58,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43684 samples/s/p 5:32:50 } +2024-07-25 19:35:01,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1055/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 2.962994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:01,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.44101 samples/s/p 5:32:32 } +2024-07-25 19:35:04,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1057/ 1625], loss: 1.247, per_step_time: 1470ms, lr: 2.962854e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:04,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43954 samples/s/p 5:32:34 } +2024-07-25 19:35:07,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1059/ 1625], loss: 1.292, per_step_time: 1471ms, lr: 2.9627137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:07,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43595 samples/s/p 5:32:44 } +2024-07-25 19:35:10,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1061/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 2.9625733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:10,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43156 samples/s/p 5:32:58 } +2024-07-25 19:35:13,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1063/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 2.9624325e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:35:13,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43817 samples/s/p 5:32:30 } +2024-07-25 19:35:16,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1065/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 2.9622914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:16,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43394 samples/s/p 5:32:43 } +2024-07-25 19:35:19,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1067/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 2.9621502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:19,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43439 samples/s/p 5:32:38 } +2024-07-25 19:35:22,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1069/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.9620089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:22,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43332 samples/s/p 5:32:39 } +2024-07-25 19:35:25,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1071/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.961867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:25,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43576 samples/s/p 5:32:27 } +2024-07-25 19:35:28,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1073/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.961725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:28,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43548 samples/s/p 5:32:25 } +2024-07-25 19:35:30,991 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1075/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.9615825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:30,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43364 samples/s/p 5:32:29 } +2024-07-25 19:35:33,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1077/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 2.9614399e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:33,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.44166 samples/s/p 5:31:57 } +2024-07-25 19:35:36,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1079/ 1625], loss: 1.244, per_step_time: 1475ms, lr: 2.961297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:36,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.42032 samples/s/p 5:33:12 } +2024-07-25 19:35:39,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1081/ 1625], loss: 1.100, per_step_time: 1473ms, lr: 2.9611541e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:39,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43041 samples/s/p 5:32:32 } +2024-07-25 19:35:42,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1083/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.9610108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:42,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43543 samples/s/p 5:32:11 } +2024-07-25 19:35:45,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1085/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 2.960867e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:35:45,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43425 samples/s/p 5:32:12 } +2024-07-25 19:35:48,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1087/ 1625], loss: 1.018, per_step_time: 1471ms, lr: 2.9607232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:48,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43735 samples/s/p 5:31:58 } +2024-07-25 19:35:51,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1089/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 2.960579e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:51,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43728 samples/s/p 5:31:55 } +2024-07-25 19:35:54,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1091/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 2.9604347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:54,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43430 samples/s/p 5:32:03 } +2024-07-25 19:35:57,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1093/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 2.96029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:57,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43052 samples/s/p 5:32:14 } +2024-07-25 19:36:00,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1095/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 2.9601451e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:00,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43286 samples/s/p 5:32:03 } +2024-07-25 19:36:03,462 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1097/ 1625], loss: 1.317, per_step_time: 1472ms, lr: 2.96e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:03,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43357 samples/s/p 5:31:57 } +2024-07-25 19:36:06,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1099/ 1625], loss: 1.249, per_step_time: 1474ms, lr: 2.9598543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:06,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.42662 samples/s/p 5:32:20 } +2024-07-25 19:36:09,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1101/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 2.9597088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:09,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43973 samples/s/p 5:31:29 } +2024-07-25 19:36:12,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1103/ 1625], loss: 1.110, per_step_time: 1474ms, lr: 2.9595627e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:12,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.42735 samples/s/p 5:32:11 } +2024-07-25 19:36:15,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1105/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 2.9594165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:15,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43505 samples/s/p 5:31:40 } +2024-07-25 19:36:18,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1107/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.9592702e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:36:18,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43140 samples/s/p 5:31:50 } +2024-07-25 19:36:21,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1109/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 2.9591232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:21,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.42859 samples/s/p 5:31:58 } +2024-07-25 19:36:24,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1111/ 1625], loss: 1.093, per_step_time: 1473ms, lr: 2.9589763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:24,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43084 samples/s/p 5:31:47 } +2024-07-25 19:36:27,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1113/ 1625], loss: 1.123, per_step_time: 1473ms, lr: 2.958829e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:27,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.42945 samples/s/p 5:31:49 } +2024-07-25 19:36:30,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1115/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 2.9586816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:30,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43936 samples/s/p 5:31:09 } +2024-07-25 19:36:32,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1117/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 2.9585337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:32,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43149 samples/s/p 5:31:35 } +2024-07-25 19:36:35,940 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1119/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 2.9583858e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:35,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43298 samples/s/p 5:31:27 } +2024-07-25 19:36:38,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1121/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.9582376e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:38,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43337 samples/s/p 5:31:23 } +2024-07-25 19:36:41,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1123/ 1625], loss: 1.430, per_step_time: 1471ms, lr: 2.9580888e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:41,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43605 samples/s/p 5:31:10 } +2024-07-25 19:36:44,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1125/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 2.95794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:44,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43478 samples/s/p 5:31:12 } +2024-07-25 19:36:47,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1127/ 1625], loss: 1.177, per_step_time: 1469ms, lr: 2.9577908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:47,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.44537 samples/s/p 5:30:30 } +2024-07-25 19:36:50,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1129/ 1625], loss: 1.096, per_step_time: 1473ms, lr: 2.9576418e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:36:50,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.42999 samples/s/p 5:31:23 } +2024-07-25 19:36:53,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1131/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 2.9574921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:53,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43469 samples/s/p 5:31:03 } +2024-07-25 19:36:56,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1133/ 1625], loss: 1.323, per_step_time: 1473ms, lr: 2.957342e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:56,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43037 samples/s/p 5:31:16 } +2024-07-25 19:36:59,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1135/ 1625], loss: 1.307, per_step_time: 1471ms, lr: 2.957192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:59,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43721 samples/s/p 5:30:48 } +2024-07-25 19:37:02,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1137/ 1625], loss: 1.078, per_step_time: 1470ms, lr: 2.9570418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:02,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43910 samples/s/p 5:30:38 } +2024-07-25 19:37:05,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1139/ 1625], loss: 1.414, per_step_time: 1472ms, lr: 2.9568911e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:05,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43460 samples/s/p 5:30:52 } +2024-07-25 19:37:08,397 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1141/ 1625], loss: 1.430, per_step_time: 1472ms, lr: 2.9567402e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:08,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43316 samples/s/p 5:30:54 } +2024-07-25 19:37:11,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1143/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 2.9565892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:11,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43433 samples/s/p 5:30:47 } +2024-07-25 19:37:14,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1145/ 1625], loss: 1.254, per_step_time: 1469ms, lr: 2.9564375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:14,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.44293 samples/s/p 5:30:12 } +2024-07-25 19:37:17,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1147/ 1625], loss: 1.299, per_step_time: 1471ms, lr: 2.956286e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:17,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43508 samples/s/p 5:30:38 } +2024-07-25 19:37:20,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1149/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 2.9561339e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:20,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.42849 samples/s/p 5:30:59 } +2024-07-25 19:37:23,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1151/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 2.9559818e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:37:23,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43430 samples/s/p 5:30:35 } +2024-07-25 19:37:26,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1153/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 2.9558292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:26,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.42922 samples/s/p 5:30:51 } +2024-07-25 19:37:29,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1155/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 2.9556764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:29,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43530 samples/s/p 5:30:25 } +2024-07-25 19:37:32,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1157/ 1625], loss: 1.392, per_step_time: 1473ms, lr: 2.9555236e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:32,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43011 samples/s/p 5:30:41 } +2024-07-25 19:37:34,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1159/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 2.9553703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:34,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43639 samples/s/p 5:30:16 } +2024-07-25 19:37:37,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1161/ 1625], loss: 1.114, per_step_time: 1473ms, lr: 2.955217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:37,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.42884 samples/s/p 5:30:40 } +2024-07-25 19:37:40,861 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1163/ 1625], loss: 1.184, per_step_time: 1469ms, lr: 2.9550632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:40,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.44253 samples/s/p 5:29:47 } +2024-07-25 19:37:43,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1165/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 2.954909e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:43,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.42862 samples/s/p 5:30:35 } +2024-07-25 19:37:46,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1167/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 2.954755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:46,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43498 samples/s/p 5:30:09 } +2024-07-25 19:37:49,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1169/ 1625], loss: 1.284, per_step_time: 1471ms, lr: 2.9546003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:49,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43545 samples/s/p 5:30:04 } +2024-07-25 19:37:52,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1171/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 2.9544455e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:52,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43424 samples/s/p 5:30:06 } +2024-07-25 19:37:55,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1173/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 2.9542905e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:37:55,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43344 samples/s/p 5:30:06 } +2024-07-25 19:37:58,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1175/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 2.954135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:58,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43399 samples/s/p 5:30:01 } +2024-07-25 19:37:58,573 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-25 19:38:34,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1177/ 1625], loss: 1.273, per_step_time: 2748ms, lr: 2.9539795e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:34,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 2.91021 samples/s/p 10:16:07 } +2024-07-25 19:38:37,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1179/ 1625], loss: 1.146, per_step_time: 1478ms, lr: 2.9538238e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:37,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.41166 samples/s/p 5:31:17 } +2024-07-25 19:38:40,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1181/ 1625], loss: 1.283, per_step_time: 1472ms, lr: 2.9536677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:40,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43152 samples/s/p 5:30:01 } +2024-07-25 19:38:43,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1183/ 1625], loss: 1.303, per_step_time: 1474ms, lr: 2.9535113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:43,063 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.42394 samples/s/p 5:30:26 } +2024-07-25 19:38:46,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1185/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 2.9533547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:46,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43173 samples/s/p 5:29:54 } +2024-07-25 19:38:48,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1187/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 2.9531979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:48,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43280 samples/s/p 5:29:47 } +2024-07-25 19:38:51,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1189/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.9530409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:51,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43815 samples/s/p 5:29:25 } +2024-07-25 19:38:54,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1191/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 2.9528832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:54,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43734 samples/s/p 5:29:25 } +2024-07-25 19:38:57,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1193/ 1625], loss: 1.278, per_step_time: 1473ms, lr: 2.9527255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:57,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.42748 samples/s/p 5:29:58 } +2024-07-25 19:39:00,775 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 2/ 10], step:[ 1195/ 1625], loss: 1.164, per_step_time: 1473ms, lr: 2.952568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:00,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.42927 samples/s/p 5:29:49 } +2024-07-25 19:39:03,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1197/ 1625], loss: 1.303, per_step_time: 1473ms, lr: 2.9524095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:03,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.43078 samples/s/p 5:29:40 } +2024-07-25 19:39:06,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1199/ 1625], loss: 1.061, per_step_time: 1473ms, lr: 2.9522513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:06,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.43098 samples/s/p 5:29:36 } +2024-07-25 19:39:09,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1201/ 1625], loss: 1.146, per_step_time: 1475ms, lr: 2.9520925e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:09,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.42274 samples/s/p 5:30:03 } +2024-07-25 19:39:12,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1203/ 1625], loss: 1.131, per_step_time: 1470ms, lr: 2.9519335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:12,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.44118 samples/s/p 5:28:53 } +2024-07-25 19:39:15,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1205/ 1625], loss: 1.057, per_step_time: 1473ms, lr: 2.9517743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:15,541 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.42892 samples/s/p 5:29:35 } +2024-07-25 19:39:18,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1207/ 1625], loss: 1.056, per_step_time: 1474ms, lr: 2.951615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:18,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.42616 samples/s/p 5:29:42 } +2024-07-25 19:39:21,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1209/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.9514551e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:21,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.43127 samples/s/p 5:29:21 } +2024-07-25 19:39:24,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1211/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.9512954e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:24,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43787 samples/s/p 5:28:54 } +2024-07-25 19:39:27,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1213/ 1625], loss: 1.049, per_step_time: 1472ms, lr: 2.951135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:27,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43312 samples/s/p 5:29:08 } +2024-07-25 19:39:30,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1215/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 2.9509745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:30,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43921 samples/s/p 5:28:43 } +2024-07-25 19:39:33,254 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 1217/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.9508139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:33,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43439 samples/s/p 5:28:57 } +2024-07-25 19:39:36,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1219/ 1625], loss: 1.112, per_step_time: 1474ms, lr: 2.950653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:36,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.42669 samples/s/p 5:29:23 } +2024-07-25 19:39:39,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1221/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 2.9504916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:39,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.42787 samples/s/p 5:29:15 } +2024-07-25 19:39:42,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1223/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 2.95033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:42,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43121 samples/s/p 5:29:00 } +2024-07-25 19:39:45,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1225/ 1625], loss: 1.107, per_step_time: 1474ms, lr: 2.9501683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:45,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.42602 samples/s/p 5:29:16 } +2024-07-25 19:39:48,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1227/ 1625], loss: 1.176, per_step_time: 1475ms, lr: 2.9500063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:48,032 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.42312 samples/s/p 5:29:24 } +2024-07-25 19:39:50,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1229/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.9498437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:50,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.43176 samples/s/p 5:28:49 } +2024-07-25 19:39:53,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1231/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.9496812e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:53,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.43115 samples/s/p 5:28:49 } +2024-07-25 19:39:56,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1233/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.9495186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:56,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.43393 samples/s/p 5:28:36 } +2024-07-25 19:39:59,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1235/ 1625], loss: 1.037, per_step_time: 1473ms, lr: 2.9493556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:59,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.42853 samples/s/p 5:28:52 } +2024-07-25 19:40:02,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1237/ 1625], loss: 1.073, per_step_time: 1474ms, lr: 2.9491921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:02,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.42694 samples/s/p 5:28:55 } +2024-07-25 19:40:05,783 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 2/ 10], step:[ 1239/ 1625], loss: 1.031, per_step_time: 1487ms, lr: 2.9490286e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:05,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.37774 samples/s/p 5:31:53 } +2024-07-25 19:40:08,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1241/ 1625], loss: 1.136, per_step_time: 1474ms, lr: 2.9488647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:08,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.42624 samples/s/p 5:28:52 } +2024-07-25 19:40:11,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1243/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 2.9487004e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:11,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.43693 samples/s/p 5:28:10 } +2024-07-25 19:40:14,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1245/ 1625], loss: 1.206, per_step_time: 1474ms, lr: 2.9485363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:14,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42427 samples/s/p 5:28:53 } +2024-07-25 19:40:17,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1247/ 1625], loss: 1.194, per_step_time: 1476ms, lr: 2.9483715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:17,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.41816 samples/s/p 5:29:12 } +2024-07-25 19:40:20,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1249/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 2.9482066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:20,558 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.43661 samples/s/p 5:28:02 } +2024-07-25 19:40:23,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1251/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 2.9480416e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:23,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.43549 samples/s/p 5:28:03 } +2024-07-25 19:40:26,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1253/ 1625], loss: 1.152, per_step_time: 1474ms, lr: 2.9478762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:26,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42565 samples/s/p 5:28:36 } +2024-07-25 19:40:29,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1255/ 1625], loss: 1.260, per_step_time: 1474ms, lr: 2.9477103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:29,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42409 samples/s/p 5:28:39 } +2024-07-25 19:40:32,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1257/ 1625], loss: 1.254, per_step_time: 1473ms, lr: 2.9475446e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:32,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42809 samples/s/p 5:28:21 } +2024-07-25 19:40:35,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1259/ 1625], loss: 1.303, per_step_time: 1472ms, lr: 2.9473786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:35,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.43258 samples/s/p 5:28:02 } +2024-07-25 19:40:38,283 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 2/ 10], step:[ 1261/ 1625], loss: 1.050, per_step_time: 1473ms, lr: 2.947212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:38,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43039 samples/s/p 5:28:07 } +2024-07-25 19:40:41,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1263/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 2.9470451e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:41,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43671 samples/s/p 5:27:41 } +2024-07-25 19:40:44,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1265/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 2.9468785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:44,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43621 samples/s/p 5:27:40 } +2024-07-25 19:40:47,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1267/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.9467114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:47,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43580 samples/s/p 5:27:39 } +2024-07-25 19:40:50,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1269/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.9465436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:50,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43256 samples/s/p 5:27:48 } +2024-07-25 19:40:53,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1271/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.9463761e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:53,041 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43182 samples/s/p 5:27:47 } +2024-07-25 19:40:55,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1273/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.9462082e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:55,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43766 samples/s/p 5:27:23 } +2024-07-25 19:40:58,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1275/ 1625], loss: 1.209, per_step_time: 1475ms, lr: 2.94604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:58,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.42328 samples/s/p 5:28:12 } +2024-07-25 19:41:01,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1277/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 2.9458712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:01,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.44033 samples/s/p 5:27:08 } +2024-07-25 19:41:04,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1279/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.9457025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:04,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43307 samples/s/p 5:27:31 } +2024-07-25 19:41:07,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1281/ 1625], loss: 1.315, per_step_time: 1474ms, lr: 2.9455336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:07,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.42582 samples/s/p 5:27:54 } +2024-07-25 19:41:10,759 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 1283/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 2.9453642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:10,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43222 samples/s/p 5:27:28 } +2024-07-25 19:41:13,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1285/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 2.9451949e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:13,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43911 samples/s/p 5:27:00 } +2024-07-25 19:41:16,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1287/ 1625], loss: 1.305, per_step_time: 1470ms, lr: 2.945025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:16,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43880 samples/s/p 5:26:59 } +2024-07-25 19:41:19,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1289/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 2.944855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:19,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43097 samples/s/p 5:27:24 } +2024-07-25 19:41:22,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1291/ 1625], loss: 1.329, per_step_time: 1470ms, lr: 2.9446848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:22,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.44186 samples/s/p 5:26:42 } +2024-07-25 19:41:25,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1293/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 2.9445142e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:25,511 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.43121 samples/s/p 5:27:17 } +2024-07-25 19:41:28,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1295/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.9443434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:28,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.43507 samples/s/p 5:27:00 } +2024-07-25 19:41:31,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1297/ 1625], loss: 1.246, per_step_time: 1473ms, lr: 2.9441722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:31,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.42865 samples/s/p 5:27:20 } +2024-07-25 19:41:34,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1299/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 2.9440009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:34,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.43400 samples/s/p 5:26:58 } +2024-07-25 19:41:37,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1301/ 1625], loss: 1.187, per_step_time: 1470ms, lr: 2.9438293e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:37,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.43924 samples/s/p 5:26:36 } +2024-07-25 19:41:40,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1303/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.9436576e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:40,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.42795 samples/s/p 5:27:14 } +2024-07-25 19:41:43,222 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1305/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.9434856e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:43,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.43771 samples/s/p 5:26:36 } +2024-07-25 19:41:46,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1307/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 2.943313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:46,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.43593 samples/s/p 5:26:39 } +2024-07-25 19:41:49,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1309/ 1625], loss: 1.163, per_step_time: 1469ms, lr: 2.9431405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:49,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.44219 samples/s/p 5:26:14 } +2024-07-25 19:41:52,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1311/ 1625], loss: 1.217, per_step_time: 1469ms, lr: 2.9429677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:52,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.44386 samples/s/p 5:26:05 } +2024-07-25 19:41:55,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1313/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 2.9427943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:55,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43497 samples/s/p 5:26:34 } +2024-07-25 19:41:57,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1315/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 2.9426212e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:41:57,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43466 samples/s/p 5:26:32 } +2024-07-25 19:42:00,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1317/ 1625], loss: 1.212, per_step_time: 1473ms, lr: 2.9424475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:00,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.42970 samples/s/p 5:26:47 } +2024-07-25 19:42:03,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1319/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 2.9422736e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:03,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43874 samples/s/p 5:26:12 } +2024-07-25 19:42:06,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1321/ 1625], loss: 1.306, per_step_time: 1472ms, lr: 2.9420993e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:06,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43239 samples/s/p 5:26:32 } +2024-07-25 19:42:09,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1323/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 2.941925e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:09,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43130 samples/s/p 5:26:33 } +2024-07-25 19:42:12,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1325/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 2.9417504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:12,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43514 samples/s/p 5:26:16 } +2024-07-25 19:42:15,682 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1327/ 1625], loss: 1.301, per_step_time: 1473ms, lr: 2.9415754e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:15,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43040 samples/s/p 5:26:30 } +2024-07-25 19:42:18,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1329/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 2.9414003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:18,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43793 samples/s/p 5:26:00 } +2024-07-25 19:42:21,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1331/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 2.941225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:21,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43857 samples/s/p 5:25:55 } +2024-07-25 19:42:24,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1333/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.941049e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:24,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43154 samples/s/p 5:26:17 } +2024-07-25 19:42:27,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1335/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.9408731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:27,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43203 samples/s/p 5:26:12 } +2024-07-25 19:42:30,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1337/ 1625], loss: 1.186, per_step_time: 1480ms, lr: 2.940697e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:42:30,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.40320 samples/s/p 5:27:54 } +2024-07-25 19:42:33,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1339/ 1625], loss: 1.294, per_step_time: 1472ms, lr: 2.9405206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:33,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43336 samples/s/p 5:26:02 } +2024-07-25 19:42:36,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1341/ 1625], loss: 1.054, per_step_time: 1472ms, lr: 2.9403436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:36,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.43470 samples/s/p 5:25:54 } +2024-07-25 19:42:39,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1343/ 1625], loss: 1.110, per_step_time: 1474ms, lr: 2.9401668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:39,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.42595 samples/s/p 5:26:22 } +2024-07-25 19:42:42,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1345/ 1625], loss: 1.262, per_step_time: 1473ms, lr: 2.9399896e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:42,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.43018 samples/s/p 5:26:04 } +2024-07-25 19:42:45,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1347/ 1625], loss: 1.154, per_step_time: 1477ms, lr: 2.939812e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:45,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.41492 samples/s/p 5:26:56 } +2024-07-25 19:42:48,182 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1349/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 2.9396344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:48,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.43284 samples/s/p 5:25:49 } +2024-07-25 19:42:51,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1351/ 1625], loss: 1.387, per_step_time: 1474ms, lr: 2.9394563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:51,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.42691 samples/s/p 5:26:07 } +2024-07-25 19:42:54,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1353/ 1625], loss: 1.204, per_step_time: 1474ms, lr: 2.939278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:54,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.42586 samples/s/p 5:26:08 } +2024-07-25 19:42:57,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1355/ 1625], loss: 1.093, per_step_time: 1473ms, lr: 2.9390996e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:57,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.43041 samples/s/p 5:25:49 } +2024-07-25 19:42:59,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1357/ 1625], loss: 1.159, per_step_time: 1469ms, lr: 2.9389208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:59,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.44425 samples/s/p 5:24:56 } +2024-07-25 19:43:02,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1359/ 1625], loss: 1.142, per_step_time: 1473ms, lr: 2.9387418e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:43:02,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.42746 samples/s/p 5:25:53 } +2024-07-25 19:43:05,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1361/ 1625], loss: 1.349, per_step_time: 1472ms, lr: 2.9385625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:05,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43253 samples/s/p 5:25:32 } +2024-07-25 19:43:08,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1363/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.938383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:08,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43522 samples/s/p 5:25:20 } +2024-07-25 19:43:11,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1365/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 2.938203e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:11,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43579 samples/s/p 5:25:15 } +2024-07-25 19:43:14,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1367/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.9380231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:14,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43105 samples/s/p 5:25:29 } +2024-07-25 19:43:17,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1369/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 2.9378429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:17,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43371 samples/s/p 5:25:16 } +2024-07-25 19:43:20,663 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1371/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.9376622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:20,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43118 samples/s/p 5:25:22 } +2024-07-25 19:43:23,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1373/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 2.9374814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:23,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43322 samples/s/p 5:25:12 } +2024-07-25 19:43:26,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1375/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 2.9373005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:26,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43376 samples/s/p 5:25:07 } +2024-07-25 19:43:29,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1377/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.937119e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:29,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43193 samples/s/p 5:25:11 } +2024-07-25 19:43:32,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1379/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 2.9369374e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:32,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43380 samples/s/p 5:25:01 } +2024-07-25 19:43:35,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1381/ 1625], loss: 1.282, per_step_time: 1474ms, lr: 2.9367557e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:43:35,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.42589 samples/s/p 5:25:27 } +2024-07-25 19:43:38,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1383/ 1625], loss: 1.317, per_step_time: 1473ms, lr: 2.9365734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:38,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.42884 samples/s/p 5:25:13 } +2024-07-25 19:43:41,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1385/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 2.9363911e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:41,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43658 samples/s/p 5:24:42 } +2024-07-25 19:43:44,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1387/ 1625], loss: 1.227, per_step_time: 1473ms, lr: 2.9362083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:44,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43090 samples/s/p 5:25:00 } +2024-07-25 19:43:47,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1389/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.9360255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:47,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43825 samples/s/p 5:24:30 } +2024-07-25 19:43:50,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1391/ 1625], loss: 1.398, per_step_time: 1473ms, lr: 2.9358425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:50,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.43061 samples/s/p 5:24:55 } +2024-07-25 19:43:53,149 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1393/ 1625], loss: 1.107, per_step_time: 1477ms, lr: 2.9356592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:53,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.41614 samples/s/p 5:25:44 } +2024-07-25 19:43:56,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1395/ 1625], loss: 1.090, per_step_time: 1473ms, lr: 2.9354755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:56,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.42933 samples/s/p 5:24:54 } +2024-07-25 19:43:59,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1397/ 1625], loss: 1.022, per_step_time: 1473ms, lr: 2.9352916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:59,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.42987 samples/s/p 5:24:49 } +2024-07-25 19:44:02,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1399/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 2.9351077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:02,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.43144 samples/s/p 5:24:40 } +2024-07-25 19:44:04,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1401/ 1625], loss: 1.078, per_step_time: 1476ms, lr: 2.934923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:04,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.41755 samples/s/p 5:25:27 } +2024-07-25 19:44:07,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1403/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.9347384e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:44:07,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.43645 samples/s/p 5:24:16 } +2024-07-25 19:44:10,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1405/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 2.9345534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:10,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.42969 samples/s/p 5:24:38 } +2024-07-25 19:44:13,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1407/ 1625], loss: 1.194, per_step_time: 1474ms, lr: 2.9343682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:13,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.42730 samples/s/p 5:24:43 } +2024-07-25 19:44:16,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1409/ 1625], loss: 1.185, per_step_time: 1469ms, lr: 2.9341829e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:16,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.44299 samples/s/p 5:23:44 } +2024-07-25 19:44:19,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1411/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.9339972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:19,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.43656 samples/s/p 5:24:04 } +2024-07-25 19:44:22,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1413/ 1625], loss: 1.118, per_step_time: 1475ms, lr: 2.9338113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:22,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.42241 samples/s/p 5:24:52 } +2024-07-25 19:44:25,642 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1415/ 1625], loss: 1.077, per_step_time: 1474ms, lr: 2.9336252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:25,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.42586 samples/s/p 5:24:37 } +2024-07-25 19:44:28,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1417/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 2.9334386e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:28,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.43308 samples/s/p 5:24:08 } +2024-07-25 19:44:31,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1419/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.933252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:31,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.43011 samples/s/p 5:24:15 } +2024-07-25 19:44:34,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1421/ 1625], loss: 1.141, per_step_time: 1473ms, lr: 2.9330648e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:34,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.42808 samples/s/p 5:24:20 } +2024-07-25 19:44:37,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1423/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.9328778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:37,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43309 samples/s/p 5:23:59 } +2024-07-25 19:44:40,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1425/ 1625], loss: 1.198, per_step_time: 1473ms, lr: 2.9326904e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:44:40,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43033 samples/s/p 5:24:06 } +2024-07-25 19:44:43,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1427/ 1625], loss: 0.987, per_step_time: 1471ms, lr: 2.9325025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:43,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43498 samples/s/p 5:23:46 } +2024-07-25 19:44:46,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1429/ 1625], loss: 1.048, per_step_time: 1474ms, lr: 2.9323146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:46,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.42480 samples/s/p 5:24:20 } +2024-07-25 19:44:49,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1431/ 1625], loss: 1.013, per_step_time: 1471ms, lr: 2.9321263e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:49,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43726 samples/s/p 5:23:32 } +2024-07-25 19:44:52,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1433/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 2.9319379e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:52,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43602 samples/s/p 5:23:34 } +2024-07-25 19:44:55,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1435/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.931749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:55,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43843 samples/s/p 5:23:22 } +2024-07-25 19:44:58,118 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1437/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 2.9315599e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:58,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43552 samples/s/p 5:23:30 } +2024-07-25 19:45:01,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1439/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.931371e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:01,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43737 samples/s/p 5:23:20 } +2024-07-25 19:45:04,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1441/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 2.9311814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:04,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.42970 samples/s/p 5:23:45 } +2024-07-25 19:45:06,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1443/ 1625], loss: 1.247, per_step_time: 1475ms, lr: 2.9309916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:06,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.42064 samples/s/p 5:24:14 } +2024-07-25 19:45:09,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1445/ 1625], loss: 1.239, per_step_time: 1472ms, lr: 2.9308016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:09,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43388 samples/s/p 5:23:24 } +2024-07-25 19:45:12,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1447/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 2.9306113e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:45:12,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43524 samples/s/p 5:23:16 } +2024-07-25 19:45:15,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1449/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 2.9304209e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:15,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43366 samples/s/p 5:23:19 } +2024-07-25 19:45:18,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1451/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.93023e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:18,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43679 samples/s/p 5:23:04 } +2024-07-25 19:45:21,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1453/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.930039e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:21,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43204 samples/s/p 5:23:18 } +2024-07-25 19:45:24,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1455/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 2.9298477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:24,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.43437 samples/s/p 5:23:07 } +2024-07-25 19:45:27,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1457/ 1625], loss: 1.217, per_step_time: 1474ms, lr: 2.9296561e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:27,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.42409 samples/s/p 5:23:41 } +2024-07-25 19:45:30,594 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1459/ 1625], loss: 1.265, per_step_time: 1470ms, lr: 2.9294642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:30,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.44065 samples/s/p 5:22:39 } +2024-07-25 19:45:33,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1461/ 1625], loss: 1.182, per_step_time: 1474ms, lr: 2.9292723e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:33,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.42536 samples/s/p 5:23:31 } +2024-07-25 19:45:36,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1463/ 1625], loss: 1.388, per_step_time: 1475ms, lr: 2.9290799e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:36,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.42304 samples/s/p 5:23:36 } +2024-07-25 19:45:39,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1465/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 2.9288873e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:39,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.43004 samples/s/p 5:23:08 } +2024-07-25 19:45:42,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1467/ 1625], loss: 1.293, per_step_time: 1471ms, lr: 2.9286944e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:42,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.43744 samples/s/p 5:22:39 } +2024-07-25 19:45:45,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1469/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.9285015e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:45:45,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.43358 samples/s/p 5:22:49 } +2024-07-25 19:45:48,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1471/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 2.9283083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:48,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43487 samples/s/p 5:22:42 } +2024-07-25 19:45:51,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1473/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 2.9281146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:51,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43997 samples/s/p 5:22:21 } +2024-07-25 19:45:54,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1475/ 1625], loss: 1.410, per_step_time: 1472ms, lr: 2.9279207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:54,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43458 samples/s/p 5:22:37 } +2024-07-25 19:45:57,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1477/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 2.9277267e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:57,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43168 samples/s/p 5:22:44 } +2024-07-25 19:46:00,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1479/ 1625], loss: 1.365, per_step_time: 1473ms, lr: 2.9275321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:00,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43088 samples/s/p 5:22:44 } +2024-07-25 19:46:03,074 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1481/ 1625], loss: 1.300, per_step_time: 1472ms, lr: 2.9273377e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:03,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43273 samples/s/p 5:22:35 } +2024-07-25 19:46:06,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1483/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 2.9271429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:06,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43753 samples/s/p 5:22:15 } +2024-07-25 19:46:08,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1485/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.9269479e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:08,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43187 samples/s/p 5:22:32 } +2024-07-25 19:46:11,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1487/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 2.9267525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:11,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43794 samples/s/p 5:22:07 } +2024-07-25 19:46:14,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1489/ 1625], loss: 1.286, per_step_time: 1473ms, lr: 2.9265568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:14,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.42785 samples/s/p 5:22:40 } +2024-07-25 19:46:17,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1491/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.9263609e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:46:17,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43603 samples/s/p 5:22:08 } +2024-07-25 19:46:20,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1493/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 2.926165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:20,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43377 samples/s/p 5:22:13 } +2024-07-25 19:46:23,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1495/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 2.9259685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:23,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.42744 samples/s/p 5:22:33 } +2024-07-25 19:46:26,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1497/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.9257719e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:26,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.42946 samples/s/p 5:22:23 } +2024-07-25 19:46:29,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1499/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 2.9255749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:29,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43370 samples/s/p 5:22:05 } +2024-07-25 19:46:32,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1501/ 1625], loss: 1.293, per_step_time: 1472ms, lr: 2.9253777e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:32,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43204 samples/s/p 5:22:08 } +2024-07-25 19:46:35,548 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1503/ 1625], loss: 1.238, per_step_time: 1470ms, lr: 2.9251803e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:35,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43983 samples/s/p 5:21:37 } +2024-07-25 19:46:38,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1505/ 1625], loss: 1.197, per_step_time: 1475ms, lr: 2.9249826e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:38,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.42348 samples/s/p 5:22:32 } +2024-07-25 19:46:41,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1507/ 1625], loss: 0.925, per_step_time: 1474ms, lr: 2.9247849e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:41,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.42559 samples/s/p 5:22:22 } +2024-07-25 19:46:44,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1509/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 2.9245868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:44,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.43839 samples/s/p 5:21:33 } +2024-07-25 19:46:47,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1511/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 2.9243884e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:47,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.42865 samples/s/p 5:22:05 } +2024-07-25 19:46:50,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1513/ 1625], loss: 1.069, per_step_time: 1473ms, lr: 2.9241895e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:46:50,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.42889 samples/s/p 5:22:01 } +2024-07-25 19:46:53,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1515/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 2.9239907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:53,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.43203 samples/s/p 5:21:47 } +2024-07-25 19:46:56,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1517/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 2.9237914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:56,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.43627 samples/s/p 5:21:29 } +2024-07-25 19:46:59,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1519/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 2.923592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:59,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.43447 samples/s/p 5:21:33 } +2024-07-25 19:47:02,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1521/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.9233923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:02,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43438 samples/s/p 5:21:30 } +2024-07-25 19:47:05,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1523/ 1625], loss: 1.392, per_step_time: 1470ms, lr: 2.9231926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:05,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43849 samples/s/p 5:21:12 } +2024-07-25 19:47:08,027 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1525/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.9229921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:08,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43261 samples/s/p 5:21:30 } +2024-07-25 19:47:10,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1527/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.9227918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:10,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43732 samples/s/p 5:21:11 } +2024-07-25 19:47:13,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1529/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 2.922591e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:13,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43636 samples/s/p 5:21:11 } +2024-07-25 19:47:16,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1531/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 2.92239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:16,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43807 samples/s/p 5:21:02 } +2024-07-25 19:47:19,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1533/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 2.922189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:19,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43017 samples/s/p 5:21:27 } +2024-07-25 19:47:22,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1535/ 1625], loss: 1.117, per_step_time: 1473ms, lr: 2.9219877e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:47:22,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.42945 samples/s/p 5:21:27 } +2024-07-25 19:47:25,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1537/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 2.9217857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:25,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.42890 samples/s/p 5:21:26 } +2024-07-25 19:47:28,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1539/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 2.9215838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:28,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.43544 samples/s/p 5:21:00 } +2024-07-25 19:47:31,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1541/ 1625], loss: 1.073, per_step_time: 1473ms, lr: 2.9213817e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:31,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.42945 samples/s/p 5:21:18 } +2024-07-25 19:47:34,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1543/ 1625], loss: 1.185, per_step_time: 1473ms, lr: 2.9211793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:34,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.42973 samples/s/p 5:21:14 } +2024-07-25 19:47:37,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1545/ 1625], loss: 1.310, per_step_time: 1471ms, lr: 2.9209765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:37,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.43667 samples/s/p 5:20:47 } +2024-07-25 19:47:40,504 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1547/ 1625], loss: 1.248, per_step_time: 1473ms, lr: 2.9207737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:40,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.42783 samples/s/p 5:21:15 } +2024-07-25 19:47:43,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1549/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 2.9205703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:43,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.43111 samples/s/p 5:21:00 } +2024-07-25 19:47:46,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1551/ 1625], loss: 1.156, per_step_time: 1473ms, lr: 2.9203668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:46,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.42772 samples/s/p 5:21:09 } +2024-07-25 19:47:49,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1553/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 2.920163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:49,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.42801 samples/s/p 5:21:06 } +2024-07-25 19:47:52,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1555/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 2.9199591e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:52,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43121 samples/s/p 5:20:51 } +2024-07-25 19:47:55,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1557/ 1625], loss: 1.030, per_step_time: 1473ms, lr: 2.9197548e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:47:55,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43042 samples/s/p 5:20:51 } +2024-07-25 19:47:58,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1559/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 2.9195504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:58,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43233 samples/s/p 5:20:41 } +2024-07-25 19:48:01,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1561/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 2.9193456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:01,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43414 samples/s/p 5:20:32 } +2024-07-25 19:48:04,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1563/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 2.9191406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:04,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43710 samples/s/p 5:20:19 } +2024-07-25 19:48:07,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1565/ 1625], loss: 1.333, per_step_time: 1485ms, lr: 2.9189354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:07,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.38389 samples/s/p 5:23:26 } +2024-07-25 19:48:10,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1567/ 1625], loss: 1.139, per_step_time: 1470ms, lr: 2.9187298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:10,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43969 samples/s/p 5:20:04 } +2024-07-25 19:48:13,005 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1569/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 2.9185241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:13,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.44107 samples/s/p 5:19:56 } +2024-07-25 19:48:15,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1571/ 1625], loss: 1.175, per_step_time: 1473ms, lr: 2.9183184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:15,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.42916 samples/s/p 5:20:35 } +2024-07-25 19:48:18,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1573/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 2.918112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:18,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43869 samples/s/p 5:19:58 } +2024-07-25 19:48:21,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1575/ 1625], loss: 1.258, per_step_time: 1471ms, lr: 2.9179055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:21,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43580 samples/s/p 5:20:05 } +2024-07-25 19:48:24,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1577/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.9176985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:24,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43174 samples/s/p 5:20:17 } +2024-07-25 19:48:27,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1579/ 1625], loss: 1.100, per_step_time: 1478ms, lr: 2.9174918e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:48:27,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.41092 samples/s/p 5:21:28 } +2024-07-25 19:48:30,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1581/ 1625], loss: 1.237, per_step_time: 1475ms, lr: 2.9172843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:30,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.42240 samples/s/p 5:20:44 } +2024-07-25 19:48:33,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1583/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 2.917077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:33,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43369 samples/s/p 5:20:01 } +2024-07-25 19:48:36,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1585/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 2.9168692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:36,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.42830 samples/s/p 5:20:17 } +2024-07-25 19:48:39,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1587/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 2.9166611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:39,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43890 samples/s/p 5:19:37 } +2024-07-25 19:48:42,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1589/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 2.916453e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:42,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43268 samples/s/p 5:19:56 } +2024-07-25 19:48:45,492 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1591/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 2.9162444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:45,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43547 samples/s/p 5:19:43 } +2024-07-25 19:48:48,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1593/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 2.9160356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:48,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43285 samples/s/p 5:19:49 } +2024-07-25 19:48:51,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1595/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 2.9158266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:51,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.44045 samples/s/p 5:19:20 } +2024-07-25 19:48:54,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1597/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 2.915617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:54,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43414 samples/s/p 5:19:39 } +2024-07-25 19:48:57,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1599/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 2.9154075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:57,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43623 samples/s/p 5:19:29 } +2024-07-25 19:49:00,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1601/ 1625], loss: 1.158, per_step_time: 1474ms, lr: 2.9151977e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:49:00,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.42527 samples/s/p 5:20:04 } +2024-07-25 19:49:03,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1603/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 2.9149878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:03,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43385 samples/s/p 5:19:31 } +2024-07-25 19:49:06,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1605/ 1625], loss: 1.285, per_step_time: 1472ms, lr: 2.9147775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:06,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43144 samples/s/p 5:19:37 } +2024-07-25 19:49:09,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1607/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.9145669e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:09,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43241 samples/s/p 5:19:30 } +2024-07-25 19:49:12,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1609/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 2.914356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:12,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.42762 samples/s/p 5:19:44 } +2024-07-25 19:49:15,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1611/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 2.914145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:15,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43479 samples/s/p 5:19:16 } +2024-07-25 19:49:17,970 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1613/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 2.9139337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:17,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43115 samples/s/p 5:19:26 } +2024-07-25 19:49:20,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1615/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 2.9137222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:20,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43663 samples/s/p 5:19:04 } +2024-07-25 19:49:23,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1617/ 1625], loss: 1.109, per_step_time: 1470ms, lr: 2.9135103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:23,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.44208 samples/s/p 5:18:42 } +2024-07-25 19:49:26,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1619/ 1625], loss: 1.271, per_step_time: 1473ms, lr: 2.9132983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:26,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.42829 samples/s/p 5:19:27 } +2024-07-25 19:49:29,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1621/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 2.913086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:29,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.43914 samples/s/p 5:18:46 } +2024-07-25 19:49:32,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1623/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.9128734e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:49:32,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.43407 samples/s/p 5:19:01 } +2024-07-25 19:49:35,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1625/ 1625], loss: 1.216, per_step_time: 1474ms, lr: 2.9126608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:35,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.42582 samples/s/p 5:19:27 } +2024-07-25 19:49:38,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 2/ 1625], loss: 1.136, per_step_time: 1475ms, lr: 2.9124476e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:38,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.42146 samples/s/p 5:19:40 } +2024-07-25 19:49:41,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 4/ 1625], loss: 1.202, per_step_time: 1472ms, lr: 2.9122342e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:41,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.43136 samples/s/p 5:19:02 } +2024-07-25 19:49:44,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 6/ 1625], loss: 1.088, per_step_time: 1473ms, lr: 2.9120209e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:44,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.42975 samples/s/p 5:19:04 } +2024-07-25 19:49:47,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 8/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 2.911807e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:47,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.43157 samples/s/p 5:18:55 } +2024-07-25 19:49:50,450 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 10/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 2.911593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:50,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43167 samples/s/p 5:18:52 } +2024-07-25 19:49:53,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 12/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.9113786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:53,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43382 samples/s/p 5:18:41 } +2024-07-25 19:49:56,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 14/ 1625], loss: 1.333, per_step_time: 1470ms, lr: 2.911164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:56,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43848 samples/s/p 5:18:22 } +2024-07-25 19:49:59,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 16/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 2.9109493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:59,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.42916 samples/s/p 5:18:52 } +2024-07-25 19:50:02,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 18/ 1625], loss: 1.293, per_step_time: 1471ms, lr: 2.9107341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:02,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43818 samples/s/p 5:18:17 } +2024-07-25 19:50:05,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 20/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 2.910519e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:50:05,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43425 samples/s/p 5:18:28 } +2024-07-25 19:50:08,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 22/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.9103032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:08,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.42764 samples/s/p 5:18:48 } +2024-07-25 19:50:11,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 24/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 2.9100875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:11,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43572 samples/s/p 5:18:17 } +2024-07-25 19:50:14,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 26/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 2.9098714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:14,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43310 samples/s/p 5:18:23 } +2024-07-25 19:50:17,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 28/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.9096549e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:17,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43819 samples/s/p 5:18:02 } +2024-07-25 19:50:19,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 30/ 1625], loss: 1.035, per_step_time: 1472ms, lr: 2.9094384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:19,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43251 samples/s/p 5:18:19 } +2024-07-25 19:50:22,925 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 32/ 1625], loss: 1.245, per_step_time: 1474ms, lr: 2.9092214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:22,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.42379 samples/s/p 5:18:47 } +2024-07-25 19:50:25,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 34/ 1625], loss: 1.247, per_step_time: 1474ms, lr: 2.9090043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:25,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.42574 samples/s/p 5:18:37 } +2024-07-25 19:50:28,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 36/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 2.9087872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:28,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43974 samples/s/p 5:17:45 } +2024-07-25 19:50:31,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 38/ 1625], loss: 1.103, per_step_time: 1471ms, lr: 2.9085697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:31,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43530 samples/s/p 5:17:58 } +2024-07-25 19:50:34,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 40/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.9083518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:34,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43199 samples/s/p 5:18:06 } +2024-07-25 19:50:37,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 42/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 2.9081337e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:50:37,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43429 samples/s/p 5:17:55 } +2024-07-25 19:50:40,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 44/ 1625], loss: 1.047, per_step_time: 1472ms, lr: 2.9079154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:40,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43236 samples/s/p 5:17:59 } +2024-07-25 19:50:43,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 46/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 2.9076968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:43,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.44058 samples/s/p 5:17:27 } +2024-07-25 19:50:46,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 48/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.9074781e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:46,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43161 samples/s/p 5:17:56 } +2024-07-25 19:50:49,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 50/ 1625], loss: 1.345, per_step_time: 1470ms, lr: 2.907259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:49,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.44138 samples/s/p 5:17:19 } +2024-07-25 19:50:52,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 52/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 2.9070396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:52,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43202 samples/s/p 5:17:49 } +2024-07-25 19:50:55,388 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 54/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 2.9068198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:55,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43610 samples/s/p 5:17:31 } +2024-07-25 19:50:58,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 56/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 2.9066001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:58,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43328 samples/s/p 5:17:38 } +2024-07-25 19:51:01,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 58/ 1625], loss: 1.227, per_step_time: 1474ms, lr: 2.9063798e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:01,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.42587 samples/s/p 5:18:01 } +2024-07-25 19:51:04,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 60/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 2.9061597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:04,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43268 samples/s/p 5:17:35 } +2024-07-25 19:51:07,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 62/ 1625], loss: 1.303, per_step_time: 1473ms, lr: 2.9059389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:07,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.42764 samples/s/p 5:17:49 } +2024-07-25 19:51:10,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 64/ 1625], loss: 1.251, per_step_time: 1473ms, lr: 2.9057182e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:51:10,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.42934 samples/s/p 5:17:40 } +2024-07-25 19:51:13,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 66/ 1625], loss: 1.296, per_step_time: 1473ms, lr: 2.905497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:13,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43079 samples/s/p 5:17:32 } +2024-07-25 19:51:16,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 68/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.9052757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:16,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43200 samples/s/p 5:17:25 } +2024-07-25 19:51:19,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 70/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.9050541e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:19,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43527 samples/s/p 5:17:11 } +2024-07-25 19:51:21,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 72/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 2.9048324e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:21,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43267 samples/s/p 5:17:17 } +2024-07-25 19:51:24,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 74/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 2.9046103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:24,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43149 samples/s/p 5:17:18 } +2024-07-25 19:51:27,875 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 76/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.9043878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:27,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43302 samples/s/p 5:17:10 } +2024-07-25 19:51:30,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 78/ 1625], loss: 1.312, per_step_time: 1471ms, lr: 2.9041654e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:30,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43612 samples/s/p 5:16:56 } +2024-07-25 19:51:33,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 80/ 1625], loss: 1.181, per_step_time: 1473ms, lr: 2.9039425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:33,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.42949 samples/s/p 5:17:16 } +2024-07-25 19:51:36,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 82/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 2.9037194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:36,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43098 samples/s/p 5:17:08 } +2024-07-25 19:51:39,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 84/ 1625], loss: 1.167, per_step_time: 1474ms, lr: 2.903496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:39,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.42674 samples/s/p 5:17:20 } +2024-07-25 19:51:42,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 86/ 1625], loss: 1.120, per_step_time: 1475ms, lr: 2.9032724e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:51:42,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.42215 samples/s/p 5:17:33 } +2024-07-25 19:51:45,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 88/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 2.9030487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:45,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43631 samples/s/p 5:16:41 } +2024-07-25 19:51:48,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 90/ 1625], loss: 1.249, per_step_time: 1471ms, lr: 2.9028244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:48,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43481 samples/s/p 5:16:43 } +2024-07-25 19:51:51,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 92/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 2.9026001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:51,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43649 samples/s/p 5:16:34 } +2024-07-25 19:51:54,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 94/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 2.9023757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:54,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43316 samples/s/p 5:16:43 } +2024-07-25 19:51:57,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 96/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 2.9021508e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:57,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43593 samples/s/p 5:16:30 } +2024-07-25 19:52:00,352 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 98/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 2.9019258e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:00,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43715 samples/s/p 5:16:23 } +2024-07-25 19:52:03,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 100/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 2.9017005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:03,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.42860 samples/s/p 5:16:50 } +2024-07-25 19:52:06,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 102/ 1625], loss: 1.056, per_step_time: 1471ms, lr: 2.9014749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:06,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43837 samples/s/p 5:16:13 } +2024-07-25 19:52:09,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 104/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 2.9012492e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:09,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43284 samples/s/p 5:16:29 } +2024-07-25 19:52:12,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 106/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 2.901023e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:12,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.43605 samples/s/p 5:16:15 } +2024-07-25 19:52:15,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 108/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.9007966e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:52:15,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.43542 samples/s/p 5:16:14 } +2024-07-25 19:52:18,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 110/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 2.90057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:18,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.43557 samples/s/p 5:16:11 } +2024-07-25 19:52:21,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 112/ 1625], loss: 1.142, per_step_time: 1473ms, lr: 2.900343e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:21,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.42909 samples/s/p 5:16:31 } +2024-07-25 19:52:23,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 114/ 1625], loss: 1.314, per_step_time: 1473ms, lr: 2.900116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:23,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.43009 samples/s/p 5:16:24 } +2024-07-25 19:52:26,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 116/ 1625], loss: 1.367, per_step_time: 1469ms, lr: 2.8998888e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:26,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.44218 samples/s/p 5:15:39 } +2024-07-25 19:52:29,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 118/ 1625], loss: 1.239, per_step_time: 1472ms, lr: 2.899661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:29,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.43359 samples/s/p 5:16:06 } +2024-07-25 19:52:32,824 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 120/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 2.8994333e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:32,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.42769 samples/s/p 5:16:24 } +2024-07-25 19:52:35,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 122/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 2.8992054e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:35,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43282 samples/s/p 5:16:03 } +2024-07-25 19:52:38,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 124/ 1625], loss: 1.321, per_step_time: 1471ms, lr: 2.898977e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:38,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43786 samples/s/p 5:15:42 } +2024-07-25 19:52:41,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 126/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.8987482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:41,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43234 samples/s/p 5:15:59 } +2024-07-25 19:52:44,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 128/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 2.8985194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:44,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43154 samples/s/p 5:15:58 } +2024-07-25 19:52:47,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 130/ 1625], loss: 1.372, per_step_time: 1473ms, lr: 2.8982906e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:52:47,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43069 samples/s/p 5:15:58 } +2024-07-25 19:52:50,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 132/ 1625], loss: 1.306, per_step_time: 1474ms, lr: 2.8980612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:50,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.42395 samples/s/p 5:16:19 } +2024-07-25 19:52:53,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 134/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 2.8978317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:53,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43063 samples/s/p 5:15:53 } +2024-07-25 19:52:56,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 136/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 2.8976017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:56,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.42937 samples/s/p 5:15:54 } +2024-07-25 19:52:59,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 138/ 1625], loss: 0.990, per_step_time: 1471ms, lr: 2.8973716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:59,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43799 samples/s/p 5:15:21 } +2024-07-25 19:53:02,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 140/ 1625], loss: 1.080, per_step_time: 1472ms, lr: 2.8971413e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:02,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43158 samples/s/p 5:15:41 } +2024-07-25 19:53:05,305 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 142/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 2.8969109e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:05,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43215 samples/s/p 5:15:36 } +2024-07-25 19:53:08,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 144/ 1625], loss: 1.292, per_step_time: 1473ms, lr: 2.89668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:08,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.42995 samples/s/p 5:15:40 } +2024-07-25 19:53:11,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 146/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.8964489e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:11,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43580 samples/s/p 5:15:17 } +2024-07-25 19:53:14,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 148/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 2.8962177e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:14,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43308 samples/s/p 5:15:24 } +2024-07-25 19:53:17,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 150/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.8959861e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:17,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43333 samples/s/p 5:15:20 } +2024-07-25 19:53:20,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 152/ 1625], loss: 1.345, per_step_time: 1473ms, lr: 2.895754e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:53:20,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.42950 samples/s/p 5:15:30 } +2024-07-25 19:53:23,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 154/ 1625], loss: 1.245, per_step_time: 1475ms, lr: 2.895522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:23,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.42226 samples/s/p 5:15:52 } +2024-07-25 19:53:25,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 156/ 1625], loss: 1.165, per_step_time: 1470ms, lr: 2.8952898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:25,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43988 samples/s/p 5:14:48 } +2024-07-25 19:53:28,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 158/ 1625], loss: 1.305, per_step_time: 1473ms, lr: 2.8950573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:28,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43053 samples/s/p 5:15:18 } +2024-07-25 19:53:31,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 160/ 1625], loss: 1.073, per_step_time: 1473ms, lr: 2.8948245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:31,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.42792 samples/s/p 5:15:24 } +2024-07-25 19:53:34,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 162/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 2.8945915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:34,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43726 samples/s/p 5:14:48 } +2024-07-25 19:53:37,786 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 164/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 2.8943581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:37,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43195 samples/s/p 5:15:04 } +2024-07-25 19:53:40,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 166/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 2.8941244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:40,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43643 samples/s/p 5:14:45 } +2024-07-25 19:53:43,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 168/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 2.8938906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:43,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43548 samples/s/p 5:14:46 } +2024-07-25 19:53:46,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 170/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 2.8936567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:46,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43196 samples/s/p 5:14:55 } +2024-07-25 19:53:49,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 172/ 1625], loss: 1.230, per_step_time: 1475ms, lr: 2.8934224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:49,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.42284 samples/s/p 5:15:24 } +2024-07-25 19:53:52,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 174/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 2.893188e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:53:52,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43567 samples/s/p 5:14:36 } +2024-07-25 19:53:55,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 176/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.8929531e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:55,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43455 samples/s/p 5:14:37 } +2024-07-25 19:53:58,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 178/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 2.8927181e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:58,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43323 samples/s/p 5:14:39 } +2024-07-25 19:54:01,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 180/ 1625], loss: 1.014, per_step_time: 1473ms, lr: 2.892483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:01,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.42852 samples/s/p 5:14:52 } +2024-07-25 19:54:04,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 182/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.8922472e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:04,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43012 samples/s/p 5:14:44 } +2024-07-25 19:54:07,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 184/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.8920114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:07,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43392 samples/s/p 5:14:28 } +2024-07-25 19:54:10,265 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 186/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 2.8917755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:10,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43377 samples/s/p 5:14:25 } +2024-07-25 19:54:13,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 188/ 1625], loss: 0.979, per_step_time: 1470ms, lr: 2.8915392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:13,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43989 samples/s/p 5:14:01 } +2024-07-25 19:54:16,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 190/ 1625], loss: 1.189, per_step_time: 1469ms, lr: 2.8913028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:16,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.44220 samples/s/p 5:13:50 } +2024-07-25 19:54:19,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 192/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 2.891066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:19,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43209 samples/s/p 5:14:22 } +2024-07-25 19:54:22,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 194/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 2.890829e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:22,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43610 samples/s/p 5:14:05 } +2024-07-25 19:54:25,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 196/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 2.8905917e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:54:25,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43957 samples/s/p 5:13:50 } +2024-07-25 19:54:27,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 198/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 2.8903542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:27,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43886 samples/s/p 5:13:50 } +2024-07-25 19:54:30,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 200/ 1625], loss: 0.977, per_step_time: 1472ms, lr: 2.8901162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:30,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43427 samples/s/p 5:14:03 } +2024-07-25 19:54:33,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 202/ 1625], loss: 0.911, per_step_time: 1472ms, lr: 2.8898783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:33,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43350 samples/s/p 5:14:03 } +2024-07-25 19:54:36,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 204/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.8896402e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.43139 samples/s/p 5:14:07 } +2024-07-25 19:54:39,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 206/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 2.8894017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:39,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.42800 samples/s/p 5:14:16 } +2024-07-25 19:54:42,723 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 208/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 2.8891629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:42,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.43848 samples/s/p 5:13:37 } +2024-07-25 19:54:45,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 210/ 1625], loss: 1.123, per_step_time: 1474ms, lr: 2.8889239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:45,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.42673 samples/s/p 5:14:14 } +2024-07-25 19:54:48,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 212/ 1625], loss: 1.042, per_step_time: 1471ms, lr: 2.8886847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:48,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.43625 samples/s/p 5:13:38 } +2024-07-25 19:54:51,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 214/ 1625], loss: 1.218, per_step_time: 1474ms, lr: 2.8884451e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:51,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.42538 samples/s/p 5:14:13 } +2024-07-25 19:54:54,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 216/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 2.8882056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:54,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.43629 samples/s/p 5:13:32 } +2024-07-25 19:54:57,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 218/ 1625], loss: 1.330, per_step_time: 1472ms, lr: 2.8879656e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:54:57,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.43382 samples/s/p 5:13:38 } +2024-07-25 19:55:00,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 220/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.8877253e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:00,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.43592 samples/s/p 5:13:28 } +2024-07-25 19:55:03,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 222/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.8874847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:03,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.43316 samples/s/p 5:13:34 } +2024-07-25 19:55:06,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 224/ 1625], loss: 1.312, per_step_time: 1474ms, lr: 2.8872442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:06,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.42722 samples/s/p 5:13:52 } +2024-07-25 19:55:09,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 226/ 1625], loss: 1.336, per_step_time: 1474ms, lr: 2.8870032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:09,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.42586 samples/s/p 5:13:54 } +2024-07-25 19:55:12,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 228/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 2.8867618e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:12,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.43447 samples/s/p 5:13:21 } +2024-07-25 19:55:15,206 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 230/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.8865205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:15,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.43341 samples/s/p 5:13:22 } +2024-07-25 19:55:18,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 232/ 1625], loss: 1.200, per_step_time: 1474ms, lr: 2.8862785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:18,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.42737 samples/s/p 5:13:40 } +2024-07-25 19:55:21,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 234/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 2.8860366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:21,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.42855 samples/s/p 5:13:33 } +2024-07-25 19:55:24,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 236/ 1625], loss: 1.114, per_step_time: 1474ms, lr: 2.8857945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:24,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.42390 samples/s/p 5:13:46 } +2024-07-25 19:55:27,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 238/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.8855518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:27,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43364 samples/s/p 5:13:09 } +2024-07-25 19:55:29,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 240/ 1625], loss: 1.296, per_step_time: 1472ms, lr: 2.8853092e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:55:29,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43241 samples/s/p 5:13:10 } +2024-07-25 19:55:32,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 242/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 2.8850664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:32,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43750 samples/s/p 5:12:50 } +2024-07-25 19:55:35,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 244/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 2.8848232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:35,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43477 samples/s/p 5:12:56 } +2024-07-25 19:55:38,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 246/ 1625], loss: 0.916, per_step_time: 1470ms, lr: 2.8845798e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:38,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43949 samples/s/p 5:12:37 } +2024-07-25 19:55:41,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 248/ 1625], loss: 1.535, per_step_time: 1470ms, lr: 2.884336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:41,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.44078 samples/s/p 5:12:30 } +2024-07-25 19:55:44,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 250/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 2.884092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:44,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43360 samples/s/p 5:12:52 } +2024-07-25 19:55:47,680 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 252/ 1625], loss: 1.169, per_step_time: 1472ms, lr: 2.883848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:47,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43295 samples/s/p 5:12:51 } +2024-07-25 19:55:50,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 254/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 2.8836035e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:50,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43785 samples/s/p 5:12:31 } +2024-07-25 19:55:53,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 256/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 2.8833589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:53,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43827 samples/s/p 5:12:27 } +2024-07-25 19:55:56,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 258/ 1625], loss: 1.371, per_step_time: 1472ms, lr: 2.883114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:56,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43428 samples/s/p 5:12:37 } +2024-07-25 19:55:59,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 260/ 1625], loss: 1.411, per_step_time: 1474ms, lr: 2.8828688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:59,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.42679 samples/s/p 5:13:00 } +2024-07-25 19:56:02,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 262/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 2.8826234e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:56:02,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43132 samples/s/p 5:12:42 } +2024-07-25 19:56:05,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 264/ 1625], loss: 1.197, per_step_time: 1474ms, lr: 2.8823779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:05,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.42632 samples/s/p 5:12:56 } +2024-07-25 19:56:08,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 266/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.8821318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:08,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.42873 samples/s/p 5:12:45 } +2024-07-25 19:56:11,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 268/ 1625], loss: 1.161, per_step_time: 1470ms, lr: 2.8818857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:11,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43937 samples/s/p 5:12:05 } +2024-07-25 19:56:14,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 270/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 2.8816394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:14,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43827 samples/s/p 5:12:06 } +2024-07-25 19:56:17,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 272/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 2.8813927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:17,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43380 samples/s/p 5:12:18 } +2024-07-25 19:56:20,150 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 274/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.8811459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:20,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43363 samples/s/p 5:12:16 } +2024-07-25 19:56:23,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 276/ 1625], loss: 1.230, per_step_time: 1474ms, lr: 2.8808987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:23,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.42557 samples/s/p 5:12:41 } +2024-07-25 19:56:26,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 278/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 2.8806513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:26,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.42783 samples/s/p 5:12:30 } +2024-07-25 19:56:29,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 280/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 2.8804037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:29,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43624 samples/s/p 5:11:58 } +2024-07-25 19:56:31,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 282/ 1625], loss: 1.205, per_step_time: 1473ms, lr: 2.8801558e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:31,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.42824 samples/s/p 5:12:23 } +2024-07-25 19:56:34,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 284/ 1625], loss: 1.280, per_step_time: 1471ms, lr: 2.8799077e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:56:34,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43726 samples/s/p 5:11:49 } +2024-07-25 19:56:37,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 286/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 2.8796594e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:37,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43791 samples/s/p 5:11:44 } +2024-07-25 19:56:40,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 288/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 2.8794107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:40,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43836 samples/s/p 5:11:39 } +2024-07-25 19:56:43,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 290/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 2.879162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:43,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43528 samples/s/p 5:11:47 } +2024-07-25 19:56:46,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 292/ 1625], loss: 0.990, per_step_time: 1471ms, lr: 2.8789127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:46,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43489 samples/s/p 5:11:45 } +2024-07-25 19:56:49,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 294/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 2.8786633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:49,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43692 samples/s/p 5:11:35 } +2024-07-25 19:56:52,619 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 296/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.8784138e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:52,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43519 samples/s/p 5:11:38 } +2024-07-25 19:56:55,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 298/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 2.8781642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:55,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43351 samples/s/p 5:11:41 } +2024-07-25 19:56:58,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 300/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 2.8779139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:58,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43872 samples/s/p 5:11:20 } +2024-07-25 19:57:01,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 302/ 1625], loss: 1.402, per_step_time: 1471ms, lr: 2.8776638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:01,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.43810 samples/s/p 5:11:20 } +2024-07-25 19:57:04,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 304/ 1625], loss: 1.081, per_step_time: 1473ms, lr: 2.8774133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:04,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.42779 samples/s/p 5:11:52 } +2024-07-25 19:57:07,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 306/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 2.8771623e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:57:07,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.43169 samples/s/p 5:11:36 } +2024-07-25 19:57:10,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 308/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.8769113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:10,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.43807 samples/s/p 5:11:11 } +2024-07-25 19:57:13,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 310/ 1625], loss: 1.234, per_step_time: 1473ms, lr: 2.87666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:13,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.42778 samples/s/p 5:11:43 } +2024-07-25 19:57:16,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 312/ 1625], loss: 1.311, per_step_time: 1473ms, lr: 2.8764085e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:16,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.42995 samples/s/p 5:11:33 } +2024-07-25 19:57:19,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 314/ 1625], loss: 1.183, per_step_time: 1474ms, lr: 2.8761566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:19,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.42497 samples/s/p 5:11:47 } +2024-07-25 19:57:22,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 316/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.8759046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:22,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.43421 samples/s/p 5:11:12 } +2024-07-25 19:57:25,095 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 318/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 2.8756524e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:25,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.43319 samples/s/p 5:11:13 } +2024-07-25 19:57:28,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 320/ 1625], loss: 1.310, per_step_time: 1471ms, lr: 2.8753999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:28,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.43608 samples/s/p 5:11:00 } +2024-07-25 19:57:30,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 322/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 2.875147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:30,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.43244 samples/s/p 5:11:10 } +2024-07-25 19:57:33,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 324/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.8748942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:33,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.42792 samples/s/p 5:11:22 } +2024-07-25 19:57:36,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 326/ 1625], loss: 1.234, per_step_time: 1470ms, lr: 2.8746406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:36,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.43909 samples/s/p 5:10:41 } +2024-07-25 19:57:39,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 328/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 2.8743872e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:57:39,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.43398 samples/s/p 5:10:55 } +2024-07-25 19:57:42,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 330/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 2.8741335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:42,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.43510 samples/s/p 5:10:49 } +2024-07-25 19:57:45,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 332/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 2.8738794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:45,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.43710 samples/s/p 5:10:39 } +2024-07-25 19:57:48,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 334/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.8736255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:48,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43415 samples/s/p 5:10:46 } +2024-07-25 19:57:51,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 336/ 1625], loss: 1.295, per_step_time: 1473ms, lr: 2.8733708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:51,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43014 samples/s/p 5:10:57 } +2024-07-25 19:57:54,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 338/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 2.8731161e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:54,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43278 samples/s/p 5:10:45 } +2024-07-25 19:57:57,566 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 340/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 2.8728611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:57,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43064 samples/s/p 5:10:49 } +2024-07-25 19:58:00,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 342/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.872606e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:00,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43836 samples/s/p 5:10:20 } +2024-07-25 19:58:03,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 344/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.8723503e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:03,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43085 samples/s/p 5:10:43 } +2024-07-25 19:58:06,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 346/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 2.8720948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:06,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43145 samples/s/p 5:10:38 } +2024-07-25 19:58:09,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 348/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 2.871839e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:09,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.42963 samples/s/p 5:10:41 } +2024-07-25 19:58:12,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 350/ 1625], loss: 1.091, per_step_time: 1470ms, lr: 2.8715825e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:58:12,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.44028 samples/s/p 5:10:01 } +2024-07-25 19:58:15,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 352/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.8713264e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:15,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43158 samples/s/p 5:10:28 } +2024-07-25 19:58:18,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 354/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 2.8710696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:18,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43699 samples/s/p 5:10:07 } +2024-07-25 19:58:21,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 356/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 2.8708128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:21,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43185 samples/s/p 5:10:22 } +2024-07-25 19:58:24,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 358/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 2.8705555e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:24,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43322 samples/s/p 5:10:14 } +2024-07-25 19:58:27,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 360/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 2.8702983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:27,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43797 samples/s/p 5:09:55 } +2024-07-25 19:58:30,029 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 362/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.8700404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:30,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43708 samples/s/p 5:09:55 } +2024-07-25 19:58:32,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 364/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 2.8697825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:32,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43941 samples/s/p 5:09:44 } +2024-07-25 19:58:35,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 366/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 2.8695245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:35,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43677 samples/s/p 5:09:50 } +2024-07-25 19:58:38,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 368/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.869266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:38,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43735 samples/s/p 5:09:45 } +2024-07-25 19:58:41,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 370/ 1625], loss: 1.045, per_step_time: 1473ms, lr: 2.8690074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:41,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.42965 samples/s/p 5:10:08 } +2024-07-25 19:58:44,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 372/ 1625], loss: 1.169, per_step_time: 1472ms, lr: 2.8687486e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:58:44,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43288 samples/s/p 5:09:54 } +2024-07-25 19:58:47,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 374/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.8684895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:47,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43831 samples/s/p 5:09:33 } +2024-07-25 19:58:50,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 376/ 1625], loss: 1.363, per_step_time: 1471ms, lr: 2.8682301e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:50,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43570 samples/s/p 5:09:39 } +2024-07-25 19:58:53,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 378/ 1625], loss: 1.099, per_step_time: 1475ms, lr: 2.8679706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:53,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.42096 samples/s/p 5:10:26 } +2024-07-25 19:58:56,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 380/ 1625], loss: 1.299, per_step_time: 1472ms, lr: 2.8677106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:56,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43231 samples/s/p 5:09:45 } +2024-07-25 19:58:59,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 382/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 2.8674505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:59,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43387 samples/s/p 5:09:36 } +2024-07-25 19:59:02,500 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 384/ 1625], loss: 1.025, per_step_time: 1473ms, lr: 2.8671904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:02,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.42994 samples/s/p 5:09:47 } +2024-07-25 19:59:05,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 386/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.8669298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:05,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43366 samples/s/p 5:09:31 } +2024-07-25 19:59:08,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 388/ 1625], loss: 1.387, per_step_time: 1473ms, lr: 2.8666691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:08,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.42957 samples/s/p 5:09:42 } +2024-07-25 19:59:11,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 390/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.866408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:11,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43459 samples/s/p 5:09:22 } +2024-07-25 19:59:14,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 392/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 2.8661465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:14,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.44116 samples/s/p 5:08:57 } +2024-07-25 19:59:17,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 394/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.865885e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:59:17,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43242 samples/s/p 5:09:24 } +2024-07-25 19:59:20,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 396/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.8656234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:20,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43479 samples/s/p 5:09:13 } +2024-07-25 19:59:23,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 398/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 2.8653612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:23,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43396 samples/s/p 5:09:12 } +2024-07-25 19:59:26,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 400/ 1625], loss: 1.107, per_step_time: 1473ms, lr: 2.865099e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:26,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.42943 samples/s/p 5:09:25 } +2024-07-25 19:59:29,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 402/ 1625], loss: 0.941, per_step_time: 1470ms, lr: 2.8648365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:29,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43980 samples/s/p 5:08:47 } +2024-07-25 19:59:32,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 404/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.8645738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:32,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43792 samples/s/p 5:08:50 } +2024-07-25 19:59:34,963 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 406/ 1625], loss: 0.998, per_step_time: 1472ms, lr: 2.8643106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:34,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43340 samples/s/p 5:09:03 } +2024-07-25 19:59:37,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 408/ 1625], loss: 1.095, per_step_time: 1474ms, lr: 2.8640474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:37,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.42704 samples/s/p 5:09:21 } +2024-07-25 19:59:40,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 410/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 2.863784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:40,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43524 samples/s/p 5:08:50 } +2024-07-25 19:59:43,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 412/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.8635202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:43,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43457 samples/s/p 5:08:50 } +2024-07-25 19:59:46,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 414/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.8632563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:46,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43123 samples/s/p 5:08:58 } +2024-07-25 19:59:49,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 416/ 1625], loss: 1.040, per_step_time: 1471ms, lr: 2.8629922e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:59:49,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43784 samples/s/p 5:08:33 } +2024-07-25 19:59:52,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 418/ 1625], loss: 1.035, per_step_time: 1472ms, lr: 2.8627277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:52,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43354 samples/s/p 5:08:44 } +2024-07-25 19:59:55,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 420/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 2.8624629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:55,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43788 samples/s/p 5:08:27 } +2024-07-25 19:59:58,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 422/ 1625], loss: 1.160, per_step_time: 1470ms, lr: 2.862198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:58,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.44006 samples/s/p 5:08:16 } +2024-07-25 20:00:01,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 424/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 2.8619328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:01,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.44080 samples/s/p 5:08:11 } +2024-07-25 20:00:04,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 426/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.8616674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:04,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43543 samples/s/p 5:08:26 } +2024-07-25 20:00:07,419 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 428/ 1625], loss: 1.231, per_step_time: 1470ms, lr: 2.8614015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:07,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.44029 samples/s/p 5:08:07 } +2024-07-25 20:00:10,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 430/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 2.8611357e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:10,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43402 samples/s/p 5:08:25 } +2024-07-25 20:00:13,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 432/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.8608694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:13,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43694 samples/s/p 5:08:12 } +2024-07-25 20:00:16,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 434/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 2.8606033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:16,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.44192 samples/s/p 5:07:52 } +2024-07-25 20:00:19,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 436/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.8603366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:19,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43336 samples/s/p 5:08:19 } +2024-07-25 20:00:22,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 438/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 2.8600698e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:00:22,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43269 samples/s/p 5:08:18 } +2024-07-25 20:00:25,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 440/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 2.8598026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:25,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43795 samples/s/p 5:07:57 } +2024-07-25 20:00:28,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 442/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 2.8595354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:28,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43189 samples/s/p 5:08:15 } +2024-07-25 20:00:31,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 444/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 2.8592678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:31,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43344 samples/s/p 5:08:06 } +2024-07-25 20:00:33,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 446/ 1625], loss: 1.317, per_step_time: 1473ms, lr: 2.8589999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:33,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.42841 samples/s/p 5:08:21 } +2024-07-25 20:00:36,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 448/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.858732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:36,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.43281 samples/s/p 5:08:03 } +2024-07-25 20:00:39,883 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 450/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 2.8584634e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:39,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.43577 samples/s/p 5:07:50 } +2024-07-25 20:00:42,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 452/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 2.858195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:42,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.42985 samples/s/p 5:08:07 } +2024-07-25 20:00:45,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 454/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 2.8579261e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:45,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.43957 samples/s/p 5:07:31 } +2024-07-25 20:00:48,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 456/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 2.857657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:48,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.42874 samples/s/p 5:08:05 } +2024-07-25 20:00:51,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 458/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 2.8573877e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:51,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.43018 samples/s/p 5:07:57 } +2024-07-25 20:00:54,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 460/ 1625], loss: 1.174, per_step_time: 1473ms, lr: 2.8571181e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:00:54,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.42779 samples/s/p 5:08:02 } +2024-07-25 20:00:57,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 462/ 1625], loss: 1.415, per_step_time: 1471ms, lr: 2.8568486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:57,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.43525 samples/s/p 5:07:34 } +2024-07-25 20:01:00,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 464/ 1625], loss: 1.383, per_step_time: 1473ms, lr: 2.8565784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:00,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.42981 samples/s/p 5:07:49 } +2024-07-25 20:01:03,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 466/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 2.8563083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:03,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.44131 samples/s/p 5:07:07 } +2024-07-25 20:01:06,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 468/ 1625], loss: 1.058, per_step_time: 1471ms, lr: 2.8560375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:06,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.43720 samples/s/p 5:07:18 } +2024-07-25 20:01:09,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 470/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 2.8557668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:09,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.42914 samples/s/p 5:07:43 } +2024-07-25 20:01:12,357 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 472/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 2.855496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:12,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.43158 samples/s/p 5:07:32 } +2024-07-25 20:01:15,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 474/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 2.8552247e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:15,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.43780 samples/s/p 5:07:08 } +2024-07-25 20:01:18,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 476/ 1625], loss: 1.055, per_step_time: 1474ms, lr: 2.8549533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:18,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.42433 samples/s/p 5:07:50 } +2024-07-25 20:01:21,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 478/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.8546816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:21,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.43317 samples/s/p 5:07:17 } +2024-07-25 20:01:24,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 480/ 1625], loss: 0.999, per_step_time: 1472ms, lr: 2.8544096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:24,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43431 samples/s/p 5:07:11 } +2024-07-25 20:01:27,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 482/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.8541375e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:01:27,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43485 samples/s/p 5:07:06 } +2024-07-25 20:01:30,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 484/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 2.853865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:30,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43671 samples/s/p 5:06:57 } +2024-07-25 20:01:33,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 486/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.8535924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:33,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43608 samples/s/p 5:06:56 } +2024-07-25 20:01:35,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 488/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.8533195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:35,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43521 samples/s/p 5:06:56 } +2024-07-25 20:01:38,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 490/ 1625], loss: 1.221, per_step_time: 1473ms, lr: 2.8530465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:38,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43046 samples/s/p 5:07:09 } +2024-07-25 20:01:41,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 492/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 2.8527731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:41,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43287 samples/s/p 5:06:58 } +2024-07-25 20:01:44,824 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 494/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 2.8524992e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:44,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43631 samples/s/p 5:06:43 } +2024-07-25 20:01:47,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 496/ 1625], loss: 1.042, per_step_time: 1472ms, lr: 2.8522254e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:47,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43381 samples/s/p 5:06:49 } +2024-07-25 20:01:50,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 498/ 1625], loss: 1.339, per_step_time: 1471ms, lr: 2.8519513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:50,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43713 samples/s/p 5:06:34 } +2024-07-25 20:01:53,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 500/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 2.8516772e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:53,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43750 samples/s/p 5:06:30 } +2024-07-25 20:01:56,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 502/ 1625], loss: 1.412, per_step_time: 1474ms, lr: 2.8514025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:56,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.42561 samples/s/p 5:07:08 } +2024-07-25 20:01:59,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 504/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 2.8511276e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:01:59,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43576 samples/s/p 5:06:30 } +2024-07-25 20:02:02,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 506/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 2.8508526e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:02,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43150 samples/s/p 5:06:42 } +2024-07-25 20:02:05,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 508/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.8505772e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:05,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.44062 samples/s/p 5:06:08 } +2024-07-25 20:02:08,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 510/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.8503016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:08,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43287 samples/s/p 5:06:31 } +2024-07-25 20:02:11,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 512/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 2.8500259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:11,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43624 samples/s/p 5:06:17 } +2024-07-25 20:02:14,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 514/ 1625], loss: 1.138, per_step_time: 1473ms, lr: 2.8497498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:14,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.42783 samples/s/p 5:06:42 } +2024-07-25 20:02:17,289 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 516/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 2.8494736e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:17,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43840 samples/s/p 5:06:04 } +2024-07-25 20:02:20,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 518/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 2.849197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:20,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43155 samples/s/p 5:06:24 } +2024-07-25 20:02:23,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 520/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 2.8489203e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:23,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43644 samples/s/p 5:06:04 } +2024-07-25 20:02:26,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 522/ 1625], loss: 1.090, per_step_time: 1473ms, lr: 2.8486435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:26,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43049 samples/s/p 5:06:22 } +2024-07-25 20:02:29,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 524/ 1625], loss: 1.129, per_step_time: 1470ms, lr: 2.848366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:29,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43979 samples/s/p 5:05:47 } +2024-07-25 20:02:32,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 526/ 1625], loss: 1.340, per_step_time: 1471ms, lr: 2.8480888e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:02:32,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43563 samples/s/p 5:05:58 } +2024-07-25 20:02:34,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 528/ 1625], loss: 1.487, per_step_time: 1470ms, lr: 2.8478109e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:34,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43972 samples/s/p 5:05:42 } +2024-07-25 20:02:37,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 530/ 1625], loss: 1.236, per_step_time: 1473ms, lr: 2.8475331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:37,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43104 samples/s/p 5:06:08 } +2024-07-25 20:02:40,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 532/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 2.8472548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:40,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43929 samples/s/p 5:05:37 } +2024-07-25 20:02:43,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 534/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.8469765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:43,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43356 samples/s/p 5:05:54 } +2024-07-25 20:02:46,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 536/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 2.8466979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:46,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43767 samples/s/p 5:05:37 } +2024-07-25 20:02:49,745 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 538/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 2.846419e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:49,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43698 samples/s/p 5:05:36 } +2024-07-25 20:02:52,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 540/ 1625], loss: 1.051, per_step_time: 1470ms, lr: 2.84614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:52,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43891 samples/s/p 5:05:27 } +2024-07-25 20:02:55,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 542/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.8458602e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:55,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43829 samples/s/p 5:05:26 } +2024-07-25 20:02:58,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 544/ 1625], loss: 1.299, per_step_time: 1471ms, lr: 2.845581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:58,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43610 samples/s/p 5:05:30 } +2024-07-25 20:03:01,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 546/ 1625], loss: 1.136, per_step_time: 1473ms, lr: 2.8453009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:01,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.42900 samples/s/p 5:05:51 } +2024-07-25 20:03:04,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 548/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 2.845021e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 20:03:04,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43849 samples/s/p 5:05:16 } +2024-07-25 20:03:07,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 550/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 2.8447404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:07,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43491 samples/s/p 5:05:25 } +2024-07-25 20:03:10,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 552/ 1625], loss: 1.030, per_step_time: 1472ms, lr: 2.8444598e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:10,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43237 samples/s/p 5:05:31 } +2024-07-25 20:03:13,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 554/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 2.8441791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:13,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43567 samples/s/p 5:05:17 } +2024-07-25 20:03:16,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 556/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 2.843898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:16,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43832 samples/s/p 5:05:05 } +2024-07-25 20:03:19,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 558/ 1625], loss: 1.013, per_step_time: 1469ms, lr: 2.8436167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:19,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.44342 samples/s/p 5:04:45 } +2024-07-25 20:03:22,198 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 560/ 1625], loss: 1.144, per_step_time: 1473ms, lr: 2.8433353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:22,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43004 samples/s/p 5:05:27 } +2024-07-25 20:03:25,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 562/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 2.8430537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:25,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43098 samples/s/p 5:05:21 } +2024-07-25 20:03:28,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 564/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 2.8427714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:28,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43852 samples/s/p 5:04:53 } +2024-07-25 20:03:31,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 566/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 2.8424893e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:31,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43972 samples/s/p 5:04:46 } +2024-07-25 20:03:34,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 568/ 1625], loss: 1.203, per_step_time: 1476ms, lr: 2.8422068e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:34,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.41715 samples/s/p 5:05:59 } +2024-07-25 20:03:36,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 570/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 2.8419241e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:03:36,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43784 samples/s/p 5:04:46 } +2024-07-25 20:03:39,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 572/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 2.841641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:39,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43828 samples/s/p 5:04:42 } +2024-07-25 20:03:42,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 574/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 2.8413579e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:42,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43322 samples/s/p 5:04:56 } +2024-07-25 20:03:45,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 576/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 2.8410743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:45,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43500 samples/s/p 5:04:47 } +2024-07-25 20:03:48,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 578/ 1625], loss: 1.349, per_step_time: 1471ms, lr: 2.8407909e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:48,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43526 samples/s/p 5:04:43 } +2024-07-25 20:03:51,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 580/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 2.8405067e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:51,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43467 samples/s/p 5:04:42 } +2024-07-25 20:03:54,665 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 582/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 2.8402226e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:54,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43288 samples/s/p 5:04:45 } +2024-07-25 20:03:57,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 584/ 1625], loss: 1.113, per_step_time: 1474ms, lr: 2.8399383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:57,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.42472 samples/s/p 5:05:10 } +2024-07-25 20:04:00,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 586/ 1625], loss: 1.062, per_step_time: 1473ms, lr: 2.8396536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:00,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43085 samples/s/p 5:04:46 } +2024-07-25 20:04:03,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 588/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 2.8393688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:03,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43618 samples/s/p 5:04:25 } +2024-07-25 20:04:06,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 590/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 2.8390838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:06,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.44107 samples/s/p 5:04:06 } +2024-07-25 20:04:09,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 592/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 2.8387982e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:04:09,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43914 samples/s/p 5:04:09 } +2024-07-25 20:04:12,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 594/ 1625], loss: 1.230, per_step_time: 1470ms, lr: 2.8385126e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:12,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43912 samples/s/p 5:04:07 } +2024-07-25 20:04:15,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 596/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 2.8382266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:15,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43341 samples/s/p 5:04:23 } +2024-07-25 20:04:18,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 598/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 2.8379409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:18,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43163 samples/s/p 5:04:26 } +2024-07-25 20:04:21,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 600/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 2.8376546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:21,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43481 samples/s/p 5:04:12 } +2024-07-25 20:04:24,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 602/ 1625], loss: 1.389, per_step_time: 1471ms, lr: 2.8373679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:24,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43588 samples/s/p 5:04:06 } +2024-07-25 20:04:27,126 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 604/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 2.8370812e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:27,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43929 samples/s/p 5:03:51 } +2024-07-25 20:04:30,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 606/ 1625], loss: 1.035, per_step_time: 1470ms, lr: 2.8367942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:30,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.44118 samples/s/p 5:03:42 } +2024-07-25 20:04:33,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 608/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 2.836507e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:33,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43741 samples/s/p 5:03:52 } +2024-07-25 20:04:35,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 610/ 1625], loss: 1.061, per_step_time: 1470ms, lr: 2.8362196e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:35,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43954 samples/s/p 5:03:42 } +2024-07-25 20:04:38,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 612/ 1625], loss: 1.135, per_step_time: 1474ms, lr: 2.835932e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:38,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.42412 samples/s/p 5:04:30 } +2024-07-25 20:04:41,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 614/ 1625], loss: 1.297, per_step_time: 1474ms, lr: 2.8356437e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:04:41,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.42704 samples/s/p 5:04:18 } +2024-07-25 20:04:44,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 616/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 2.8353556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:44,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43457 samples/s/p 5:03:49 } +2024-07-25 20:04:47,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 618/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 2.8350672e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:47,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43810 samples/s/p 5:03:35 } +2024-07-25 20:04:50,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 620/ 1625], loss: 1.351, per_step_time: 1471ms, lr: 2.8347786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:50,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43733 samples/s/p 5:03:34 } +2024-07-25 20:04:53,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 622/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.8344895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:53,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43834 samples/s/p 5:03:28 } +2024-07-25 20:04:56,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 624/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 2.8342007e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:56,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43952 samples/s/p 5:03:21 } +2024-07-25 20:04:59,583 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 626/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 2.8339113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:59,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.43026 samples/s/p 5:03:49 } +2024-07-25 20:05:02,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 628/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 2.8336215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:02,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.43223 samples/s/p 5:03:40 } +2024-07-25 20:05:05,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 630/ 1625], loss: 1.062, per_step_time: 1473ms, lr: 2.8333317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:05,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.42929 samples/s/p 5:03:47 } +2024-07-25 20:05:08,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 632/ 1625], loss: 1.066, per_step_time: 1473ms, lr: 2.8330414e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:08,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.42784 samples/s/p 5:03:48 } +2024-07-25 20:05:11,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 634/ 1625], loss: 1.235, per_step_time: 1473ms, lr: 2.8327513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:11,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.42923 samples/s/p 5:03:41 } +2024-07-25 20:05:14,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 636/ 1625], loss: 1.156, per_step_time: 1473ms, lr: 2.8324606e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:05:14,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.42923 samples/s/p 5:03:38 } +2024-07-25 20:05:17,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 638/ 1625], loss: 0.975, per_step_time: 1471ms, lr: 2.83217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:17,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.43518 samples/s/p 5:03:15 } +2024-07-25 20:05:20,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 640/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.831879e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:20,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.43578 samples/s/p 5:03:10 } +2024-07-25 20:05:23,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 642/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 2.8315875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:23,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.43829 samples/s/p 5:02:59 } +2024-07-25 20:05:26,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 644/ 1625], loss: 1.260, per_step_time: 1473ms, lr: 2.831296e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:26,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.42848 samples/s/p 5:03:29 } +2024-07-25 20:05:29,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 646/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 2.8310042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:29,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.43742 samples/s/p 5:02:56 } +2024-07-25 20:05:32,063 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 648/ 1625], loss: 1.377, per_step_time: 1474ms, lr: 2.8307122e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:32,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.42663 samples/s/p 5:03:29 } +2024-07-25 20:05:35,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 650/ 1625], loss: 1.391, per_step_time: 1469ms, lr: 2.8304199e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:35,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.44258 samples/s/p 5:02:33 } +2024-07-25 20:05:37,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 652/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 2.8301274e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:37,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.43756 samples/s/p 5:02:46 } +2024-07-25 20:05:40,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 654/ 1625], loss: 1.057, per_step_time: 1473ms, lr: 2.8298351e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:40,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.42870 samples/s/p 5:03:13 } +2024-07-25 20:05:43,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 656/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 2.829542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:43,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.43774 samples/s/p 5:02:40 } +2024-07-25 20:05:46,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 658/ 1625], loss: 1.197, per_step_time: 1470ms, lr: 2.829249e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:05:46,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.43978 samples/s/p 5:02:30 } +2024-07-25 20:05:49,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 660/ 1625], loss: 1.343, per_step_time: 1471ms, lr: 2.8289556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:49,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43728 samples/s/p 5:02:36 } +2024-07-25 20:05:52,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 662/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 2.828662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:52,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43582 samples/s/p 5:02:38 } +2024-07-25 20:05:55,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 664/ 1625], loss: 1.308, per_step_time: 1472ms, lr: 2.8283679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:55,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43144 samples/s/p 5:02:49 } +2024-07-25 20:05:58,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 666/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 2.8280738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:58,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43060 samples/s/p 5:02:49 } +2024-07-25 20:06:01,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 668/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 2.8277795e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:01,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43368 samples/s/p 5:02:36 } +2024-07-25 
20:06:04,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 670/ 1625], loss: 1.256, per_step_time: 1470ms, lr: 2.827485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:04,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43921 samples/s/p 5:02:14 } +2024-07-25 20:06:07,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 672/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 2.8271901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:07,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43680 samples/s/p 5:02:20 } +2024-07-25 20:06:10,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 674/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 2.826895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:10,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43523 samples/s/p 5:02:22 } +2024-07-25 20:06:13,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 676/ 1625], loss: 1.134, per_step_time: 1470ms, lr: 2.8265997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:13,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43916 samples/s/p 5:02:06 } +2024-07-25 20:06:16,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 678/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 2.826304e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:16,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43246 samples/s/p 5:02:25 } +2024-07-25 20:06:19,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 680/ 1625], loss: 1.368, per_step_time: 1473ms, lr: 2.8260083e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:06:19,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43006 samples/s/p 5:02:30 } +2024-07-25 20:06:22,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 682/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 2.8257125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:22,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43412 samples/s/p 5:02:14 } +2024-07-25 20:06:25,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 684/ 1625], loss: 1.144, per_step_time: 1472ms, lr: 2.8254162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:25,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43457 samples/s/p 5:02:09 } +2024-07-25 20:06:28,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 686/ 1625], loss: 0.980, per_step_time: 1470ms, lr: 2.8251197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:28,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.44194 samples/s/p 5:01:42 } +2024-07-25 20:06:31,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 688/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 2.8248229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:31,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43194 samples/s/p 5:02:12 } +2024-07-25 20:06:34,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 690/ 1625], loss: 1.326, per_step_time: 1473ms, lr: 2.824526e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:34,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.42830 samples/s/p 5:02:21 } 
+2024-07-25 20:06:36,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 692/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.8242288e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:36,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43312 samples/s/p 5:02:02 } +2024-07-25 20:06:39,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 694/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.8239314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:39,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43156 samples/s/p 5:02:05 } +2024-07-25 20:06:42,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 696/ 1625], loss: 1.245, per_step_time: 1471ms, lr: 2.8236338e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:42,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43594 samples/s/p 5:01:47 } +2024-07-25 20:06:45,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 698/ 1625], loss: 1.226, per_step_time: 1473ms, lr: 2.823336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:45,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43083 samples/s/p 5:02:01 } +2024-07-25 20:06:48,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 700/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 2.8230377e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:48,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43216 samples/s/p 5:01:54 } +2024-07-25 20:06:51,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 702/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 
2.8227394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:51,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43231 samples/s/p 5:01:50 } +2024-07-25 20:06:54,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 704/ 1625], loss: 1.274, per_step_time: 1473ms, lr: 2.8224411e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:54,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.42991 samples/s/p 5:01:55 } +2024-07-25 20:06:57,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 706/ 1625], loss: 1.317, per_step_time: 1471ms, lr: 2.822142e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:57,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43702 samples/s/p 5:01:29 } +2024-07-25 20:07:00,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 708/ 1625], loss: 1.182, per_step_time: 1474ms, lr: 2.8218434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:00,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.42483 samples/s/p 5:02:07 } +2024-07-25 20:07:03,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 710/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 2.821544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:03,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43060 samples/s/p 5:01:44 } +2024-07-25 20:07:06,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 712/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 2.8212444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:06,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43429 
samples/s/p 5:01:29 } +2024-07-25 20:07:09,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 714/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.8209444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:09,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43568 samples/s/p 5:01:22 } +2024-07-25 20:07:12,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 716/ 1625], loss: 1.227, per_step_time: 1470ms, lr: 2.8206448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:12,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43957 samples/s/p 5:01:06 } +2024-07-25 20:07:15,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 718/ 1625], loss: 1.190, per_step_time: 1474ms, lr: 2.8203443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:15,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.42602 samples/s/p 5:01:48 } +2024-07-25 20:07:18,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 720/ 1625], loss: 1.027, per_step_time: 1472ms, lr: 2.8200438e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:18,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43213 samples/s/p 5:01:24 } +2024-07-25 20:07:21,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 722/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 2.8197432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:21,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43785 samples/s/p 5:01:03 } +2024-07-25 20:07:24,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 724/ 1625], loss: 1.173, per_step_time: 
1470ms, lr: 2.8194423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:24,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.44036 samples/s/p 5:00:51 } +2024-07-25 20:07:27,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 726/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.819141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:27,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43533 samples/s/p 5:01:05 } +2024-07-25 20:07:30,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 728/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 2.8188399e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:30,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43018 samples/s/p 5:01:19 } +2024-07-25 20:07:33,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 730/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 2.818538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:33,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43077 samples/s/p 5:01:14 } +2024-07-25 20:07:36,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 732/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.8182361e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:36,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43632 samples/s/p 5:00:53 } +2024-07-25 20:07:38,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 734/ 1625], loss: 1.320, per_step_time: 1472ms, lr: 2.817934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:38,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 
5.43321 samples/s/p 5:01:00 } +2024-07-25 20:07:41,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 736/ 1625], loss: 1.435, per_step_time: 1471ms, lr: 2.8176317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:41,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43652 samples/s/p 5:00:46 } +2024-07-25 20:07:44,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 738/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 2.817329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:44,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43378 samples/s/p 5:00:52 } +2024-07-25 20:07:47,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 740/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 2.8170265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:47,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43818 samples/s/p 5:00:35 } +2024-07-25 20:07:50,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 742/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 2.8167233e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:50,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43660 samples/s/p 5:00:37 } +2024-07-25 20:07:53,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 744/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 2.8164202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:53,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43299 samples/s/p 5:00:46 } +2024-07-25 20:07:56,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 746/ 1625], loss: 1.239, 
per_step_time: 1471ms, lr: 2.8161166e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:56,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43797 samples/s/p 5:00:27 } +2024-07-25 20:07:59,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 748/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 2.8158129e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:59,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43214 samples/s/p 5:00:43 } +2024-07-25 20:08:02,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 750/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 2.815509e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:02,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43849 samples/s/p 5:00:19 } +2024-07-25 20:08:05,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 752/ 1625], loss: 1.284, per_step_time: 1473ms, lr: 2.8152048e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:05,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.42945 samples/s/p 5:00:46 } +2024-07-25 20:08:08,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 754/ 1625], loss: 1.219, per_step_time: 1470ms, lr: 2.8149003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:08,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43941 samples/s/p 5:00:10 } +2024-07-25 20:08:11,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 756/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.8145956e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:11,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% 
|████████████ | 5.43489 samples/s/p 5:00:22 } +2024-07-25 20:08:14,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 758/ 1625], loss: 1.360, per_step_time: 1471ms, lr: 2.8142907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:14,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43731 samples/s/p 5:00:11 } +2024-07-25 20:08:17,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 760/ 1625], loss: 1.331, per_step_time: 1473ms, lr: 2.8139855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:17,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43019 samples/s/p 5:00:32 } +2024-07-25 20:08:20,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 762/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.8136801e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:20,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43759 samples/s/p 5:00:05 } +2024-07-25 20:08:23,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 764/ 1625], loss: 1.074, per_step_time: 1473ms, lr: 2.8133745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:23,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43056 samples/s/p 5:00:25 } +2024-07-25 20:08:26,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 766/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.8130687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:26,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43732 samples/s/p 5:00:00 } +2024-07-25 20:08:29,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 768/ 1625], loss: 
1.185, per_step_time: 1472ms, lr: 2.8127626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:29,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43222 samples/s/p 5:00:14 } +2024-07-25 20:08:32,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 770/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.8124563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:32,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43227 samples/s/p 5:00:10 } +2024-07-25 20:08:35,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 772/ 1625], loss: 1.004, per_step_time: 1471ms, lr: 2.8121498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:35,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43836 samples/s/p 4:59:47 } +2024-07-25 20:08:37,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 774/ 1625], loss: 1.152, per_step_time: 1469ms, lr: 2.8118431e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:37,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.44269 samples/s/p 4:59:30 } +2024-07-25 20:08:40,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 776/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 2.811536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:40,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43960 samples/s/p 4:59:37 } +2024-07-25 20:08:43,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 778/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 2.8112287e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:43,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
24.8% |████████████ | 5.43916 samples/s/p 4:59:36 } +2024-07-25 20:08:46,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 780/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 2.8109214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:46,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43970 samples/s/p 4:59:31 } +2024-07-25 20:08:49,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 782/ 1625], loss: 1.063, per_step_time: 1473ms, lr: 2.8106135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:49,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.42944 samples/s/p 5:00:02 } +2024-07-25 20:08:52,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 784/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 2.8103057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:52,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43369 samples/s/p 4:59:45 } +2024-07-25 20:08:55,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 786/ 1625], loss: 1.206, per_step_time: 1469ms, lr: 2.8099974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:55,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.44493 samples/s/p 4:59:05 } +2024-07-25 20:08:58,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 788/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 2.8096889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:58,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43469 samples/s/p 4:59:36 } +2024-07-25 20:09:01,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 790/ 1625], 
loss: 1.223, per_step_time: 1470ms, lr: 2.8093804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:01,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43954 samples/s/p 4:59:17 } +2024-07-25 20:09:04,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 792/ 1625], loss: 1.290, per_step_time: 1471ms, lr: 2.8090715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:04,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43576 samples/s/p 4:59:26 } +2024-07-25 20:09:07,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 794/ 1625], loss: 1.017, per_step_time: 1471ms, lr: 2.8087625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:07,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43809 samples/s/p 4:59:16 } +2024-07-25 20:09:10,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 796/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.8084534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:10,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43252 samples/s/p 4:59:31 } +2024-07-25 20:09:13,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 798/ 1625], loss: 1.312, per_step_time: 1473ms, lr: 2.8081437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:13,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43014 samples/s/p 4:59:36 } +2024-07-25 20:09:16,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 800/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 2.8078339e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:16,337 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 24.9% |████████████ | 5.43878 samples/s/p 4:59:05 } +2024-07-25 20:09:19,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 802/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 2.8075237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:19,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43170 samples/s/p 4:59:25 } +2024-07-25 20:09:22,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 804/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 2.8072136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:22,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43021 samples/s/p 4:59:27 } +2024-07-25 20:09:25,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 806/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 2.8069033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:25,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43527 samples/s/p 4:59:07 } +2024-07-25 20:09:28,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 808/ 1625], loss: 1.130, per_step_time: 1469ms, lr: 2.8065924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:28,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.44285 samples/s/p 4:58:40 } +2024-07-25 20:09:31,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 810/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 2.8062814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:31,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43240 samples/s/p 4:59:11 } +2024-07-25 20:09:34,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 812/ 
1625], loss: 1.173, per_step_time: 1471ms, lr: 2.8059701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:34,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43828 samples/s/p 4:58:49 } +2024-07-25 20:09:36,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 814/ 1625], loss: 1.341, per_step_time: 1471ms, lr: 2.8056587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:36,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43664 samples/s/p 4:58:51 } +2024-07-25 20:09:39,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 816/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 2.8053471e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:39,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43808 samples/s/p 4:58:43 } +2024-07-25 20:09:42,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 818/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 2.8050354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:42,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43047 samples/s/p 4:59:06 } +2024-07-25 20:09:45,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 820/ 1625], loss: 1.054, per_step_time: 1470ms, lr: 2.8047232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:45,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.44122 samples/s/p 4:58:27 } +2024-07-25 20:09:48,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 822/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 2.8044109e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:48,798 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.42837 samples/s/p 4:59:07 } +2024-07-25 20:09:51,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 824/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 2.8040982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:51,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43390 samples/s/p 4:58:45 } +2024-07-25 20:09:54,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 826/ 1625], loss: 1.193, per_step_time: 1471ms, lr: 2.8037857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:54,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43519 samples/s/p 4:58:38 } +2024-07-25 20:09:57,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 828/ 1625], loss: 1.145, per_step_time: 1470ms, lr: 2.8034725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:57,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43910 samples/s/p 4:58:22 } +2024-07-25 20:10:00,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 830/ 1625], loss: 1.069, per_step_time: 1473ms, lr: 2.8031593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:00,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.42854 samples/s/p 4:58:54 } +2024-07-25 20:10:03,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 832/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 2.8028457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:03,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43786 samples/s/p 4:58:21 } +2024-07-25 20:10:06,500 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 834/ 1625], loss: 1.221, per_step_time: 1470ms, lr: 2.802532e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:06,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43979 samples/s/p 4:58:11 } +2024-07-25 20:10:09,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 836/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.8022181e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:09,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43110 samples/s/p 4:58:37 } +2024-07-25 20:10:12,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 838/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 2.8019038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:12,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.42752 samples/s/p 4:58:46 } +2024-07-25 20:10:15,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 840/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.8015895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:15,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.43761 samples/s/p 4:58:10 } +2024-07-25 20:10:18,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 842/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 2.8012748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:18,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.43534 samples/s/p 4:58:14 } +2024-07-25 20:10:21,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 844/ 1625], loss: 1.199, per_step_time: 1469ms, lr: 2.80096e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:10:21,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.44290 samples/s/p 4:57:46 } +2024-07-25 20:10:24,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 846/ 1625], loss: 1.312, per_step_time: 1470ms, lr: 2.8006447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:24,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.44026 samples/s/p 4:57:52 } +2024-07-25 20:10:27,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 848/ 1625], loss: 1.213, per_step_time: 1474ms, lr: 2.8003293e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:27,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.42694 samples/s/p 4:58:33 } +2024-07-25 20:10:30,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 850/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.8000139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:30,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.43293 samples/s/p 4:58:10 } +2024-07-25 20:10:33,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 852/ 1625], loss: 1.193, per_step_time: 1470ms, lr: 2.799698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:33,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.44193 samples/s/p 4:57:38 } +2024-07-25 20:10:36,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 854/ 1625], loss: 1.300, per_step_time: 1470ms, lr: 2.7993821e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:36,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43993 samples/s/p 4:57:42 } +2024-07-25 
20:10:38,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 856/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 2.7990658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:38,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43335 samples/s/p 4:58:00 } +2024-07-25 20:10:41,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 858/ 1625], loss: 1.109, per_step_time: 1471ms, lr: 2.7987491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:41,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43524 samples/s/p 4:57:51 } +2024-07-25 20:10:44,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 860/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.7984324e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:44,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43263 samples/s/p 4:57:57 } +2024-07-25 20:10:47,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 862/ 1625], loss: 1.279, per_step_time: 1469ms, lr: 2.7981154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:47,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.44254 samples/s/p 4:57:21 } +2024-07-25 20:10:50,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 864/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 2.7977982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:50,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43307 samples/s/p 4:57:49 } +2024-07-25 20:10:53,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 866/ 1625], loss: 0.923, per_step_time: 1470ms, lr: 2.7974807e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:10:53,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.44012 samples/s/p 4:57:23 } +2024-07-25 20:10:56,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 868/ 1625], loss: 1.200, per_step_time: 1474ms, lr: 2.7971631e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:56,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.42697 samples/s/p 4:58:04 } +2024-07-25 20:10:59,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 870/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 2.7968452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:59,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43196 samples/s/p 4:57:44 } +2024-07-25 20:11:02,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 872/ 1625], loss: 1.453, per_step_time: 1472ms, lr: 2.7965272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:02,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43426 samples/s/p 4:57:34 } +2024-07-25 20:11:05,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 874/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.7962087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:05,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43338 samples/s/p 4:57:34 } +2024-07-25 20:11:08,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 876/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.7958902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:08,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43368 samples/s/p 4:57:30 } 
+2024-07-25 20:11:11,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 878/ 1625], loss: 1.262, per_step_time: 1472ms, lr: 2.7955713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:11,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43115 samples/s/p 4:57:35 } +2024-07-25 20:11:14,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 880/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 2.7952523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:14,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43597 samples/s/p 4:57:16 } +2024-07-25 20:11:17,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 882/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 2.794933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:17,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43687 samples/s/p 4:57:10 } +2024-07-25 20:11:20,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 884/ 1625], loss: 1.304, per_step_time: 1476ms, lr: 2.7946136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:20,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.41678 samples/s/p 4:58:14 } +2024-07-25 20:11:23,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 886/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.7942939e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:23,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43777 samples/s/p 4:57:02 } +2024-07-25 20:11:26,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 888/ 1625], loss: 1.280, per_step_time: 1473ms, lr: 
2.7939739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:26,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.42928 samples/s/p 4:57:26 } +2024-07-25 20:11:29,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 890/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.7936538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:29,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43435 samples/s/p 4:57:07 } +2024-07-25 20:11:32,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 892/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.7933336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:32,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43309 samples/s/p 4:57:08 } +2024-07-25 20:11:35,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 894/ 1625], loss: 1.138, per_step_time: 1469ms, lr: 2.7930128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:35,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.44275 samples/s/p 4:56:33 } +2024-07-25 20:11:37,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 896/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.7926919e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:37,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43222 samples/s/p 4:57:05 } +2024-07-25 20:11:40,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 898/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 2.7923708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:40,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43115 
samples/s/p 4:57:06 } +2024-07-25 20:11:43,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 900/ 1625], loss: 1.450, per_step_time: 1471ms, lr: 2.7920494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:43,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43547 samples/s/p 4:56:48 } +2024-07-25 20:11:46,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 902/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.7917278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:46,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43741 samples/s/p 4:56:39 } +2024-07-25 20:11:49,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 904/ 1625], loss: 1.411, per_step_time: 1472ms, lr: 2.791406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:49,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43324 samples/s/p 4:56:50 } +2024-07-25 20:11:52,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 906/ 1625], loss: 1.151, per_step_time: 1470ms, lr: 2.791084e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:52,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43963 samples/s/p 4:56:26 } +2024-07-25 20:11:55,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 908/ 1625], loss: 1.329, per_step_time: 1471ms, lr: 2.7907618e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:55,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43792 samples/s/p 4:56:29 } +2024-07-25 20:11:58,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 910/ 1625], loss: 1.191, per_step_time: 
1470ms, lr: 2.7904392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:58,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43896 samples/s/p 4:56:22 } +2024-07-25 20:12:01,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 912/ 1625], loss: 1.255, per_step_time: 1473ms, lr: 2.7901167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:01,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.42812 samples/s/p 4:56:55 } +2024-07-25 20:12:04,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 914/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 2.7897937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:04,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43862 samples/s/p 4:56:18 } +2024-07-25 20:12:07,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 916/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.7894706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:07,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43165 samples/s/p 4:56:37 } +2024-07-25 20:12:10,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 918/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 2.7891474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:10,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43259 samples/s/p 4:56:31 } +2024-07-25 20:12:13,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 920/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 2.7888234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:13,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 
5.43917 samples/s/p 4:56:07 } +2024-07-25 20:12:16,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 922/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 2.7884998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:16,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43193 samples/s/p 4:56:28 } +2024-07-25 20:12:19,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 924/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 2.7881757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:19,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43831 samples/s/p 4:56:04 } +2024-07-25 20:12:22,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 926/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.7878514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:22,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43597 samples/s/p 4:56:09 } +2024-07-25 20:12:25,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 928/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 2.7875269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:25,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43618 samples/s/p 4:56:05 } +2024-07-25 20:12:28,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 930/ 1625], loss: 1.020, per_step_time: 1471ms, lr: 2.7872022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:28,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43637 samples/s/p 4:56:01 } +2024-07-25 20:12:31,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 932/ 1625], loss: 1.220, 
per_step_time: 1471ms, lr: 2.7868771e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:31,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43563 samples/s/p 4:56:01 } +2024-07-25 20:12:34,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 934/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 2.7865519e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:34,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43972 samples/s/p 4:55:45 } +2024-07-25 20:12:36,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 936/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 2.7862265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:36,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43809 samples/s/p 4:55:47 } +2024-07-25 20:12:39,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 938/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 2.7859009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:39,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43366 samples/s/p 4:55:58 } +2024-07-25 20:12:42,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 940/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.7855749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:42,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43690 samples/s/p 4:55:45 } +2024-07-25 20:12:45,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 942/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 2.7852488e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:45,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% 
|████████████ | 5.43583 samples/s/p 4:55:45 } +2024-07-25 20:12:48,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 944/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 2.7849223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:48,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43659 samples/s/p 4:55:40 } +2024-07-25 20:12:51,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 946/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 2.7845957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:51,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43894 samples/s/p 4:55:29 } +2024-07-25 20:12:54,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 948/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 2.7842689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:54,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43156 samples/s/p 4:55:51 } +2024-07-25 20:12:57,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 950/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.7839418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:57,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43712 samples/s/p 4:55:29 } +2024-07-25 20:12:57,652 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 20:13:33,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 952/ 1625], loss: 1.211, per_step_time: 2415ms, lr: 2.7836148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:33,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 3.31171 samples/s/p 8:05:04 } +2024-07-25 20:13:35,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 954/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.783287e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:35,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43433 samples/s/p 4:55:33 } +2024-07-25 20:13:38,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 956/ 1625], loss: 1.364, per_step_time: 1472ms, lr: 2.7829592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:38,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43365 samples/s/p 4:55:32 } +2024-07-25 20:13:41,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 958/ 1625], loss: 1.083, per_step_time: 1470ms, lr: 2.7826314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:41,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.44050 samples/s/p 4:55:07 } +2024-07-25 20:13:44,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 960/ 1625], loss: 1.353, per_step_time: 1472ms, lr: 2.7823033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:44,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43465 samples/s/p 4:55:23 } +2024-07-25 20:13:47,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 962/ 1625], loss: 1.129, per_step_time: 1470ms, lr: 
2.7819746e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:47,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43911 samples/s/p 4:55:05 } +2024-07-25 20:13:50,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 964/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 2.7816463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:50,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43181 samples/s/p 4:55:26 } +2024-07-25 20:13:53,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 966/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 2.7813174e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:53,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43657 samples/s/p 4:55:08 } +2024-07-25 20:13:56,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 968/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 2.780988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:56,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.43983 samples/s/p 4:54:54 } +2024-07-25 20:13:59,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 970/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.7806589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:59,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.43628 samples/s/p 4:55:03 } +2024-07-25 20:14:02,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 972/ 1625], loss: 1.335, per_step_time: 1472ms, lr: 2.7803293e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:02,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.43210 
samples/s/p 4:55:13 } +2024-07-25 20:14:05,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 974/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 2.7799997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:05,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.43251 samples/s/p 4:55:09 } +2024-07-25 20:14:08,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 976/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 2.7796697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:08,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.43273 samples/s/p 4:55:06 } +2024-07-25 20:14:11,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 978/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.7793394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:11,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.43417 samples/s/p 4:54:58 } +2024-07-25 20:14:14,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 980/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 2.7790089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:14,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.43643 samples/s/p 4:54:48 } +2024-07-25 20:14:17,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 982/ 1625], loss: 0.806, per_step_time: 1471ms, lr: 2.7786784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:17,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.43543 samples/s/p 4:54:48 } +2024-07-25 20:14:20,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 984/ 1625], loss: 1.072, 
per_step_time: 1471ms, lr: 2.7783473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:20,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43705 samples/s/p 4:54:40 } +2024-07-25 20:14:23,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 986/ 1625], loss: 1.046, per_step_time: 1470ms, lr: 2.7780163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:23,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.44011 samples/s/p 4:54:27 } +2024-07-25 20:14:26,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 988/ 1625], loss: 1.323, per_step_time: 1471ms, lr: 2.7776849e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:26,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43808 samples/s/p 4:54:30 } +2024-07-25 20:14:29,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 990/ 1625], loss: 1.321, per_step_time: 1470ms, lr: 2.7773533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:29,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43863 samples/s/p 4:54:26 } +2024-07-25 20:14:32,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 992/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.7770213e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:32,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43226 samples/s/p 4:54:43 } +2024-07-25 20:14:35,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 994/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.7766893e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:35,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
26.1% |█████████████ | 5.43423 samples/s/p 4:54:34 } +2024-07-25 20:14:37,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 996/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 2.7763572e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:37,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43540 samples/s/p 4:54:27 } +2024-07-25 20:14:40,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 998/ 1625], loss: 0.991, per_step_time: 1470ms, lr: 2.7760247e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:40,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43898 samples/s/p 4:54:13 } +2024-07-25 20:14:43,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1000/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.7756918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:43,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43246 samples/s/p 4:54:31 } +2024-07-25 20:14:46,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1002/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 2.775359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:46,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43851 samples/s/p 4:54:08 } +2024-07-25 20:14:49,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1004/ 1625], loss: 1.410, per_step_time: 1470ms, lr: 2.775026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:49,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.44188 samples/s/p 4:53:55 } +2024-07-25 20:14:52,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 
1006/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 2.7746924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:52,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43936 samples/s/p 4:54:00 } +2024-07-25 20:14:55,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1008/ 1625], loss: 1.236, per_step_time: 1473ms, lr: 2.7743588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:55,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.42746 samples/s/p 4:54:36 } +2024-07-25 20:14:58,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1010/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 2.774025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:58,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43934 samples/s/p 4:53:54 } +2024-07-25 20:15:01,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1012/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 2.7736909e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:01,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43245 samples/s/p 4:54:13 } +2024-07-25 20:15:04,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1014/ 1625], loss: 1.027, per_step_time: 1470ms, lr: 2.7733566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:04,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.44058 samples/s/p 4:53:44 } +2024-07-25 20:15:07,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1016/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 2.7730222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:07,459 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43131 samples/s/p 4:54:11 } +2024-07-25 20:15:10,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1018/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 2.7726874e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:10,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43361 samples/s/p 4:54:01 } +2024-07-25 20:15:13,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1020/ 1625], loss: 0.972, per_step_time: 1470ms, lr: 2.7723525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:13,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43943 samples/s/p 4:53:39 } +2024-07-25 20:15:16,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1022/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.7720173e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:16,310 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43478 samples/s/p 4:53:51 } +2024-07-25 20:15:19,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1024/ 1625], loss: 1.382, per_step_time: 1474ms, lr: 2.7716818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:19,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.42613 samples/s/p 4:54:16 } +2024-07-25 20:15:22,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1026/ 1625], loss: 1.045, per_step_time: 1473ms, lr: 2.771346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:22,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43100 samples/s/p 4:53:57 } +2024-07-25 20:15:25,169 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1028/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 2.7710103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:25,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43504 samples/s/p 4:53:41 } +2024-07-25 20:15:28,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1030/ 1625], loss: 1.203, per_step_time: 1473ms, lr: 2.7706741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:28,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.42859 samples/s/p 4:53:59 } +2024-07-25 20:15:31,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1032/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 2.7703378e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:31,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.44193 samples/s/p 4:53:13 } +2024-07-25 20:15:34,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1034/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.7700013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:34,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43537 samples/s/p 4:53:32 } +2024-07-25 20:15:36,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1036/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 2.7696644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:36,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43973 samples/s/p 4:53:14 } +2024-07-25 20:15:39,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1038/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 2.7693275e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:15:39,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43526 samples/s/p 4:53:26 } +2024-07-25 20:15:42,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1040/ 1625], loss: 1.193, per_step_time: 1474ms, lr: 2.7689903e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:42,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.42478 samples/s/p 4:53:57 } +2024-07-25 20:15:45,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1042/ 1625], loss: 0.997, per_step_time: 1471ms, lr: 2.7686527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:45,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43838 samples/s/p 4:53:10 } +2024-07-25 20:15:48,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1044/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 2.768315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:48,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.42950 samples/s/p 4:53:36 } +2024-07-25 20:15:51,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1046/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.7679771e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:51,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43576 samples/s/p 4:53:13 } +2024-07-25 20:15:54,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1048/ 1625], loss: 1.017, per_step_time: 1471ms, lr: 2.7676391e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:54,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43686 samples/s/p 4:53:06 
} +2024-07-25 20:15:57,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1050/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.7673008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:57,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43610 samples/s/p 4:53:06 } +2024-07-25 20:16:00,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1052/ 1625], loss: 1.420, per_step_time: 1472ms, lr: 2.766962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:00,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43287 samples/s/p 4:53:13 } +2024-07-25 20:16:03,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1054/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.7666232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:03,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43802 samples/s/p 4:52:54 } +2024-07-25 20:16:06,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1056/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.766284e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:06,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43008 samples/s/p 4:53:16 } +2024-07-25 20:16:09,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1058/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.765945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:09,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43794 samples/s/p 4:52:48 } +2024-07-25 20:16:12,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1060/ 1625], loss: 1.163, per_step_time: 1473ms, lr: 
2.7656057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:12,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.42825 samples/s/p 4:53:16 } +2024-07-25 20:16:15,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1062/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 2.7652659e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:15,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43109 samples/s/p 4:53:04 } +2024-07-25 20:16:18,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1064/ 1625], loss: 1.122, per_step_time: 1473ms, lr: 2.764926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:18,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43012 samples/s/p 4:53:04 } +2024-07-25 20:16:21,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1066/ 1625], loss: 1.355, per_step_time: 1471ms, lr: 2.764586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:21,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43682 samples/s/p 4:52:40 } +2024-07-25 20:16:24,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1068/ 1625], loss: 1.314, per_step_time: 1473ms, lr: 2.7642454e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:24,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.42764 samples/s/p 4:53:07 } +2024-07-25 20:16:27,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1070/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 2.763905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:27,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 
5.43739 samples/s/p 4:52:32 } +2024-07-25 20:16:30,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1072/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.763564e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:30,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43221 samples/s/p 4:52:46 } +2024-07-25 20:16:33,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1074/ 1625], loss: 1.086, per_step_time: 1482ms, lr: 2.7632228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:33,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.39712 samples/s/p 4:54:37 } +2024-07-25 20:16:36,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1076/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.7628816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:36,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43619 samples/s/p 4:52:27 } +2024-07-25 20:16:38,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1078/ 1625], loss: 1.014, per_step_time: 1471ms, lr: 2.7625401e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:38,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43811 samples/s/p 4:52:18 } +2024-07-25 20:16:41,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1080/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 2.7621985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:41,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43662 samples/s/p 4:52:20 } +2024-07-25 20:16:44,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1082/ 1625], loss: 
1.135, per_step_time: 1471ms, lr: 2.7618566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:44,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.43647 samples/s/p 4:52:17 } +2024-07-25 20:16:47,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1084/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.7615144e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:47,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.43659 samples/s/p 4:52:14 } +2024-07-25 20:16:50,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1086/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 2.7611719e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:50,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.43958 samples/s/p 4:52:01 } +2024-07-25 20:16:53,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1088/ 1625], loss: 1.078, per_step_time: 1474ms, lr: 2.7608294e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:53,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.42643 samples/s/p 4:52:41 } +2024-07-25 20:16:56,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1090/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 2.7604865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:56,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.43590 samples/s/p 4:52:07 } +2024-07-25 20:16:59,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1092/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 2.7601433e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:59,639 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 26.7% |█████████████ | 5.43433 samples/s/p 4:52:10 } +2024-07-25 20:17:02,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1094/ 1625], loss: 1.117, per_step_time: 1475ms, lr: 2.7598004e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:02,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.42269 samples/s/p 4:52:44 } +2024-07-25 20:17:05,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1096/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 2.7594568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:05,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.43336 samples/s/p 4:52:07 } +2024-07-25 20:17:08,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1098/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 2.759113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:08,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43560 samples/s/p 4:51:57 } +2024-07-25 20:17:11,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1100/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 2.758769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:11,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43733 samples/s/p 4:51:48 } +2024-07-25 20:17:14,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1102/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 2.7584249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:14,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43144 samples/s/p 4:52:04 } +2024-07-25 20:17:17,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], 
step:[ 1104/ 1625], loss: 1.382, per_step_time: 1471ms, lr: 2.7580805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:17,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43558 samples/s/p 4:51:48 } +2024-07-25 20:17:20,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1106/ 1625], loss: 1.127, per_step_time: 1482ms, lr: 2.7577358e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:20,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.39535 samples/s/p 4:53:55 } +2024-07-25 20:17:23,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1108/ 1625], loss: 1.325, per_step_time: 1473ms, lr: 2.7573911e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:23,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.42939 samples/s/p 4:52:02 } +2024-07-25 20:17:26,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1110/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 2.7570459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:26,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43452 samples/s/p 4:51:42 } +2024-07-25 20:17:29,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1112/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 2.7567006e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:29,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43823 samples/s/p 4:51:28 } +2024-07-25 20:17:32,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1114/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 2.756355e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:32,131 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.43675 samples/s/p 4:51:29 } +2024-07-25 20:17:35,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1116/ 1625], loss: 1.316, per_step_time: 1470ms, lr: 2.7560092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:35,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.44096 samples/s/p 4:51:13 } +2024-07-25 20:17:38,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1118/ 1625], loss: 1.126, per_step_time: 1473ms, lr: 2.7556633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:38,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.42928 samples/s/p 4:51:48 } +2024-07-25 20:17:40,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1120/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 2.7553173e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:40,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.43437 samples/s/p 4:51:28 } +2024-07-25 20:17:43,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1122/ 1625], loss: 1.196, per_step_time: 1474ms, lr: 2.7549708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:43,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.42728 samples/s/p 4:51:48 } +2024-07-25 20:17:46,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1124/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.754624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:46,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.42969 samples/s/p 4:51:37 } +2024-07-25 20:17:49,847 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1126/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.7542774e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:49,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.43117 samples/s/p 4:51:30 } +2024-07-25 20:17:52,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1128/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.7539303e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:52,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.43359 samples/s/p 4:51:19 } +2024-07-25 20:17:55,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1130/ 1625], loss: 1.198, per_step_time: 1470ms, lr: 2.7535827e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:55,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.44008 samples/s/p 4:50:55 } +2024-07-25 20:17:58,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1132/ 1625], loss: 1.112, per_step_time: 1469ms, lr: 2.7532353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:58,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.44248 samples/s/p 4:50:44 } +2024-07-25 20:18:01,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1134/ 1625], loss: 1.421, per_step_time: 1471ms, lr: 2.7528875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:01,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43785 samples/s/p 4:50:56 } +2024-07-25 20:18:04,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1136/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.7525399e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:18:04,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43448 samples/s/p 4:51:04 } +2024-07-25 20:18:07,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1138/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 2.7521915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:07,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43216 samples/s/p 4:51:09 } +2024-07-25 20:18:10,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1140/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.751843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:10,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43519 samples/s/p 4:50:56 } +2024-07-25 20:18:13,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1142/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 2.7514943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:13,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43640 samples/s/p 4:50:49 } +2024-07-25 20:18:16,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1144/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.7511456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:16,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43436 samples/s/p 4:50:53 } +2024-07-25 20:18:19,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1146/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 2.7507964e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:19,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43800 samples/s/p 4:50:38 
} +2024-07-25 20:18:22,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1148/ 1625], loss: 1.348, per_step_time: 1471ms, lr: 2.7504475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:22,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43598 samples/s/p 4:50:42 } +2024-07-25 20:18:25,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1150/ 1625], loss: 1.358, per_step_time: 1473ms, lr: 2.7500977e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:25,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43060 samples/s/p 4:50:56 } +2024-07-25 20:18:28,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1152/ 1625], loss: 1.253, per_step_time: 1470ms, lr: 2.7497483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:28,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43943 samples/s/p 4:50:25 } +2024-07-25 20:18:31,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1154/ 1625], loss: 1.227, per_step_time: 1469ms, lr: 2.749398e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:31,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.44305 samples/s/p 4:50:10 } +2024-07-25 20:18:34,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1156/ 1625], loss: 1.280, per_step_time: 1470ms, lr: 2.7490478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:34,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43946 samples/s/p 4:50:19 } +2024-07-25 20:18:37,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1158/ 1625], loss: 1.337, per_step_time: 1473ms, lr: 
2.7486976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:37,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.42991 samples/s/p 4:50:47 } +2024-07-25 20:18:39,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1160/ 1625], loss: 1.276, per_step_time: 1470ms, lr: 2.7483471e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:40,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43880 samples/s/p 4:50:15 } +2024-07-25 20:18:42,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1162/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.7479962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:42,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43337 samples/s/p 4:50:30 } +2024-07-25 20:18:45,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1164/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 2.747645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:45,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43012 samples/s/p 4:50:37 } +2024-07-25 20:18:48,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1166/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.7472937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:48,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43517 samples/s/p 4:50:18 } +2024-07-25 20:18:51,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1168/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 2.7469421e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:51,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 
5.42802 samples/s/p 4:50:38 } +2024-07-25 20:18:54,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1170/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 2.7465905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:54,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43595 samples/s/p 4:50:10 } +2024-07-25 20:18:57,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1172/ 1625], loss: 1.286, per_step_time: 1475ms, lr: 2.7462385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:57,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.42302 samples/s/p 4:50:48 } +2024-07-25 20:19:00,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1174/ 1625], loss: 1.341, per_step_time: 1473ms, lr: 2.7458864e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:00,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.42922 samples/s/p 4:50:25 } +2024-07-25 20:19:03,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1176/ 1625], loss: 1.062, per_step_time: 1472ms, lr: 2.745534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:03,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43160 samples/s/p 4:50:15 } +2024-07-25 20:19:06,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1178/ 1625], loss: 1.042, per_step_time: 1473ms, lr: 2.7451813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:06,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.42936 samples/s/p 4:50:19 } +2024-07-25 20:19:09,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1180/ 1625], loss: 
1.292, per_step_time: 1472ms, lr: 2.7448285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:09,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43265 samples/s/p 4:50:05 } +2024-07-25 20:19:12,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1182/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.7444756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:12,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43294 samples/s/p 4:50:01 } +2024-07-25 20:19:15,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1184/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 2.7441221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:15,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43642 samples/s/p 4:49:47 } +2024-07-25 20:19:18,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1186/ 1625], loss: 1.384, per_step_time: 1471ms, lr: 2.7437689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:18,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43662 samples/s/p 4:49:44 } +2024-07-25 20:19:21,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1188/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 2.7434153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:21,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43670 samples/s/p 4:49:41 } +2024-07-25 20:19:24,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1190/ 1625], loss: 1.260, per_step_time: 1470ms, lr: 2.7430611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:24,284 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 27.3% |█████████████ | 5.44050 samples/s/p 4:49:26 } +2024-07-25 20:19:27,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1192/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.742707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:27,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43162 samples/s/p 4:49:51 } +2024-07-25 20:19:30,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1194/ 1625], loss: 1.374, per_step_time: 1473ms, lr: 2.7423526e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:30,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.42999 samples/s/p 4:49:53 } +2024-07-25 20:19:33,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1196/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.7419981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:33,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43265 samples/s/p 4:49:42 } +2024-07-25 20:19:36,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1198/ 1625], loss: 1.360, per_step_time: 1474ms, lr: 2.7416432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:36,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.42604 samples/s/p 4:50:00 } +2024-07-25 20:19:39,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1200/ 1625], loss: 1.175, per_step_time: 1473ms, lr: 2.7412882e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:39,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43101 samples/s/p 4:49:41 } +2024-07-25 20:19:42,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], 
step:[ 1202/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.740933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:42,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43405 samples/s/p 4:49:29 } +2024-07-25 20:19:44,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1204/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.7405775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:44,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43547 samples/s/p 4:49:21 } +2024-07-25 20:19:47,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1206/ 1625], loss: 1.005, per_step_time: 1472ms, lr: 2.7402219e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:47,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43177 samples/s/p 4:49:30 } +2024-07-25 20:19:50,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1208/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 2.7398659e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:50,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43397 samples/s/p 4:49:20 } +2024-07-25 20:19:53,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1210/ 1625], loss: 1.316, per_step_time: 1473ms, lr: 2.7395097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:53,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43040 samples/s/p 4:49:28 } +2024-07-25 20:19:56,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1212/ 1625], loss: 0.947, per_step_time: 1471ms, lr: 2.7391534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:56,761 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43768 samples/s/p 4:49:02 } +2024-07-25 20:19:59,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1214/ 1625], loss: 1.312, per_step_time: 1473ms, lr: 2.7387967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:59,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.42928 samples/s/p 4:49:26 } +2024-07-25 20:20:02,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1216/ 1625], loss: 0.958, per_step_time: 1469ms, lr: 2.73844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:02,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.44491 samples/s/p 4:48:33 } +2024-07-25 20:20:05,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1218/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.7380831e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:05,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43439 samples/s/p 4:49:04 } +2024-07-25 20:20:08,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1220/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.7377257e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:08,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43780 samples/s/p 4:48:50 } +2024-07-25 20:20:11,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1222/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 2.7373682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:11,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43315 samples/s/p 4:49:02 } +2024-07-25 20:20:14,465 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1224/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 2.7370106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:14,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43609 samples/s/p 4:48:50 } +2024-07-25 20:20:17,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1226/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 2.7366526e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:17,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43359 samples/s/p 4:48:55 } +2024-07-25 20:20:20,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1228/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 2.7362947e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:20,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43563 samples/s/p 4:48:45 } +2024-07-25 20:20:23,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1230/ 1625], loss: 1.338, per_step_time: 1469ms, lr: 2.7359361e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:23,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.44236 samples/s/p 4:48:21 } +2024-07-25 20:20:26,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1232/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 2.7355776e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:26,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43353 samples/s/p 4:48:46 } +2024-07-25 20:20:29,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1234/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 2.735219e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:20:29,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43887 samples/s/p 4:48:26 } +2024-07-25 20:20:32,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1236/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 2.73486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:32,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43524 samples/s/p 4:48:35 } +2024-07-25 20:20:35,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1238/ 1625], loss: 1.128, per_step_time: 1473ms, lr: 2.734501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:35,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.42796 samples/s/p 4:48:55 } +2024-07-25 20:20:38,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1240/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 2.7341417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:38,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43289 samples/s/p 4:48:36 } +2024-07-25 20:20:41,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1242/ 1625], loss: 1.274, per_step_time: 1471ms, lr: 2.733782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:41,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43733 samples/s/p 4:48:19 } +2024-07-25 20:20:43,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1244/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 2.7334221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:43,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43115 samples/s/p 4:48:36 } 
+2024-07-25 20:20:46,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1246/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.733062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:46,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43680 samples/s/p 4:48:15 } +2024-07-25 20:20:49,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1248/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 2.7327018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:49,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.42999 samples/s/p 4:48:34 } +2024-07-25 20:20:52,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1250/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.732341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:52,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43196 samples/s/p 4:48:24 } +2024-07-25 20:20:55,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1252/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.7319802e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:55,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43792 samples/s/p 4:48:03 } +2024-07-25 20:20:58,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1254/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 2.7316195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:58,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43372 samples/s/p 4:48:13 } +2024-07-25 20:21:01,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1256/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 
2.7312582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:01,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43782 samples/s/p 4:47:57 } +2024-07-25 20:21:04,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1258/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.7308968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:04,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43688 samples/s/p 4:47:57 } +2024-07-25 20:21:07,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1260/ 1625], loss: 1.322, per_step_time: 1470ms, lr: 2.7305352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:07,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.43997 samples/s/p 4:47:44 } +2024-07-25 20:21:10,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1262/ 1625], loss: 0.940, per_step_time: 1470ms, lr: 2.7301734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:10,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.44020 samples/s/p 4:47:41 } +2024-07-25 20:21:13,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1264/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 2.7298112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:13,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.44001 samples/s/p 4:47:38 } +2024-07-25 20:21:16,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1266/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.729449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:16,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 
5.43560 samples/s/p 4:47:49 } +2024-07-25 20:21:19,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1268/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 2.729087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:19,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.43933 samples/s/p 4:47:35 } +2024-07-25 20:21:22,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1270/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.728724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:22,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.43364 samples/s/p 4:47:50 } +2024-07-25 20:21:25,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1272/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 2.7283611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:25,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.43582 samples/s/p 4:47:40 } +2024-07-25 20:21:28,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1274/ 1625], loss: 1.105, per_step_time: 1482ms, lr: 2.727998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:28,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.39490 samples/s/p 4:49:48 } +2024-07-25 20:21:31,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1276/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 2.7276346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:31,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43557 samples/s/p 4:47:35 } +2024-07-25 20:21:34,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1278/ 1625], loss: 1.097, 
per_step_time: 1472ms, lr: 2.7272712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:34,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43447 samples/s/p 4:47:35 } +2024-07-25 20:21:37,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1280/ 1625], loss: 1.093, per_step_time: 1472ms, lr: 2.7269074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:37,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43415 samples/s/p 4:47:33 } +2024-07-25 20:21:40,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1282/ 1625], loss: 0.872, per_step_time: 1470ms, lr: 2.7265432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:40,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43859 samples/s/p 4:47:16 } +2024-07-25 20:21:43,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1284/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 2.7261793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:43,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43674 samples/s/p 4:47:19 } +2024-07-25 20:21:45,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1286/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.725815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:45,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43255 samples/s/p 4:47:30 } +2024-07-25 20:21:48,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1288/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 2.7254502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:48,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
27.9% |█████████████ | 5.42932 samples/s/p 4:47:37 } +2024-07-25 20:21:51,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1290/ 1625], loss: 1.158, per_step_time: 1470ms, lr: 2.7250853e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:51,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.44145 samples/s/p 4:46:55 } +2024-07-25 20:21:54,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1292/ 1625], loss: 1.108, per_step_time: 1474ms, lr: 2.72472e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:54,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.42676 samples/s/p 4:47:39 } +2024-07-25 20:21:57,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1294/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 2.7243548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:57,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.43127 samples/s/p 4:47:22 } +2024-07-25 20:22:00,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1296/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.7239892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:00,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.43513 samples/s/p 4:47:07 } +2024-07-25 20:22:03,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1298/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 2.7236234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:03,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.43907 samples/s/p 4:46:51 } +2024-07-25 20:22:06,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 
1300/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 2.7232578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:06,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.43424 samples/s/p 4:47:04 } +2024-07-25 20:22:09,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1302/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 2.7228914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:09,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.43812 samples/s/p 4:46:48 } +2024-07-25 20:22:12,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1304/ 1625], loss: 1.342, per_step_time: 1477ms, lr: 2.7225251e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:12,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.41558 samples/s/p 4:47:57 } +2024-07-25 20:22:15,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1306/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 2.7221586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:15,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.43665 samples/s/p 4:46:47 } +2024-07-25 20:22:18,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1308/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.7217915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:18,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.43342 samples/s/p 4:46:54 } +2024-07-25 20:22:21,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1310/ 1625], loss: 1.328, per_step_time: 1472ms, lr: 2.7214248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:21,385 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43478 samples/s/p 4:46:47 } +2024-07-25 20:22:24,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1312/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 2.7210575e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:24,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43547 samples/s/p 4:46:42 } +2024-07-25 20:22:27,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1314/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 2.7206897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:27,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43886 samples/s/p 4:46:28 } +2024-07-25 20:22:30,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1316/ 1625], loss: 1.173, per_step_time: 1474ms, lr: 2.7203223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:30,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.42513 samples/s/p 4:47:09 } +2024-07-25 20:22:33,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1318/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 2.7199543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:33,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43661 samples/s/p 4:46:30 } +2024-07-25 20:22:36,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1320/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 2.7195862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:36,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43687 samples/s/p 4:46:26 } +2024-07-25 20:22:39,092 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1322/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 2.7192178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:39,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43398 samples/s/p 4:46:32 } +2024-07-25 20:22:42,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1324/ 1625], loss: 1.350, per_step_time: 1473ms, lr: 2.7188493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:42,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.42856 samples/s/p 4:46:46 } +2024-07-25 20:22:44,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1326/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 2.7184808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:44,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43758 samples/s/p 4:46:15 } +2024-07-25 20:22:47,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1328/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 2.7181119e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:47,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43800 samples/s/p 4:46:11 } +2024-07-25 20:22:50,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1330/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 2.7177426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:50,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43393 samples/s/p 4:46:20 } +2024-07-25 20:22:53,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1332/ 1625], loss: 1.136, per_step_time: 1470ms, lr: 2.7173732e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:53,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.44111 samples/s/p 4:45:55 } +2024-07-25 20:22:56,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1334/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 2.7170036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:56,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43612 samples/s/p 4:46:08 } +2024-07-25 20:22:59,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1336/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 2.7166338e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:59,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43583 samples/s/p 4:46:06 } +2024-07-25 20:23:02,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1338/ 1625], loss: 1.249, per_step_time: 1473ms, lr: 2.7162638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:02,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.42754 samples/s/p 4:46:29 } +2024-07-25 20:23:05,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1340/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 2.7158934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:05,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43683 samples/s/p 4:45:57 } +2024-07-25 20:23:08,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1342/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.7155229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:08,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43658 
samples/s/p 4:45:54 } +2024-07-25 20:23:11,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1344/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 2.7151524e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:11,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43738 samples/s/p 4:45:49 } +2024-07-25 20:23:14,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1346/ 1625], loss: 0.929, per_step_time: 1472ms, lr: 2.7147813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:14,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43441 samples/s/p 4:45:55 } +2024-07-25 20:23:17,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1348/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 2.7144102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:17,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43726 samples/s/p 4:45:43 } +2024-07-25 20:23:20,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1350/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 2.7140388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:20,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43497 samples/s/p 4:45:48 } +2024-07-25 20:23:23,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1352/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 2.7136673e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:23,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43320 samples/s/p 4:45:50 } +2024-07-25 20:23:26,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1354/ 1625], loss: 1.323, 
per_step_time: 1471ms, lr: 2.7132955e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:26,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43633 samples/s/p 4:45:38 } +2024-07-25 20:23:29,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1356/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 2.7129236e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:29,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43165 samples/s/p 4:45:49 } +2024-07-25 20:23:32,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1358/ 1625], loss: 1.182, per_step_time: 1470ms, lr: 2.7125512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:32,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.44076 samples/s/p 4:45:18 } +2024-07-25 20:23:35,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1360/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 2.712179e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:35,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.43211 samples/s/p 4:45:42 } +2024-07-25 20:23:38,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1362/ 1625], loss: 1.262, per_step_time: 1473ms, lr: 2.7118065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:38,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.42889 samples/s/p 4:45:49 } +2024-07-25 20:23:41,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1364/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 2.7114334e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:41,070 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 28.4% |██████████████ | 5.43128 samples/s/p 4:45:39 } +2024-07-25 20:23:44,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1366/ 1625], loss: 1.283, per_step_time: 1473ms, lr: 2.7110606e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:44,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.42849 samples/s/p 4:45:45 } +2024-07-25 20:23:46,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1368/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.7106873e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:46,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.43396 samples/s/p 4:45:24 } +2024-07-25 20:23:49,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1370/ 1625], loss: 1.202, per_step_time: 1481ms, lr: 2.7103139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:49,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.39975 samples/s/p 4:47:10 } +2024-07-25 20:23:52,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1372/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 2.70994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:52,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.43652 samples/s/p 4:45:10 } +2024-07-25 20:23:55,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1374/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.709566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:55,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43616 samples/s/p 4:45:09 } +2024-07-25 20:23:58,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 
10], step:[ 1376/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 2.7091919e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:58,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.42960 samples/s/p 4:45:26 } +2024-07-25 20:24:01,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1378/ 1625], loss: 1.026, per_step_time: 1471ms, lr: 2.7088177e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:01,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43577 samples/s/p 4:45:04 } +2024-07-25 20:24:04,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1380/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 2.7084432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:04,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.42934 samples/s/p 4:45:21 } +2024-07-25 20:24:07,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1382/ 1625], loss: 1.086, per_step_time: 1483ms, lr: 2.7080683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:07,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.39246 samples/s/p 4:47:15 } +2024-07-25 20:24:10,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1384/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.7076932e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:10,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43523 samples/s/p 4:44:57 } +2024-07-25 20:24:13,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1386/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.7073182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:13,582 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43615 samples/s/p 4:44:51 } +2024-07-25 20:24:16,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1388/ 1625], loss: 1.118, per_step_time: 1473ms, lr: 2.7069427e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:16,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.42979 samples/s/p 4:45:08 } +2024-07-25 20:24:19,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1390/ 1625], loss: 1.202, per_step_time: 1472ms, lr: 2.706567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:19,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43145 samples/s/p 4:45:00 } +2024-07-25 20:24:22,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1392/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 2.7061913e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:22,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.42894 samples/s/p 4:45:05 } +2024-07-25 20:24:25,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1394/ 1625], loss: 1.308, per_step_time: 1474ms, lr: 2.7058151e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:25,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.42508 samples/s/p 4:45:14 } +2024-07-25 20:24:28,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1396/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 2.705439e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:28,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43658 samples/s/p 4:44:35 } +2024-07-25 20:24:31,304 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1398/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 2.7050624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:31,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.42888 samples/s/p 4:44:56 } +2024-07-25 20:24:34,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1400/ 1625], loss: 1.187, per_step_time: 1470ms, lr: 2.7046857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:34,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.44024 samples/s/p 4:44:18 } +2024-07-25 20:24:37,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1402/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 2.7043088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:37,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43629 samples/s/p 4:44:27 } +2024-07-25 20:24:40,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1404/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 2.7039318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:40,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43615 samples/s/p 4:44:25 } +2024-07-25 20:24:43,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1406/ 1625], loss: 1.244, per_step_time: 1473ms, lr: 2.7035543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:43,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.42906 samples/s/p 4:44:44 } +2024-07-25 20:24:46,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1408/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 2.703177e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:24:46,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43307 samples/s/p 4:44:28 } +2024-07-25 20:24:49,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1410/ 1625], loss: 1.049, per_step_time: 1474ms, lr: 2.702799e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:49,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.42690 samples/s/p 4:44:45 } +2024-07-25 20:24:51,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1412/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 2.7024213e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:51,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43328 samples/s/p 4:44:22 } +2024-07-25 20:24:54,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1414/ 1625], loss: 1.319, per_step_time: 1471ms, lr: 2.702043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:54,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43780 samples/s/p 4:44:05 } +2024-07-25 20:24:57,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1416/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 2.7016647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:57,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43566 samples/s/p 4:44:08 } +2024-07-25 20:25:00,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1418/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.7012862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:00,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43760 samples/s/p 
4:43:59 } +2024-07-25 20:25:03,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1420/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 2.7009073e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:03,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43004 samples/s/p 4:44:20 } +2024-07-25 20:25:06,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1422/ 1625], loss: 1.319, per_step_time: 1472ms, lr: 2.7005282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:06,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43357 samples/s/p 4:44:06 } +2024-07-25 20:25:09,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1424/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 2.700149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:09,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43389 samples/s/p 4:44:02 } +2024-07-25 20:25:12,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1426/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.6997694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:12,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43798 samples/s/p 4:43:46 } +2024-07-25 20:25:15,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1428/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 2.6993897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:15,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43235 samples/s/p 4:44:01 } +2024-07-25 20:25:18,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1430/ 1625], loss: 1.155, 
per_step_time: 1471ms, lr: 2.69901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:18,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43568 samples/s/p 4:43:48 } +2024-07-25 20:25:21,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1432/ 1625], loss: 1.159, per_step_time: 1475ms, lr: 2.69863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:21,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.42176 samples/s/p 4:44:29 } +2024-07-25 20:25:24,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1434/ 1625], loss: 1.324, per_step_time: 1472ms, lr: 2.6982496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:24,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43435 samples/s/p 4:43:46 } +2024-07-25 20:25:27,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1436/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 2.697869e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:27,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.42812 samples/s/p 4:44:03 } +2024-07-25 20:25:30,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1438/ 1625], loss: 1.206, per_step_time: 1470ms, lr: 2.6974883e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:30,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.44066 samples/s/p 4:43:20 } +2024-07-25 20:25:33,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1440/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 2.6971074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:33,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 28.9% |██████████████ | 5.43301 samples/s/p 4:43:41 } +2024-07-25 20:25:36,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1442/ 1625], loss: 1.039, per_step_time: 1471ms, lr: 2.6967262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:36,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43750 samples/s/p 4:43:24 } +2024-07-25 20:25:39,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1444/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 2.6963447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:39,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43214 samples/s/p 4:43:38 } +2024-07-25 20:25:42,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1446/ 1625], loss: 1.299, per_step_time: 1472ms, lr: 2.6959635e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:42,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43295 samples/s/p 4:43:33 } +2024-07-25 20:25:45,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1448/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 2.6955817e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:45,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43567 samples/s/p 4:43:21 } +2024-07-25 20:25:48,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1450/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.6951997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:48,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43698 samples/s/p 4:43:14 } +2024-07-25 20:25:50,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], 
step:[ 1452/ 1625], loss: 1.267, per_step_time: 1470ms, lr: 2.6948175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:50,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43980 samples/s/p 4:43:02 } +2024-07-25 20:25:53,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1454/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 2.6944352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:53,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43777 samples/s/p 4:43:06 } +2024-07-25 20:25:56,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1456/ 1625], loss: 1.285, per_step_time: 1469ms, lr: 2.6940525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:56,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.44304 samples/s/p 4:42:46 } +2024-07-25 20:25:59,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1458/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.6936696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:59,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43255 samples/s/p 4:43:16 } +2024-07-25 20:26:02,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1460/ 1625], loss: 1.337, per_step_time: 1471ms, lr: 2.6932865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:02,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43580 samples/s/p 4:43:03 } +2024-07-25 20:26:05,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1462/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 2.6929032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:05,745 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43893 samples/s/p 4:42:50 } +2024-07-25 20:26:08,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1464/ 1625], loss: 1.191, per_step_time: 1474ms, lr: 2.69252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:08,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.42694 samples/s/p 4:43:25 } +2024-07-25 20:26:11,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1466/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 2.6921361e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:11,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.42980 samples/s/p 4:43:13 } +2024-07-25 20:26:14,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1468/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.6917522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:14,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43493 samples/s/p 4:42:54 } +2024-07-25 20:26:17,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1470/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 2.691368e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:17,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43415 samples/s/p 4:42:54 } +2024-07-25 20:26:20,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1472/ 1625], loss: 1.258, per_step_time: 1473ms, lr: 2.6909836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:20,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43099 samples/s/p 4:43:01 } +2024-07-25 20:26:23,460 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1474/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 2.6905991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:23,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43630 samples/s/p 4:42:41 } +2024-07-25 20:26:26,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1476/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 2.6902144e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:26,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43318 samples/s/p 4:42:48 } +2024-07-25 20:26:29,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1478/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 2.6898295e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:29,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43067 samples/s/p 4:42:53 } +2024-07-25 20:26:32,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1480/ 1625], loss: 1.109, per_step_time: 1469ms, lr: 2.6894442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:32,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.44314 samples/s/p 4:42:11 } +2024-07-25 20:26:35,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1482/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.689059e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:35,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43415 samples/s/p 4:42:36 } +2024-07-25 20:26:38,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1484/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 2.6886732e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:26:38,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43482 samples/s/p 4:42:31 } +2024-07-25 20:26:41,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1486/ 1625], loss: 1.278, per_step_time: 1470ms, lr: 2.6882875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:41,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43969 samples/s/p 4:42:13 } +2024-07-25 20:26:44,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1488/ 1625], loss: 1.294, per_step_time: 1472ms, lr: 2.6879015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:44,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43370 samples/s/p 4:42:29 } +2024-07-25 20:26:47,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1490/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 2.6875154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:47,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43446 samples/s/p 4:42:23 } +2024-07-25 20:26:50,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1492/ 1625], loss: 1.266, per_step_time: 1473ms, lr: 2.687129e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:50,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.42972 samples/s/p 4:42:35 } +2024-07-25 20:26:52,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1494/ 1625], loss: 1.088, per_step_time: 1471ms, lr: 2.6867421e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:52,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43653 samples/s/p 
4:42:11 } +2024-07-25 20:26:55,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1496/ 1625], loss: 1.056, per_step_time: 1470ms, lr: 2.6863554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:55,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43937 samples/s/p 4:41:59 } +2024-07-25 20:26:58,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1498/ 1625], loss: 1.029, per_step_time: 1472ms, lr: 2.6859683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:58,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43436 samples/s/p 4:42:12 } +2024-07-25 20:27:01,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1500/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 2.685581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:01,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43643 samples/s/p 4:42:02 } +2024-07-25 20:27:04,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1502/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 2.6851938e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:04,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43744 samples/s/p 4:41:56 } +2024-07-25 20:27:07,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1504/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 2.6848062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:07,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43405 samples/s/p 4:42:04 } +2024-07-25 20:27:10,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1506/ 1625], loss: 1.120, 
per_step_time: 1471ms, lr: 2.6844182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:10,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43551 samples/s/p 4:41:56 } +2024-07-25 20:27:13,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1508/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 2.68403e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:13,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43669 samples/s/p 4:41:50 } +2024-07-25 20:27:16,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1510/ 1625], loss: 1.010, per_step_time: 1473ms, lr: 2.6836418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:16,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.42908 samples/s/p 4:42:11 } +2024-07-25 20:27:19,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1512/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 2.6832533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:19,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43069 samples/s/p 4:42:03 } +2024-07-25 20:27:22,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1514/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 2.6828646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:22,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43530 samples/s/p 4:41:45 } +2024-07-25 20:27:25,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1516/ 1625], loss: 1.383, per_step_time: 1469ms, lr: 2.6824755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:25,425 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 29.3% |██████████████ | 5.44243 samples/s/p 4:41:20 } +2024-07-25 20:27:28,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1518/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.6820864e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:28,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43816 samples/s/p 4:41:30 } +2024-07-25 20:27:31,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1520/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 2.6816972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:31,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.43267 samples/s/p 4:41:45 } +2024-07-25 20:27:34,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1522/ 1625], loss: 1.282, per_step_time: 1474ms, lr: 2.6813075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:34,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.42545 samples/s/p 4:42:04 } +2024-07-25 20:27:37,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1524/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 2.6809177e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:37,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.42854 samples/s/p 4:41:52 } +2024-07-25 20:27:40,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1526/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.6805277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:40,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.43313 samples/s/p 4:41:34 } +2024-07-25 20:27:43,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 
10], step:[ 1528/ 1625], loss: 1.012, per_step_time: 1470ms, lr: 2.6801375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:43,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.44003 samples/s/p 4:41:10 } +2024-07-25 20:27:46,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1530/ 1625], loss: 1.238, per_step_time: 1473ms, lr: 2.679747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:46,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.42864 samples/s/p 4:41:42 } +2024-07-25 20:27:49,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1532/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 2.6793565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:49,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.43451 samples/s/p 4:41:21 } +2024-07-25 20:27:51,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1534/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 2.6789658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:51,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.43480 samples/s/p 4:41:17 } +2024-07-25 20:27:54,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1536/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 2.6785747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:54,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43244 samples/s/p 4:41:22 } +2024-07-25 20:27:57,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1538/ 1625], loss: 1.277, per_step_time: 1474ms, lr: 2.6781836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:57,904 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.42462 samples/s/p 4:41:43 } +2024-07-25 20:28:00,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1540/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.6777923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:00,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43689 samples/s/p 4:41:02 } +2024-07-25 20:28:03,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1542/ 1625], loss: 1.245, per_step_time: 1470ms, lr: 2.6774005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:03,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43936 samples/s/p 4:40:51 } +2024-07-25 20:28:06,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1544/ 1625], loss: 1.035, per_step_time: 1471ms, lr: 2.6770087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:06,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43814 samples/s/p 4:40:52 } +2024-07-25 20:28:09,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1546/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 2.6766167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:09,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43280 samples/s/p 4:41:06 } +2024-07-25 20:28:12,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1548/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 2.6762244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:12,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43328 samples/s/p 4:41:02 } +2024-07-25 20:28:15,606 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1550/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 2.675832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:15,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43304 samples/s/p 4:40:59 } +2024-07-25 20:28:18,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1552/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 2.6754393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:18,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43765 samples/s/p 4:40:42 } +2024-07-25 20:28:21,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1554/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 2.6750464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:21,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.42876 samples/s/p 4:41:07 } +2024-07-25 20:28:24,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1556/ 1625], loss: 1.202, per_step_time: 1470ms, lr: 2.6746531e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:24,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43908 samples/s/p 4:40:32 } +2024-07-25 20:28:27,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1558/ 1625], loss: 1.379, per_step_time: 1471ms, lr: 2.67426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:27,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43599 samples/s/p 4:40:38 } +2024-07-25 20:28:30,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1560/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 2.6738662e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:28:30,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43797 samples/s/p 4:40:29 } +2024-07-25 20:28:33,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1562/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 2.6734724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:33,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43918 samples/s/p 4:40:23 } +2024-07-25 20:28:36,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1564/ 1625], loss: 1.164, per_step_time: 1470ms, lr: 2.6730788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:36,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.44047 samples/s/p 4:40:16 } +2024-07-25 20:28:39,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1566/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 2.6726846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:39,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43579 samples/s/p 4:40:27 } +2024-07-25 20:28:42,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1568/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 2.67229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:42,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43800 samples/s/p 4:40:17 } +2024-07-25 20:28:45,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1570/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 2.6718957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:45,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43403 samples/s/p 
4:40:27 } +2024-07-25 20:28:48,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1572/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.671501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:48,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43158 samples/s/p 4:40:31 } +2024-07-25 20:28:51,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1574/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 2.6711057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:51,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43602 samples/s/p 4:40:15 } +2024-07-25 20:28:53,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1576/ 1625], loss: 1.196, per_step_time: 1474ms, lr: 2.6707106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:53,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.42666 samples/s/p 4:40:41 } +2024-07-25 20:28:56,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1578/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 2.6703154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:56,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43931 samples/s/p 4:39:59 } +2024-07-25 20:28:59,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1580/ 1625], loss: 1.318, per_step_time: 1471ms, lr: 2.6699196e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:59,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43534 samples/s/p 4:40:08 } +2024-07-25 20:29:02,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1582/ 1625], loss: 1.154, 
per_step_time: 1470ms, lr: 2.6695237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:02,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.44132 samples/s/p 4:39:47 } +2024-07-25 20:29:05,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1584/ 1625], loss: 1.021, per_step_time: 1470ms, lr: 2.669128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:05,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.44045 samples/s/p 4:39:46 } +2024-07-25 20:29:08,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1586/ 1625], loss: 1.047, per_step_time: 1471ms, lr: 2.6687318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:08,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43509 samples/s/p 4:40:00 } +2024-07-25 20:29:11,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1588/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.6683352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:11,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43556 samples/s/p 4:39:56 } +2024-07-25 20:29:14,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1590/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.6679389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:14,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43778 samples/s/p 4:39:46 } +2024-07-25 20:29:17,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1592/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.667542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:17,563 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 29.8% |██████████████ | 5.43398 samples/s/p 4:39:55 } +2024-07-25 20:29:20,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1594/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 2.667145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:20,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43154 samples/s/p 4:39:59 } +2024-07-25 20:29:23,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1596/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 2.6667478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:23,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43288 samples/s/p 4:39:52 } +2024-07-25 20:29:26,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1598/ 1625], loss: 1.318, per_step_time: 1471ms, lr: 2.6663502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:26,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43538 samples/s/p 4:39:41 } +2024-07-25 20:29:29,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1600/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 2.6659527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:29,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43813 samples/s/p 4:39:30 } +2024-07-25 20:29:32,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1602/ 1625], loss: 1.137, per_step_time: 1473ms, lr: 2.6655547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:32,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43065 samples/s/p 4:39:50 } +2024-07-25 20:29:35,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 
10], step:[ 1604/ 1625], loss: 1.150, per_step_time: 1481ms, lr: 2.6651567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:35,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.39854 samples/s/p 4:41:27 } +2024-07-25 20:29:38,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1606/ 1625], loss: 1.109, per_step_time: 1473ms, lr: 2.6647582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:38,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.42775 samples/s/p 4:39:53 } +2024-07-25 20:29:41,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1608/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.66436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:41,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43321 samples/s/p 4:39:33 } +2024-07-25 20:29:44,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1610/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 2.6639615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:44,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43546 samples/s/p 4:39:23 } +2024-07-25 20:29:47,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1612/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 2.6635624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:47,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43797 samples/s/p 4:39:13 } +2024-07-25 20:29:50,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1614/ 1625], loss: 1.079, per_step_time: 1472ms, lr: 2.6631631e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:50,051 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43179 samples/s/p 4:39:29 } +2024-07-25 20:29:53,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1616/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 2.6627638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:53,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43309 samples/s/p 4:39:22 } +2024-07-25 20:29:55,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1618/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 2.6623644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:55,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.43771 samples/s/p 4:39:05 } +2024-07-25 20:29:58,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1620/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 2.6619646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:58,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.43289 samples/s/p 4:39:17 } +2024-07-25 20:30:01,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1622/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 2.6615648e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:01,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.43304 samples/s/p 4:39:13 } +2024-07-25 20:30:04,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1624/ 1625], loss: 1.268, per_step_time: 1471ms, lr: 2.661165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:04,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.43738 samples/s/p 4:38:57 } +2024-07-25 20:30:07,756 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 2.6607646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:07,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.43486 samples/s/p 4:39:02 } +2024-07-25 20:30:10,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 3/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.660364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:10,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.43797 samples/s/p 4:38:49 } +2024-07-25 20:30:13,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 5/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 2.6599633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:13,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.43808 samples/s/p 4:38:46 } +2024-07-25 20:30:16,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 7/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 2.6595622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:16,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.44002 samples/s/p 4:38:37 } +2024-07-25 20:30:19,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 9/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.6591613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:19,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43543 samples/s/p 4:38:48 } +2024-07-25 20:30:22,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 11/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 2.6587599e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 20:30:22,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43776 samples/s/p 4:38:38 } +2024-07-25 20:30:25,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 13/ 1625], loss: 1.118, per_step_time: 1473ms, lr: 2.6583582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:25,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.42896 samples/s/p 4:39:02 } +2024-07-25 20:30:28,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 15/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 2.6579564e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:28,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43750 samples/s/p 4:38:33 } +2024-07-25 20:30:31,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 17/ 1625], loss: 1.201, per_step_time: 1471ms, lr: 2.6575546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:31,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43538 samples/s/p 4:38:37 } +2024-07-25 20:30:34,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 19/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.6571523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:34,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43315 samples/s/p 4:38:41 } +2024-07-25 20:30:37,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 21/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.6567499e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:37,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43793 samples/s/p 4:38:23 } 
+2024-07-25 20:30:40,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 23/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 2.6563475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:40,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43352 samples/s/p 4:38:34 } +2024-07-25 20:30:43,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 25/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 2.6559446e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:43,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43247 samples/s/p 4:38:34 } +2024-07-25 20:30:46,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 27/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 2.6555417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:46,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43550 samples/s/p 4:38:22 } +2024-07-25 20:30:49,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 29/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 2.6551385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:49,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43497 samples/s/p 4:38:20 } +2024-07-25 20:30:52,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 31/ 1625], loss: 1.000, per_step_time: 1470ms, lr: 2.654735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:52,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43875 samples/s/p 4:38:06 } +2024-07-25 20:30:54,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 33/ 1625], loss: 0.991, per_step_time: 1471ms, lr: 
2.6543314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:54,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43816 samples/s/p 4:38:05 } +2024-07-25 20:30:57,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 35/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.6539275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:57,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43454 samples/s/p 4:38:13 } +2024-07-25 20:31:00,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 37/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.6535236e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:00,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43427 samples/s/p 4:38:11 } +2024-07-25 20:31:03,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 39/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 2.6531194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:03,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43499 samples/s/p 4:38:05 } +2024-07-25 20:31:06,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 41/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.652715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:06,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43256 samples/s/p 4:38:10 } +2024-07-25 20:31:09,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 43/ 1625], loss: 1.054, per_step_time: 1473ms, lr: 2.6523103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:09,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 
5.42944 samples/s/p 4:38:17 } +2024-07-25 20:31:12,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 45/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.6519056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:12,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43567 samples/s/p 4:37:55 } +2024-07-25 20:31:15,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 47/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 2.6515005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:15,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43528 samples/s/p 4:37:53 } +2024-07-25 20:31:18,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 49/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 2.6510952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:18,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43156 samples/s/p 4:38:01 } +2024-07-25 20:31:21,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 51/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 2.6506901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:21,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43592 samples/s/p 4:37:45 } +2024-07-25 20:31:24,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 53/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 2.6502841e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:24,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43896 samples/s/p 4:37:33 } +2024-07-25 20:31:27,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 55/ 1625], loss: 1.330, 
per_step_time: 1473ms, lr: 2.6498787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:27,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43051 samples/s/p 4:37:56 } +2024-07-25 20:31:30,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 57/ 1625], loss: 1.054, per_step_time: 1472ms, lr: 2.6494725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:30,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43335 samples/s/p 4:37:44 } +2024-07-25 20:31:33,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 59/ 1625], loss: 1.363, per_step_time: 1472ms, lr: 2.6490663e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:33,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43253 samples/s/p 4:37:44 } +2024-07-25 20:31:36,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 61/ 1625], loss: 1.154, per_step_time: 1470ms, lr: 2.64866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:36,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.44135 samples/s/p 4:37:14 } +2024-07-25 20:31:39,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 63/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.6482532e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:39,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43261 samples/s/p 4:37:37 } +2024-07-25 20:31:42,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 65/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 2.6478463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:42,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
30.4% |███████████████ | 5.43631 samples/s/p 4:37:23 } +2024-07-25 20:31:45,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 67/ 1625], loss: 1.040, per_step_time: 1473ms, lr: 2.6474394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:45,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43043 samples/s/p 4:37:38 } +2024-07-25 20:31:48,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 69/ 1625], loss: 0.995, per_step_time: 1470ms, lr: 2.6470321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:48,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43911 samples/s/p 4:37:09 } +2024-07-25 20:31:51,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 71/ 1625], loss: 1.243, per_step_time: 1470ms, lr: 2.6466245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:51,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.44175 samples/s/p 4:36:58 } +2024-07-25 20:31:53,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 73/ 1625], loss: 0.988, per_step_time: 1470ms, lr: 2.6462169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:53,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.44019 samples/s/p 4:37:00 } +2024-07-25 20:31:56,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 75/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 2.645809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:56,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43830 samples/s/p 4:37:02 } +2024-07-25 20:31:59,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 
77/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 2.645401e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:59,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43644 samples/s/p 4:37:05 } +2024-07-25 20:32:02,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 79/ 1625], loss: 1.144, per_step_time: 1472ms, lr: 2.6449929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:02,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43285 samples/s/p 4:37:13 } +2024-07-25 20:32:05,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 81/ 1625], loss: 1.022, per_step_time: 1472ms, lr: 2.6445841e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:05,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43236 samples/s/p 4:37:12 } +2024-07-25 20:32:08,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 83/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.6441756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:08,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43829 samples/s/p 4:36:51 } +2024-07-25 20:32:11,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 85/ 1625], loss: 0.944, per_step_time: 1471ms, lr: 2.6437665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:11,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43483 samples/s/p 4:36:58 } +2024-07-25 20:32:14,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 87/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 2.6433578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:14,635 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43463 samples/s/p 4:36:56 } +2024-07-25 20:32:17,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 89/ 1625], loss: 0.988, per_step_time: 1472ms, lr: 2.6429483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:17,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43377 samples/s/p 4:36:56 } +2024-07-25 20:32:20,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 91/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 2.642539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:20,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43672 samples/s/p 4:36:44 } +2024-07-25 20:32:23,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 93/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 2.6421292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:23,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43369 samples/s/p 4:36:50 } +2024-07-25 20:32:26,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 95/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.6417194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:26,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43810 samples/s/p 4:36:34 } +2024-07-25 20:32:29,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 97/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 2.6413092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:29,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43379 samples/s/p 4:36:44 } +2024-07-25 20:32:32,340 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 99/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 2.640899e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:32,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43658 samples/s/p 4:36:32 } +2024-07-25 20:32:35,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 101/ 1625], loss: 1.247, per_step_time: 1469ms, lr: 2.6404885e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:35,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.44239 samples/s/p 4:36:12 } +2024-07-25 20:32:38,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 103/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.640078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:38,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43328 samples/s/p 4:36:36 } +2024-07-25 20:32:41,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 105/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 2.639667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:41,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43153 samples/s/p 4:36:39 } +2024-07-25 20:32:44,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 107/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 2.639256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:44,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43800 samples/s/p 4:36:16 } +2024-07-25 20:32:47,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 109/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.6388447e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:32:47,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43626 samples/s/p 4:36:19 } +2024-07-25 20:32:50,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 111/ 1625], loss: 1.150, per_step_time: 1469ms, lr: 2.6384332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:50,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.44274 samples/s/p 4:35:56 } +2024-07-25 20:32:52,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 113/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 2.6380214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:52,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43714 samples/s/p 4:36:10 } +2024-07-25 20:32:55,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 115/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.6376096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:55,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43180 samples/s/p 4:36:23 } +2024-07-25 20:32:58,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 117/ 1625], loss: 1.172, per_step_time: 1474ms, lr: 2.6371974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:58,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.42541 samples/s/p 4:36:40 } +2024-07-25 20:33:01,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 119/ 1625], loss: 1.298, per_step_time: 1474ms, lr: 2.6367852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:01,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.42513 samples/s/p 
4:36:38 } +2024-07-25 20:33:04,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 121/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 2.6363727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:04,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43432 samples/s/p 4:36:07 } +2024-07-25 20:33:07,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 123/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 2.63596e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:07,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43876 samples/s/p 4:35:50 } +2024-07-25 20:33:10,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 125/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 2.635547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:10,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43631 samples/s/p 4:35:55 } +2024-07-25 20:33:13,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 127/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 2.635134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:13,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43152 samples/s/p 4:36:06 } +2024-07-25 20:33:16,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 129/ 1625], loss: 1.027, per_step_time: 1470ms, lr: 2.6347207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:16,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.44062 samples/s/p 4:35:36 } +2024-07-25 20:33:19,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 131/ 1625], loss: 1.065, per_step_time: 
1471ms, lr: 2.6343072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:19,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43619 samples/s/p 4:35:46 } +2024-07-25 20:33:22,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 133/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.6338936e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:22,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43739 samples/s/p 4:35:40 } +2024-07-25 20:33:25,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 135/ 1625], loss: 1.212, per_step_time: 1473ms, lr: 2.6334796e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:25,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43007 samples/s/p 4:35:59 } +2024-07-25 20:33:28,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 137/ 1625], loss: 1.146, per_step_time: 1470ms, lr: 2.6330656e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:28,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43882 samples/s/p 4:35:30 } +2024-07-25 20:33:31,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 139/ 1625], loss: 1.209, per_step_time: 1474ms, lr: 2.632651e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:31,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.42519 samples/s/p 4:36:08 } +2024-07-25 20:33:34,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 141/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 2.6322365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:34,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% 
|███████████████ | 5.43777 samples/s/p 4:35:27 } +2024-07-25 20:33:37,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 143/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 2.6318221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:37,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43691 samples/s/p 4:35:27 } +2024-07-25 20:33:40,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 145/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 2.631407e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:40,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43134 samples/s/p 4:35:41 } +2024-07-25 20:33:43,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 147/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 2.6309921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:43,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43456 samples/s/p 4:35:28 } +2024-07-25 20:33:46,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 149/ 1625], loss: 1.344, per_step_time: 1471ms, lr: 2.6305768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:46,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43597 samples/s/p 4:35:21 } +2024-07-25 20:33:49,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 151/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.6301614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:49,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43835 samples/s/p 4:35:10 } +2024-07-25 20:33:52,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 
153/ 1625], loss: 1.080, per_step_time: 1469ms, lr: 2.6297457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:52,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.44317 samples/s/p 4:34:53 } +2024-07-25 20:33:54,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 155/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 2.6293299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:54,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.43913 samples/s/p 4:35:02 } +2024-07-25 20:33:57,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 157/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 2.6289135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:57,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.43993 samples/s/p 4:34:57 } +2024-07-25 20:34:00,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 159/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.6284974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:00,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.43645 samples/s/p 4:35:04 } +2024-07-25 20:34:03,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 161/ 1625], loss: 1.036, per_step_time: 1472ms, lr: 2.6280808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:03,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.43137 samples/s/p 4:35:17 } +2024-07-25 20:34:06,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 163/ 1625], loss: 1.125, per_step_time: 1474ms, lr: 2.6276643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:06,769 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.42432 samples/s/p 4:35:35 } +2024-07-25 20:34:09,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 165/ 1625], loss: 1.003, per_step_time: 1470ms, lr: 2.6272473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:09,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.43954 samples/s/p 4:34:46 } +2024-07-25 20:34:12,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 167/ 1625], loss: 1.246, per_step_time: 1474ms, lr: 2.6268302e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:12,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.42413 samples/s/p 4:35:30 } +2024-07-25 20:34:15,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 169/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 2.6264128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:15,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.42858 samples/s/p 4:35:14 } +2024-07-25 20:34:18,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 171/ 1625], loss: 1.268, per_step_time: 1471ms, lr: 2.6259953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:18,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43540 samples/s/p 4:34:50 } +2024-07-25 20:34:21,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 173/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 2.6255777e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:21,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43483 samples/s/p 4:34:49 } +2024-07-25 20:34:24,483 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 175/ 1625], loss: 1.049, per_step_time: 1473ms, lr: 2.6251599e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:24,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43091 samples/s/p 4:34:58 } +2024-07-25 20:34:27,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 177/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 2.624742e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:27,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43528 samples/s/p 4:34:41 } +2024-07-25 20:34:30,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 179/ 1625], loss: 1.231, per_step_time: 1473ms, lr: 2.6243237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:30,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.42999 samples/s/p 4:34:55 } +2024-07-25 20:34:33,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 181/ 1625], loss: 1.385, per_step_time: 1471ms, lr: 2.6239051e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:33,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43594 samples/s/p 4:34:34 } +2024-07-25 20:34:36,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 183/ 1625], loss: 1.328, per_step_time: 1471ms, lr: 2.6234866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:36,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43806 samples/s/p 4:34:24 } +2024-07-25 20:34:39,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 185/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.6230677e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:34:39,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43127 samples/s/p 4:34:42 } +2024-07-25 20:34:42,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 187/ 1625], loss: 1.128, per_step_time: 1474ms, lr: 2.6226486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:42,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.42594 samples/s/p 4:34:55 } +2024-07-25 20:34:45,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 189/ 1625], loss: 1.125, per_step_time: 1469ms, lr: 2.6222293e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:45,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.44472 samples/s/p 4:33:55 } +2024-07-25 20:34:48,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 191/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 2.6218097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:48,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.43268 samples/s/p 4:34:29 } +2024-07-25 20:34:51,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 193/ 1625], loss: 1.006, per_step_time: 1473ms, lr: 2.6213902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:51,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.43085 samples/s/p 4:34:31 } +2024-07-25 20:34:54,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 195/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 2.6209704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:54,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.43340 samples/s/p 
4:34:21 } +2024-07-25 20:34:56,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 197/ 1625], loss: 1.094, per_step_time: 1473ms, lr: 2.6205502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:56,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.42820 samples/s/p 4:34:33 } +2024-07-25 20:34:59,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 199/ 1625], loss: 1.157, per_step_time: 1474ms, lr: 2.6201298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:59,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.42489 samples/s/p 4:34:41 } +2024-07-25 20:35:02,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 201/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 2.6197094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:02,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.43087 samples/s/p 4:34:19 } +2024-07-25 20:35:05,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 203/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 2.6192887e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:05,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.42938 samples/s/p 4:34:21 } +2024-07-25 20:35:08,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 205/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 2.618868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:08,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43585 samples/s/p 4:33:58 } +2024-07-25 20:35:11,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 207/ 1625], loss: 1.182, per_step_time: 
1471ms, lr: 2.618447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:11,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43583 samples/s/p 4:33:56 } +2024-07-25 20:35:14,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 209/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.6180256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:14,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43777 samples/s/p 4:33:47 } +2024-07-25 20:35:17,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 211/ 1625], loss: 1.353, per_step_time: 1471ms, lr: 2.6176042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:17,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43626 samples/s/p 4:33:48 } +2024-07-25 20:35:20,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 213/ 1625], loss: 1.308, per_step_time: 1470ms, lr: 2.6171825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:20,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.44033 samples/s/p 4:33:33 } +2024-07-25 20:35:23,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 215/ 1625], loss: 1.295, per_step_time: 1472ms, lr: 2.6167607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:23,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43452 samples/s/p 4:33:48 } +2024-07-25 20:35:26,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 217/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.6163387e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:26,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% 
|███████████████ | 5.43247 samples/s/p 4:33:51 } +2024-07-25 20:35:29,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 219/ 1625], loss: 1.017, per_step_time: 1471ms, lr: 2.6159165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:29,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43642 samples/s/p 4:33:36 } +2024-07-25 20:35:32,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 221/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 2.615494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:32,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43654 samples/s/p 4:33:33 } +2024-07-25 20:35:35,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 223/ 1625], loss: 0.978, per_step_time: 1471ms, lr: 2.6150716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:35,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43801 samples/s/p 4:33:25 } +2024-07-25 20:35:38,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 225/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 2.6146485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:38,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43079 samples/s/p 4:33:44 } +2024-07-25 20:35:41,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 227/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 2.6142256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:41,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43833 samples/s/p 4:33:19 } +2024-07-25 20:35:44,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 
229/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 2.6138026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:44,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43673 samples/s/p 4:33:21 } +2024-07-25 20:35:47,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 231/ 1625], loss: 1.146, per_step_time: 1470ms, lr: 2.613379e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:47,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43858 samples/s/p 4:33:12 } +2024-07-25 20:35:50,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 233/ 1625], loss: 1.043, per_step_time: 1472ms, lr: 2.6129554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:50,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43241 samples/s/p 4:33:28 } +2024-07-25 20:35:53,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 235/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.6125317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:53,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43665 samples/s/p 4:33:12 } +2024-07-25 20:35:55,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 237/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 2.6121077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:55,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43622 samples/s/p 4:33:10 } +2024-07-25 20:35:58,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 239/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.6116835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:58,928 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43514 samples/s/p 4:33:11 } +2024-07-25 20:36:01,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 241/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.611259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:01,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43686 samples/s/p 4:33:02 } +2024-07-25 20:36:04,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 243/ 1625], loss: 1.141, per_step_time: 1473ms, lr: 2.6108346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:04,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.42933 samples/s/p 4:33:22 } +2024-07-25 20:36:07,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 245/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 2.6104097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:07,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43599 samples/s/p 4:32:59 } +2024-07-25 20:36:10,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 247/ 1625], loss: 1.326, per_step_time: 1472ms, lr: 2.6099848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:10,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43204 samples/s/p 4:33:08 } +2024-07-25 20:36:13,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 249/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 2.6095595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:13,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.44016 samples/s/p 4:32:41 } +2024-07-25 20:36:16,633 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 251/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 2.6091344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:16,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43570 samples/s/p 4:32:51 } +2024-07-25 20:36:19,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 253/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 2.6087086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:19,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43721 samples/s/p 4:32:44 } +2024-07-25 20:36:22,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 255/ 1625], loss: 1.192, per_step_time: 1475ms, lr: 2.608283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:22,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.42322 samples/s/p 4:33:23 } +2024-07-25 20:36:25,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 257/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 2.607857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:25,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43841 samples/s/p 4:32:34 } +2024-07-25 20:36:28,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 259/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 2.6074307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:28,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.44070 samples/s/p 4:32:24 } +2024-07-25 20:36:31,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 261/ 1625], loss: 1.327, per_step_time: 1473ms, lr: 2.6070044e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:36:31,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43064 samples/s/p 4:32:52 } +2024-07-25 20:36:34,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 263/ 1625], loss: 1.043, per_step_time: 1473ms, lr: 2.6065778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:34,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.42792 samples/s/p 4:32:57 } +2024-07-25 20:36:37,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 265/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 2.6061514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:37,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43693 samples/s/p 4:32:27 } +2024-07-25 20:36:40,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 267/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 2.6057243e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:40,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43629 samples/s/p 4:32:26 } +2024-07-25 20:36:43,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 269/ 1625], loss: 1.081, per_step_time: 1469ms, lr: 2.6052974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:43,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.44233 samples/s/p 4:32:05 } +2024-07-25 20:36:46,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 271/ 1625], loss: 1.017, per_step_time: 1472ms, lr: 2.6048701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:46,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43115 samples/s/p 
4:32:36 } +2024-07-25 20:36:49,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 273/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.6044425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:49,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43685 samples/s/p 4:32:15 } +2024-07-25 20:36:52,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 275/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 2.6040148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:52,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43557 samples/s/p 4:32:16 } +2024-07-25 20:36:54,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 277/ 1625], loss: 1.050, per_step_time: 1469ms, lr: 2.6035868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:54,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.44266 samples/s/p 4:31:52 } +2024-07-25 20:36:57,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 279/ 1625], loss: 1.148, per_step_time: 1474ms, lr: 2.6031588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:57,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.42660 samples/s/p 4:32:37 } +2024-07-25 20:37:00,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 281/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.6027305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:00,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43400 samples/s/p 4:32:12 } +2024-07-25 20:37:03,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 283/ 1625], loss: 1.271, 
per_step_time: 1471ms, lr: 2.6023019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:03,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43492 samples/s/p 4:32:07 } +2024-07-25 20:37:06,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 285/ 1625], loss: 1.024, per_step_time: 1472ms, lr: 2.6018733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:06,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43404 samples/s/p 4:32:06 } +2024-07-25 20:37:09,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 287/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 2.6014444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:09,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43091 samples/s/p 4:32:13 } +2024-07-25 20:37:12,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 289/ 1625], loss: 1.329, per_step_time: 1470ms, lr: 2.6010153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:12,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43957 samples/s/p 4:31:44 } +2024-07-25 20:37:15,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 291/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 2.600586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:15,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.42994 samples/s/p 4:32:10 } +2024-07-25 20:37:18,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 293/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 2.6001566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:18,610 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 31.8% |███████████████ | 5.43262 samples/s/p 4:31:59 } +2024-07-25 20:37:21,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 295/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 2.599727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:21,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43560 samples/s/p 4:31:47 } +2024-07-25 20:37:24,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 297/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 2.5992971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:24,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43520 samples/s/p 4:31:45 } +2024-07-25 20:37:27,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 299/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.5988671e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:27,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43738 samples/s/p 4:31:36 } +2024-07-25 20:37:30,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 301/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.5984367e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:30,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43611 samples/s/p 4:31:36 } +2024-07-25 20:37:33,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 303/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 2.5980064e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:33,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43245 samples/s/p 4:31:44 } +2024-07-25 20:37:36,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 
10], step:[ 305/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 2.5975756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:36,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43583 samples/s/p 4:31:31 } +2024-07-25 20:37:39,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 307/ 1625], loss: 1.409, per_step_time: 1473ms, lr: 2.5971449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:39,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43032 samples/s/p 4:31:45 } +2024-07-25 20:37:42,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 309/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.596714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:42,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43649 samples/s/p 4:31:24 } +2024-07-25 20:37:45,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 311/ 1625], loss: 1.245, per_step_time: 1470ms, lr: 2.5962827e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:45,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43945 samples/s/p 4:31:12 } +2024-07-25 20:37:48,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 313/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 2.5958512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:48,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43583 samples/s/p 4:31:20 } +2024-07-25 20:37:51,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 315/ 1625], loss: 1.389, per_step_time: 1472ms, lr: 2.5954198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:51,068 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43425 samples/s/p 4:31:21 } +2024-07-25 20:37:54,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 317/ 1625], loss: 0.957, per_step_time: 1472ms, lr: 2.594988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:54,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.43476 samples/s/p 4:31:17 } +2024-07-25 20:37:56,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 319/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 2.594556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:56,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.43670 samples/s/p 4:31:08 } +2024-07-25 20:37:59,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 321/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 2.594124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:59,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.43021 samples/s/p 4:31:25 } +2024-07-25 20:38:02,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 323/ 1625], loss: 1.226, per_step_time: 1470ms, lr: 2.5936914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:02,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.44052 samples/s/p 4:30:51 } +2024-07-25 20:38:05,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 325/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 2.5932592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:05,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.43682 samples/s/p 4:30:59 } +2024-07-25 20:38:08,767 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 327/ 1625], loss: 1.130, per_step_time: 1470ms, lr: 2.5928262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:08,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.44196 samples/s/p 4:30:41 } +2024-07-25 20:38:11,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 329/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 2.5923935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:11,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.43250 samples/s/p 4:31:06 } +2024-07-25 20:38:14,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 331/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 2.5919602e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:14,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.43809 samples/s/p 4:30:46 } +2024-07-25 20:38:17,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 333/ 1625], loss: 1.221, per_step_time: 1469ms, lr: 2.591527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:17,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.44392 samples/s/p 4:30:26 } +2024-07-25 20:38:20,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 335/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 2.5910935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:20,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43360 samples/s/p 4:30:54 } +2024-07-25 20:38:23,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 337/ 1625], loss: 1.077, per_step_time: 1471ms, lr: 2.5906598e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:23,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43641 samples/s/p 4:30:43 } +2024-07-25 20:38:26,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 339/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 2.5902258e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:26,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43625 samples/s/p 4:30:40 } +2024-07-25 20:38:29,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 341/ 1625], loss: 1.068, per_step_time: 1473ms, lr: 2.5897916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:29,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43080 samples/s/p 4:30:53 } +2024-07-25 20:38:32,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 343/ 1625], loss: 0.974, per_step_time: 1470ms, lr: 2.5893574e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:32,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43958 samples/s/p 4:30:24 } +2024-07-25 20:38:35,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 345/ 1625], loss: 1.065, per_step_time: 1472ms, lr: 2.5889229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:35,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43418 samples/s/p 4:30:37 } +2024-07-25 20:38:38,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 347/ 1625], loss: 1.033, per_step_time: 1472ms, lr: 2.5884883e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:38,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 
5.43376 samples/s/p 4:30:36 } +2024-07-25 20:38:41,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 349/ 1625], loss: 1.139, per_step_time: 1473ms, lr: 2.5880534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:41,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.42967 samples/s/p 4:30:45 } +2024-07-25 20:38:44,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 351/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.5876187e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:44,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43551 samples/s/p 4:30:25 } +2024-07-25 20:38:47,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 353/ 1625], loss: 1.186, per_step_time: 1475ms, lr: 2.5871832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:47,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.42199 samples/s/p 4:31:02 } +2024-07-25 20:38:50,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 355/ 1625], loss: 1.323, per_step_time: 1472ms, lr: 2.5867479e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:50,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43333 samples/s/p 4:30:25 } +2024-07-25 20:38:53,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 357/ 1625], loss: 1.193, per_step_time: 1470ms, lr: 2.5863124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:53,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43965 samples/s/p 4:30:03 } +2024-07-25 20:38:55,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 359/ 1625], 
loss: 1.200, per_step_time: 1471ms, lr: 2.5858766e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:55,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43725 samples/s/p 4:30:08 } +2024-07-25 20:38:58,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 361/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 2.5854404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:58,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43549 samples/s/p 4:30:10 } +2024-07-25 20:39:01,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 363/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.5850044e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:01,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43532 samples/s/p 4:30:08 } +2024-07-25 20:39:04,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 365/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 2.5845678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:04,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43669 samples/s/p 4:30:01 } +2024-07-25 20:39:07,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 367/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 2.5841315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:07,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43659 samples/s/p 4:29:58 } +2024-07-25 20:39:10,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 369/ 1625], loss: 1.177, per_step_time: 1469ms, lr: 2.5836945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:10,732 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.44364 samples/s/p 4:29:34 } +2024-07-25 20:39:13,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 371/ 1625], loss: 1.035, per_step_time: 1472ms, lr: 2.5832576e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:13,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43345 samples/s/p 4:30:01 } +2024-07-25 20:39:16,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 373/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.5828205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:16,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43326 samples/s/p 4:29:59 } +2024-07-25 20:39:19,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 375/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.5823832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:19,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43272 samples/s/p 4:29:58 } +2024-07-25 20:39:22,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 377/ 1625], loss: 0.949, per_step_time: 1468ms, lr: 2.5819456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:22,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.44595 samples/s/p 4:29:15 } +2024-07-25 20:39:25,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 379/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 2.581508e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:25,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43066 samples/s/p 4:29:58 } +2024-07-25 20:39:28,436 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 381/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 2.58107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:28,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43584 samples/s/p 4:29:40 } +2024-07-25 20:39:31,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 383/ 1625], loss: 1.367, per_step_time: 1472ms, lr: 2.580632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:31,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43212 samples/s/p 4:29:48 } +2024-07-25 20:39:34,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 385/ 1625], loss: 1.238, per_step_time: 1470ms, lr: 2.5801935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:34,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.44031 samples/s/p 4:29:20 } +2024-07-25 20:39:37,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 387/ 1625], loss: 1.083, per_step_time: 1470ms, lr: 2.5797552e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:37,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.44149 samples/s/p 4:29:14 } +2024-07-25 20:39:40,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 389/ 1625], loss: 1.197, per_step_time: 1475ms, lr: 2.5793164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:40,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.42240 samples/s/p 4:30:08 } +2024-07-25 20:39:43,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 391/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 2.5788773e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:43,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43364 samples/s/p 4:29:31 } +2024-07-25 20:39:46,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 393/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 2.5784384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:46,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43508 samples/s/p 4:29:24 } +2024-07-25 20:39:49,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 395/ 1625], loss: 1.324, per_step_time: 1472ms, lr: 2.5779993e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:49,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43231 samples/s/p 4:29:29 } +2024-07-25 20:39:52,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 397/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 2.5775596e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:52,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43290 samples/s/p 4:29:25 } +2024-07-25 20:39:55,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 399/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 2.5771202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:55,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43340 samples/s/p 4:29:20 } +2024-07-25 20:39:57,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 401/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.5766803e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:57,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 
5.43135 samples/s/p 4:29:23 } +2024-07-25 20:40:00,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 403/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.5762403e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:00,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43283 samples/s/p 4:29:16 } +2024-07-25 20:40:03,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 405/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 2.5758001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:03,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43674 samples/s/p 4:29:02 } +2024-07-25 20:40:06,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 407/ 1625], loss: 1.285, per_step_time: 1473ms, lr: 2.57536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:06,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.42996 samples/s/p 4:29:19 } +2024-07-25 20:40:09,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 409/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.5749192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:09,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43705 samples/s/p 4:28:55 } +2024-07-25 20:40:12,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 411/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.5744786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:12,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43767 samples/s/p 4:28:50 } +2024-07-25 20:40:15,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 413/ 1625], 
loss: 1.131, per_step_time: 1473ms, lr: 2.5740377e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:15,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.42865 samples/s/p 4:29:14 } +2024-07-25 20:40:18,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 415/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 2.5735966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:18,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43772 samples/s/p 4:28:44 } +2024-07-25 20:40:21,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 417/ 1625], loss: 1.315, per_step_time: 1471ms, lr: 2.5731553e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:21,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43677 samples/s/p 4:28:44 } +2024-07-25 20:40:24,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 419/ 1625], loss: 1.196, per_step_time: 1470ms, lr: 2.5727139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:24,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43851 samples/s/p 4:28:36 } +2024-07-25 20:40:27,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 421/ 1625], loss: 1.060, per_step_time: 1472ms, lr: 2.572272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:27,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43318 samples/s/p 4:28:49 } +2024-07-25 20:40:30,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 423/ 1625], loss: 1.060, per_step_time: 1472ms, lr: 2.5718302e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:30,416 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43130 samples/s/p 4:28:51 } +2024-07-25 20:40:33,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 425/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.571388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:33,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43537 samples/s/p 4:28:36 } +2024-07-25 20:40:36,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 427/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 2.5709458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:36,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.42999 samples/s/p 4:28:49 } +2024-07-25 20:40:39,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 429/ 1625], loss: 1.340, per_step_time: 1471ms, lr: 2.5705032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:39,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43607 samples/s/p 4:28:28 } +2024-07-25 20:40:42,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 431/ 1625], loss: 1.210, per_step_time: 1474ms, lr: 2.5700607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:42,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.42686 samples/s/p 4:28:53 } +2024-07-25 20:40:45,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 433/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.5696178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:45,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43642 samples/s/p 4:28:21 } +2024-07-25 20:40:48,128 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 435/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.5691748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:48,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43212 samples/s/p 4:28:31 } +2024-07-25 20:40:51,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 437/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 2.5687315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:51,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43359 samples/s/p 4:28:24 } +2024-07-25 20:40:54,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 439/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 2.5682884e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:54,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43463 samples/s/p 4:28:18 } +2024-07-25 20:40:56,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 441/ 1625], loss: 1.161, per_step_time: 1470ms, lr: 2.5678448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:56,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43950 samples/s/p 4:28:00 } +2024-07-25 20:40:59,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 443/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.5674008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:59,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43832 samples/s/p 4:28:01 } +2024-07-25 20:41:02,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 445/ 1625], loss: 1.059, per_step_time: 1472ms, lr: 2.5669571e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:02,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43228 samples/s/p 4:28:16 } +2024-07-25 20:41:05,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 447/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 2.5665127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:05,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43588 samples/s/p 4:28:02 } +2024-07-25 20:41:08,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 449/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 2.5660685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:08,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43939 samples/s/p 4:27:49 } +2024-07-25 20:41:11,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 451/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 2.565624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:11,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43314 samples/s/p 4:28:04 } +2024-07-25 20:41:14,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 453/ 1625], loss: 1.221, per_step_time: 1470ms, lr: 2.5651794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:14,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43854 samples/s/p 4:27:46 } +2024-07-25 20:41:17,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 455/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 2.5647345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:17,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 
5.43499 samples/s/p 4:27:53 } +2024-07-25 20:41:20,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 457/ 1625], loss: 1.050, per_step_time: 1472ms, lr: 2.5642892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:20,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43224 samples/s/p 4:27:58 } +2024-07-25 20:41:23,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 459/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.563844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:23,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43717 samples/s/p 4:27:41 } +2024-07-25 20:41:26,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 461/ 1625], loss: 1.362, per_step_time: 1472ms, lr: 2.5633986e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:26,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43332 samples/s/p 4:27:49 } +2024-07-25 20:41:29,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 463/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 2.562953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:29,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43687 samples/s/p 4:27:36 } +2024-07-25 20:41:32,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 465/ 1625], loss: 1.100, per_step_time: 1470ms, lr: 2.5625071e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:32,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43993 samples/s/p 4:27:24 } +2024-07-25 20:41:35,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 467/ 1625], 
loss: 1.282, per_step_time: 1469ms, lr: 2.5620611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:35,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.44302 samples/s/p 4:27:12 } +2024-07-25 20:41:38,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 469/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 2.561615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:38,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43053 samples/s/p 4:27:46 } +2024-07-25 20:41:41,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 471/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 2.5611685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:41,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43524 samples/s/p 4:27:29 } +2024-07-25 20:41:44,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 473/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.5607218e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:44,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43496 samples/s/p 4:27:27 } +2024-07-25 20:41:47,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 475/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 2.560275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:47,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43210 samples/s/p 4:27:32 } +2024-07-25 20:41:50,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 477/ 1625], loss: 0.968, per_step_time: 1471ms, lr: 2.5598283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:50,086 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43773 samples/s/p 4:27:13 } +2024-07-25 20:41:53,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 479/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.559381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:53,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43300 samples/s/p 4:27:24 } +2024-07-25 20:41:55,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 481/ 1625], loss: 1.331, per_step_time: 1472ms, lr: 2.5589337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:55,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43285 samples/s/p 4:27:21 } +2024-07-25 20:41:58,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 483/ 1625], loss: 0.845, per_step_time: 1471ms, lr: 2.5584863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:58,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43521 samples/s/p 4:27:11 } +2024-07-25 20:42:01,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 485/ 1625], loss: 1.327, per_step_time: 1472ms, lr: 2.5580384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:01,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43396 samples/s/p 4:27:12 } +2024-07-25 20:42:04,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 487/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.5575904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:04,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43695 samples/s/p 4:27:00 } +2024-07-25 20:42:07,794 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 489/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 2.5571424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:07,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43435 samples/s/p 4:27:05 } +2024-07-25 20:42:10,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 491/ 1625], loss: 0.914, per_step_time: 1471ms, lr: 2.5566942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:10,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43796 samples/s/p 4:26:51 } +2024-07-25 20:42:13,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 493/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 2.5562456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:13,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43606 samples/s/p 4:26:54 } +2024-07-25 20:42:16,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 495/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.5557973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:16,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43381 samples/s/p 4:26:58 } +2024-07-25 20:42:19,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 497/ 1625], loss: 1.239, per_step_time: 1470ms, lr: 2.5553481e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:19,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.44070 samples/s/p 4:26:35 } +2024-07-25 20:42:22,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 499/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 2.5548994e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:22,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.43896 samples/s/p 4:26:37 } +2024-07-25 20:42:25,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 501/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 2.5544505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:25,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.43445 samples/s/p 4:26:47 } +2024-07-25 20:42:28,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 503/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.554001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:28,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.43944 samples/s/p 4:26:29 } +2024-07-25 20:42:31,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 505/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 2.5535512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:31,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.43251 samples/s/p 4:26:47 } +2024-07-25 20:42:34,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 507/ 1625], loss: 1.000, per_step_time: 1473ms, lr: 2.5531017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:34,347 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.42955 samples/s/p 4:26:53 } +2024-07-25 20:42:37,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 509/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 2.5526517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:37,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 
5.43201 samples/s/p 4:26:42 } +2024-07-25 20:42:40,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 511/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 2.5522017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:40,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.43520 samples/s/p 4:26:30 } +2024-07-25 20:42:43,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 513/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 2.5517515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:43,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43421 samples/s/p 4:26:30 } +2024-07-25 20:42:46,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 515/ 1625], loss: 1.039, per_step_time: 1471ms, lr: 2.5513009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:46,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43848 samples/s/p 4:26:15 } +2024-07-25 20:42:49,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 517/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 2.5508501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:49,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43337 samples/s/p 4:26:27 } +2024-07-25 20:42:52,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 519/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 2.5503994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:52,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43483 samples/s/p 4:26:19 } +2024-07-25 20:42:55,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 521/ 1625], 
loss: 1.062, per_step_time: 1483ms, lr: 2.5499483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:55,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.39334 samples/s/p 4:28:19 } +2024-07-25 20:42:57,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 523/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.5494972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:57,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43367 samples/s/p 4:26:17 } +2024-07-25 20:43:00,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 525/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 2.5490457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:00,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43301 samples/s/p 4:26:16 } +2024-07-25 20:43:03,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 527/ 1625], loss: 1.051, per_step_time: 1473ms, lr: 2.548594e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:03,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.42993 samples/s/p 4:26:22 } +2024-07-25 20:43:06,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 529/ 1625], loss: 1.331, per_step_time: 1470ms, lr: 2.5481426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:06,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43884 samples/s/p 4:25:53 } +2024-07-25 20:43:09,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 531/ 1625], loss: 1.348, per_step_time: 1471ms, lr: 2.5476902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:09,783 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43818 samples/s/p 4:25:52 } +2024-07-25 20:43:12,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 533/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.5472384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:12,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43647 samples/s/p 4:25:54 } +2024-07-25 20:43:15,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 535/ 1625], loss: 1.051, per_step_time: 1470ms, lr: 2.5467862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:15,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43973 samples/s/p 4:25:41 } +2024-07-25 20:43:18,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 537/ 1625], loss: 1.013, per_step_time: 1471ms, lr: 2.5463336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:18,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43603 samples/s/p 4:25:49 } +2024-07-25 20:43:21,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 539/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 2.5458809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:21,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43621 samples/s/p 4:25:46 } +2024-07-25 20:43:24,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 541/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.545428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:24,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43356 samples/s/p 4:25:51 } +2024-07-25 20:43:27,482 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 543/ 1625], loss: 1.039, per_step_time: 1470ms, lr: 2.544975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:27,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43911 samples/s/p 4:25:32 } +2024-07-25 20:43:30,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 545/ 1625], loss: 1.357, per_step_time: 1473ms, lr: 2.5445217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:30,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.42828 samples/s/p 4:26:00 } +2024-07-25 20:43:33,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 547/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 2.5440682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:33,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43283 samples/s/p 4:25:44 } +2024-07-25 20:43:36,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 549/ 1625], loss: 1.143, per_step_time: 1473ms, lr: 2.5436146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:36,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.42996 samples/s/p 4:25:50 } +2024-07-25 20:43:39,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 551/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 2.543161e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:39,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43588 samples/s/p 4:25:29 } +2024-07-25 20:43:42,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 553/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.5427067e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:42,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43105 samples/s/p 4:25:40 } +2024-07-25 20:43:45,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 555/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.5422527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:45,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43785 samples/s/p 4:25:18 } +2024-07-25 20:43:48,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 557/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 2.5417983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:48,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43470 samples/s/p 4:25:24 } +2024-07-25 20:43:51,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 559/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 2.5413437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:51,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43018 samples/s/p 4:25:34 } +2024-07-25 20:43:54,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 561/ 1625], loss: 1.231, per_step_time: 1469ms, lr: 2.540889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:54,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.44331 samples/s/p 4:24:53 } +2024-07-25 20:43:57,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 563/ 1625], loss: 1.052, per_step_time: 1474ms, lr: 2.540434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:57,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 
5.42671 samples/s/p 4:25:38 } +2024-07-25 20:43:59,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 565/ 1625], loss: 1.249, per_step_time: 1471ms, lr: 2.5399791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:59,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.43565 samples/s/p 4:25:09 } +2024-07-25 20:44:02,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 567/ 1625], loss: 1.009, per_step_time: 1473ms, lr: 2.5395238e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:02,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.42916 samples/s/p 4:25:25 } +2024-07-25 20:44:05,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 569/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.5390684e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:05,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.43428 samples/s/p 4:25:07 } +2024-07-25 20:44:08,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 571/ 1625], loss: 1.050, per_step_time: 1470ms, lr: 2.5386127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:08,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.44031 samples/s/p 4:24:47 } +2024-07-25 20:44:11,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 573/ 1625], loss: 1.245, per_step_time: 1471ms, lr: 2.5381569e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:11,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.43550 samples/s/p 4:24:58 } +2024-07-25 20:44:14,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 575/ 1625], 
loss: 1.235, per_step_time: 1472ms, lr: 2.5377009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:14,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.43329 samples/s/p 4:25:01 } +2024-07-25 20:44:17,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 577/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 2.5372448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:17,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43781 samples/s/p 4:24:45 } +2024-07-25 20:44:20,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 579/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 2.5367885e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:20,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.44026 samples/s/p 4:24:35 } +2024-07-25 20:44:23,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 581/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.5363319e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:23,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43516 samples/s/p 4:24:47 } +2024-07-25 20:44:26,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 583/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.5358753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:26,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43380 samples/s/p 4:24:48 } +2024-07-25 20:44:29,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 585/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 2.5354186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:29,459 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43525 samples/s/p 4:24:41 } +2024-07-25 20:44:32,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 587/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 2.5349613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:32,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43255 samples/s/p 4:24:46 } +2024-07-25 20:44:35,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 589/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.5345042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:35,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43239 samples/s/p 4:24:43 } +2024-07-25 20:44:38,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 591/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 2.5340469e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:38,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43123 samples/s/p 4:24:44 } +2024-07-25 20:44:41,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 593/ 1625], loss: 1.069, per_step_time: 1473ms, lr: 2.533589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:41,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43022 samples/s/p 4:24:44 } +2024-07-25 20:44:44,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 595/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 2.5331314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:44,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43162 samples/s/p 4:24:37 } +2024-07-25 20:44:47,171 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 597/ 1625], loss: 1.238, per_step_time: 1470ms, lr: 2.5326734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:47,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43990 samples/s/p 4:24:10 } +2024-07-25 20:44:50,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 599/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.5322151e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:50,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43334 samples/s/p 4:24:26 } +2024-07-25 20:44:53,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 601/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 2.5317566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:53,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43986 samples/s/p 4:24:04 } +2024-07-25 20:44:56,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 603/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.531298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:56,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43977 samples/s/p 4:24:01 } +2024-07-25 20:44:58,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 605/ 1625], loss: 1.079, per_step_time: 1472ms, lr: 2.5308394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:58,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43441 samples/s/p 4:24:14 } +2024-07-25 20:45:01,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 607/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.5303805e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:01,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43691 samples/s/p 4:24:04 } +2024-07-25 20:45:04,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 609/ 1625], loss: 1.196, per_step_time: 1470ms, lr: 2.5299214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:04,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43857 samples/s/p 4:23:56 } +2024-07-25 20:45:07,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 611/ 1625], loss: 1.042, per_step_time: 1471ms, lr: 2.5294623e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:07,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.43536 samples/s/p 4:24:02 } +2024-07-25 20:45:10,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 613/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 2.5290028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:10,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.43274 samples/s/p 4:24:07 } +2024-07-25 20:45:13,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 615/ 1625], loss: 1.175, per_step_time: 1470ms, lr: 2.5285432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:13,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.43852 samples/s/p 4:23:47 } +2024-07-25 20:45:16,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 617/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 2.5280837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:16,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 
5.44008 samples/s/p 4:23:40 } +2024-07-25 20:45:19,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 619/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 2.5276235e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:19,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.43558 samples/s/p 4:23:50 } +2024-07-25 20:45:22,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 621/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 2.527163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:22,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.44039 samples/s/p 4:23:33 } +2024-07-25 20:45:25,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 623/ 1625], loss: 1.220, per_step_time: 1469ms, lr: 2.526703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:25,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.44262 samples/s/p 4:23:24 } +2024-07-25 20:45:28,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 625/ 1625], loss: 1.311, per_step_time: 1469ms, lr: 2.5262425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:28,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.44511 samples/s/p 4:23:13 } +2024-07-25 20:45:31,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 627/ 1625], loss: 1.193, per_step_time: 1471ms, lr: 2.525782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:31,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.43734 samples/s/p 4:23:33 } +2024-07-25 20:45:34,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 629/ 1625], 
loss: 1.081, per_step_time: 1473ms, lr: 2.525321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:34,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.42771 samples/s/p 4:23:58 } +2024-07-25 20:45:37,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 631/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 2.52486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:37,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.43505 samples/s/p 4:23:34 } +2024-07-25 20:45:40,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 633/ 1625], loss: 1.220, per_step_time: 1473ms, lr: 2.5243986e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:40,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.43011 samples/s/p 4:23:45 } +2024-07-25 20:45:43,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 635/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 2.5239373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:43,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.43867 samples/s/p 4:23:17 } +2024-07-25 20:45:46,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 637/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 2.5234756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:46,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.43870 samples/s/p 4:23:14 } +2024-07-25 20:45:49,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 639/ 1625], loss: 1.307, per_step_time: 1470ms, lr: 2.523014e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:49,114 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.44078 samples/s/p 4:23:05 } +2024-07-25 20:45:52,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 641/ 1625], loss: 1.284, per_step_time: 1474ms, lr: 2.522552e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:52,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.42614 samples/s/p 4:23:45 } +2024-07-25 20:45:55,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 643/ 1625], loss: 0.997, per_step_time: 1473ms, lr: 2.5220897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:55,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.42956 samples/s/p 4:23:32 } +2024-07-25 20:45:57,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 645/ 1625], loss: 1.323, per_step_time: 1473ms, lr: 2.5216274e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:57,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.43053 samples/s/p 4:23:26 } +2024-07-25 20:46:00,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 647/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.521165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:00,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.43335 samples/s/p 4:23:15 } +2024-07-25 20:46:03,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 649/ 1625], loss: 1.322, per_step_time: 1472ms, lr: 2.5207022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:03,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.43254 samples/s/p 4:23:15 } +2024-07-25 20:46:06,829 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 651/ 1625], loss: 1.077, per_step_time: 1470ms, lr: 2.5202393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:06,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.43937 samples/s/p 4:22:52 } +2024-07-25 20:46:09,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 653/ 1625], loss: 1.238, per_step_time: 1473ms, lr: 2.5197764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:09,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.42981 samples/s/p 4:23:17 } +2024-07-25 20:46:12,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 655/ 1625], loss: 1.119, per_step_time: 1470ms, lr: 2.519313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:12,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.44004 samples/s/p 4:22:44 } +2024-07-25 20:46:15,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 657/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 2.5188498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:15,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.44125 samples/s/p 4:22:38 } +2024-07-25 20:46:18,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 659/ 1625], loss: 1.206, per_step_time: 1472ms, lr: 2.5183861e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:18,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43441 samples/s/p 4:22:55 } +2024-07-25 20:46:21,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 661/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.5179223e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:21,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43556 samples/s/p 4:22:48 } +2024-07-25 20:46:24,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 663/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.5174584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:24,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43846 samples/s/p 4:22:37 } +2024-07-25 20:46:27,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 665/ 1625], loss: 1.260, per_step_time: 1470ms, lr: 2.5169942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:27,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.44047 samples/s/p 4:22:28 } +2024-07-25 20:46:30,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 667/ 1625], loss: 1.393, per_step_time: 1471ms, lr: 2.51653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:30,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43627 samples/s/p 4:22:37 } +2024-07-25 20:46:33,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 669/ 1625], loss: 1.207, per_step_time: 1473ms, lr: 2.5160656e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:33,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43050 samples/s/p 4:22:51 } +2024-07-25 20:46:36,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 671/ 1625], loss: 1.085, per_step_time: 1473ms, lr: 2.5156009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:36,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 
5.42775 samples/s/p 4:22:56 } +2024-07-25 20:46:39,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 673/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.5151363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:39,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43356 samples/s/p 4:22:36 } +2024-07-25 20:46:42,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 675/ 1625], loss: 1.232, per_step_time: 1470ms, lr: 2.5146714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:42,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43949 samples/s/p 4:22:16 } +2024-07-25 20:46:45,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 677/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 2.514206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:45,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43794 samples/s/p 4:22:18 } +2024-07-25 20:46:48,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 679/ 1625], loss: 1.325, per_step_time: 1473ms, lr: 2.5137408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:48,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.42897 samples/s/p 4:22:41 } +2024-07-25 20:46:51,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 681/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 2.5132751e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:51,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43737 samples/s/p 4:22:14 } +2024-07-25 20:46:54,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 683/ 
1625], loss: 1.275, per_step_time: 1473ms, lr: 2.5128094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:54,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.42864 samples/s/p 4:22:36 } +2024-07-25 20:46:56,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 685/ 1625], loss: 0.983, per_step_time: 1472ms, lr: 2.5123436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:56,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43222 samples/s/p 4:22:23 } +2024-07-25 20:46:59,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 687/ 1625], loss: 1.293, per_step_time: 1472ms, lr: 2.5118774e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:59,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43209 samples/s/p 4:22:20 } +2024-07-25 20:47:02,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 689/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 2.5114114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:02,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43921 samples/s/p 4:21:56 } +2024-07-25 20:47:05,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 691/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 2.510945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:05,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43478 samples/s/p 4:22:06 } +2024-07-25 20:47:08,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 693/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 2.5104782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:08,798 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43508 samples/s/p 4:22:03 } +2024-07-25 20:47:11,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 695/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 2.5100115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:11,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43136 samples/s/p 4:22:10 } +2024-07-25 20:47:14,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 697/ 1625], loss: 1.333, per_step_time: 1471ms, lr: 2.5095445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:14,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43623 samples/s/p 4:21:53 } +2024-07-25 20:47:17,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 699/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 2.5090774e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:17,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43605 samples/s/p 4:21:51 } +2024-07-25 20:47:20,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 701/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 2.50861e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:20,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43532 samples/s/p 4:21:50 } +2024-07-25 20:47:23,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 703/ 1625], loss: 1.254, per_step_time: 1470ms, lr: 2.5081426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:23,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43895 samples/s/p 4:21:37 } +2024-07-25 20:47:26,500 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 705/ 1625], loss: 1.310, per_step_time: 1471ms, lr: 2.5076748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:26,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43696 samples/s/p 4:21:39 } +2024-07-25 20:47:29,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 707/ 1625], loss: 0.862, per_step_time: 1472ms, lr: 2.5072073e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:29,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43214 samples/s/p 4:21:50 } +2024-07-25 20:47:32,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 709/ 1625], loss: 1.267, per_step_time: 1474ms, lr: 2.5067391e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:32,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.42685 samples/s/p 4:22:03 } +2024-07-25 20:47:35,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 711/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 2.506271e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:35,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43914 samples/s/p 4:21:24 } +2024-07-25 20:47:38,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 713/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.5058027e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:38,310 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.42896 samples/s/p 4:21:51 } +2024-07-25 20:47:41,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 715/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 2.5053341e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:41,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43411 samples/s/p 4:21:33 } +2024-07-25 20:47:44,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 717/ 1625], loss: 1.304, per_step_time: 1471ms, lr: 2.5048654e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:44,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43736 samples/s/p 4:21:21 } +2024-07-25 20:47:47,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 719/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.5043966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:47,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.42924 samples/s/p 4:21:41 } +2024-07-25 20:47:50,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 721/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 2.5039275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:50,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43218 samples/s/p 4:21:30 } +2024-07-25 20:47:53,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 723/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 2.5034584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:53,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43192 samples/s/p 4:21:27 } +2024-07-25 20:47:56,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 725/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.5029889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:56,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ 
| 5.42904 samples/s/p 4:21:33 } +2024-07-25 20:47:56,025 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-25 20:48:31,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 727/ 1625], loss: 1.002, per_step_time: 2754ms, lr: 2.5025192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:31,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 2.90428 samples/s/p 8:08:50 } +2024-07-25 20:48:34,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 729/ 1625], loss: 0.904, per_step_time: 1472ms, lr: 2.5020494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:34,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43430 samples/s/p 4:21:12 } +2024-07-25 20:48:37,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 731/ 1625], loss: 1.289, per_step_time: 1470ms, lr: 2.5015794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:37,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.44068 samples/s/p 4:20:50 } +2024-07-25 20:48:40,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 733/ 1625], loss: 1.201, per_step_time: 1471ms, lr: 2.5011092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:40,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43563 samples/s/p 4:21:02 } +2024-07-25 20:48:42,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 735/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.5006391e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:42,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43566 samples/s/p 4:20:59 } 
+2024-07-25 20:48:45,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 737/ 1625], loss: 1.286, per_step_time: 1471ms, lr: 2.5001686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:45,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43488 samples/s/p 4:20:58 } +2024-07-25 20:48:48,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 739/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 2.4996976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:48,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43594 samples/s/p 4:20:52 } +2024-07-25 20:48:51,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 741/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 2.499227e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:51,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43314 samples/s/p 4:20:57 } +2024-07-25 20:48:54,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 743/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 2.498756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:54,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43969 samples/s/p 4:20:36 } +2024-07-25 20:48:57,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 745/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 2.4982848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:57,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43162 samples/s/p 4:20:56 } +2024-07-25 20:49:00,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 747/ 1625], loss: 1.195, per_step_time: 
1470ms, lr: 2.4978135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:00,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43911 samples/s/p 4:20:31 } +2024-07-25 20:49:03,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 749/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 2.4973418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:03,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43674 samples/s/p 4:20:35 } +2024-07-25 20:49:06,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 751/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 2.4968702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:06,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43808 samples/s/p 4:20:29 } +2024-07-25 20:49:09,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 753/ 1625], loss: 1.045, per_step_time: 1473ms, lr: 2.4963983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:09,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43007 samples/s/p 4:20:49 } +2024-07-25 20:49:12,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 755/ 1625], loss: 0.919, per_step_time: 1471ms, lr: 2.4959261e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:12,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43620 samples/s/p 4:20:28 } +2024-07-25 20:49:15,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 757/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 2.495454e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:15,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
34.7% |█████████████████ | 5.42827 samples/s/p 4:20:48 } +2024-07-25 20:49:18,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 759/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 2.4949815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:18,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.43737 samples/s/p 4:20:19 } +2024-07-25 20:49:21,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 761/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 2.4945093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:21,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.44102 samples/s/p 4:20:05 } +2024-07-25 20:49:24,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 763/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 2.4940364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:25,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.43694 samples/s/p 4:20:14 } +2024-07-25 20:49:28,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 765/ 1625], loss: 1.161, per_step_time: 1468ms, lr: 2.4935633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:28,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.44601 samples/s/p 4:19:45 } +2024-07-25 20:49:30,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 767/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 2.4930905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:30,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.43618 samples/s/p 4:20:10 } +2024-07-25 20:49:33,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 4/ 10], step:[ 769/ 1625], loss: 1.214, per_step_time: 1470ms, lr: 2.4926172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:33,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.44069 samples/s/p 4:19:55 } +2024-07-25 20:49:36,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 771/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 2.4921437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:36,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.43418 samples/s/p 4:20:10 } +2024-07-25 20:49:39,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 773/ 1625], loss: 1.381, per_step_time: 1471ms, lr: 2.49167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:39,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43519 samples/s/p 4:20:04 } +2024-07-25 20:49:42,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 775/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.4911962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:42,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43318 samples/s/p 4:20:07 } +2024-07-25 20:49:45,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 777/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.4907225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:45,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43767 samples/s/p 4:19:51 } +2024-07-25 20:49:48,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 779/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 2.4902482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:48,681 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43581 samples/s/p 4:19:54 } +2024-07-25 20:49:51,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 781/ 1625], loss: 1.067, per_step_time: 1471ms, lr: 2.4897738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:51,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43625 samples/s/p 4:19:50 } +2024-07-25 20:49:54,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 783/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 2.4892994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:54,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43646 samples/s/p 4:19:46 } +2024-07-25 20:49:57,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 785/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 2.4888246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:57,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43886 samples/s/p 4:19:36 } +2024-07-25 20:50:00,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 787/ 1625], loss: 1.217, per_step_time: 1473ms, lr: 2.4883499e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:00,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43046 samples/s/p 4:19:57 } +2024-07-25 20:50:03,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 789/ 1625], loss: 1.126, per_step_time: 1470ms, lr: 2.4878751e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:03,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.44080 samples/s/p 4:19:25 } +2024-07-25 20:50:06,380 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 791/ 1625], loss: 1.425, per_step_time: 1471ms, lr: 2.4873994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:06,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.43748 samples/s/p 4:19:31 } +2024-07-25 20:50:09,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 793/ 1625], loss: 1.053, per_step_time: 1473ms, lr: 2.4869241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:09,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.42861 samples/s/p 4:19:54 } +2024-07-25 20:50:12,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 795/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.486449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:12,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.43785 samples/s/p 4:19:24 } +2024-07-25 20:50:16,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 797/ 1625], loss: 1.012, per_step_time: 1863ms, lr: 2.4859732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:16,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 4.29254 samples/s/p 5:28:34 } +2024-07-25 20:50:18,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 799/ 1625], loss: 1.219, per_step_time: 1469ms, lr: 2.4854971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:18,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.44231 samples/s/p 4:19:06 } +2024-07-25 20:50:21,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 801/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 2.4850215e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:21,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.43526 samples/s/p 4:19:23 } +2024-07-25 20:50:24,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 803/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.484545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:24,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.43336 samples/s/p 4:19:26 } +2024-07-25 20:50:27,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 805/ 1625], loss: 1.381, per_step_time: 1471ms, lr: 2.4840687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:27,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.43781 samples/s/p 4:19:10 } +2024-07-25 20:50:30,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 807/ 1625], loss: 1.324, per_step_time: 1474ms, lr: 2.4835923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:30,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.42524 samples/s/p 4:19:43 } +2024-07-25 20:50:33,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 809/ 1625], loss: 1.281, per_step_time: 1473ms, lr: 2.4831155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:33,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.42973 samples/s/p 4:19:27 } +2024-07-25 20:50:36,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 811/ 1625], loss: 1.159, per_step_time: 1474ms, lr: 2.4826384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:36,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 
5.42720 samples/s/p 4:19:31 } +2024-07-25 20:50:39,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 813/ 1625], loss: 1.053, per_step_time: 1473ms, lr: 2.4821613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:39,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.42763 samples/s/p 4:19:27 } +2024-07-25 20:50:42,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 815/ 1625], loss: 1.077, per_step_time: 1471ms, lr: 2.4816842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:42,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.43655 samples/s/p 4:18:59 } +2024-07-25 20:50:45,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 817/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 2.4812067e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:45,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.42832 samples/s/p 4:19:19 } +2024-07-25 20:50:48,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 819/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 2.480729e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:48,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.43352 samples/s/p 4:19:02 } +2024-07-25 20:50:51,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 821/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 2.4802514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:51,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43583 samples/s/p 4:18:52 } +2024-07-25 20:50:54,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 823/ 
1625], loss: 1.107, per_step_time: 1471ms, lr: 2.4797733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:54,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43812 samples/s/p 4:18:43 } +2024-07-25 20:50:57,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 825/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 2.4792951e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:57,347 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43085 samples/s/p 4:19:00 } +2024-07-25 20:51:00,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 827/ 1625], loss: 1.134, per_step_time: 1470ms, lr: 2.478817e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:00,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43853 samples/s/p 4:18:35 } +2024-07-25 20:51:03,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 829/ 1625], loss: 1.320, per_step_time: 1473ms, lr: 2.4783385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:03,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.42939 samples/s/p 4:18:59 } +2024-07-25 20:51:06,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 831/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 2.4778597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:06,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43301 samples/s/p 4:18:45 } +2024-07-25 20:51:09,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 833/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.477381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:09,154 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43117 samples/s/p 4:18:48 } +2024-07-25 20:51:12,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 835/ 1625], loss: 1.034, per_step_time: 1472ms, lr: 2.476902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:12,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43164 samples/s/p 4:18:43 } +2024-07-25 20:51:15,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 837/ 1625], loss: 1.244, per_step_time: 1474ms, lr: 2.476423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:15,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.42540 samples/s/p 4:18:58 } +2024-07-25 20:51:18,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 839/ 1625], loss: 1.308, per_step_time: 1471ms, lr: 2.4759434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:18,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.43835 samples/s/p 4:18:18 } +2024-07-25 20:51:20,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 841/ 1625], loss: 1.088, per_step_time: 1471ms, lr: 2.4754641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:20,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.43509 samples/s/p 4:18:25 } +2024-07-25 20:51:23,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 843/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 2.4749845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:23,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.43691 samples/s/p 4:18:17 } +2024-07-25 20:51:26,869 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 845/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 2.474505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:26,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.43167 samples/s/p 4:18:29 } +2024-07-25 20:51:29,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 847/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 2.4740246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:29,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.43571 samples/s/p 4:18:14 } +2024-07-25 20:51:32,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 849/ 1625], loss: 1.202, per_step_time: 1469ms, lr: 2.4735444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:32,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.44221 samples/s/p 4:17:53 } +2024-07-25 20:51:35,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 851/ 1625], loss: 1.151, per_step_time: 1474ms, lr: 2.4730645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:35,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.42610 samples/s/p 4:18:36 } +2024-07-25 20:51:38,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 853/ 1625], loss: 1.191, per_step_time: 1473ms, lr: 2.472584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:38,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.42996 samples/s/p 4:18:22 } +2024-07-25 20:51:41,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 855/ 1625], loss: 0.942, per_step_time: 1471ms, lr: 2.472103e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:41,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43831 samples/s/p 4:17:55 } +2024-07-25 20:51:44,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 857/ 1625], loss: 1.369, per_step_time: 1470ms, lr: 2.4716222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:44,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43903 samples/s/p 4:17:50 } +2024-07-25 20:51:47,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 859/ 1625], loss: 1.313, per_step_time: 1470ms, lr: 2.4711413e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:47,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43942 samples/s/p 4:17:46 } +2024-07-25 20:51:50,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 861/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 2.47066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:50,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43582 samples/s/p 4:17:53 } +2024-07-25 20:51:53,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 863/ 1625], loss: 1.164, per_step_time: 1472ms, lr: 2.4701789e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:53,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43473 samples/s/p 4:17:53 } +2024-07-25 20:51:56,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 865/ 1625], loss: 1.142, per_step_time: 1477ms, lr: 2.4696972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:56,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 
5.41605 samples/s/p 4:18:44 } +2024-07-25 20:51:59,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 867/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 2.4692155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:59,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43670 samples/s/p 4:17:42 } +2024-07-25 20:52:02,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 869/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 2.4687335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:02,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43522 samples/s/p 4:17:43 } +2024-07-25 20:52:05,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 871/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 2.4682515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:05,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43162 samples/s/p 4:17:50 } +2024-07-25 20:52:08,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 873/ 1625], loss: 1.160, per_step_time: 1473ms, lr: 2.4677693e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:08,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43023 samples/s/p 4:17:51 } +2024-07-25 20:52:11,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 875/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 2.467287e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:11,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43255 samples/s/p 4:17:42 } +2024-07-25 20:52:14,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 877/ 
1625], loss: 1.386, per_step_time: 1473ms, lr: 2.4668043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:14,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43010 samples/s/p 4:17:46 } +2024-07-25 20:52:17,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 879/ 1625], loss: 1.280, per_step_time: 1473ms, lr: 2.4663217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:17,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43080 samples/s/p 4:17:41 } +2024-07-25 20:52:19,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 881/ 1625], loss: 1.165, per_step_time: 1470ms, lr: 2.4658388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:19,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.44166 samples/s/p 4:17:07 } +2024-07-25 20:52:22,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 883/ 1625], loss: 1.088, per_step_time: 1475ms, lr: 2.4653558e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:22,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.42223 samples/s/p 4:17:59 } +2024-07-25 20:52:25,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 885/ 1625], loss: 1.289, per_step_time: 1471ms, lr: 2.4648729e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:25,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43817 samples/s/p 4:17:11 } +2024-07-25 20:52:28,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 887/ 1625], loss: 1.284, per_step_time: 1473ms, lr: 2.4643892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:28,860 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43093 samples/s/p 4:17:29 } +2024-07-25 20:52:31,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 889/ 1625], loss: 1.345, per_step_time: 1473ms, lr: 2.463906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:31,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.42913 samples/s/p 4:17:31 } +2024-07-25 20:52:34,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 891/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 2.4634222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:34,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43720 samples/s/p 4:17:05 } +2024-07-25 20:52:37,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 893/ 1625], loss: 1.260, per_step_time: 1470ms, lr: 2.4629384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:37,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.44015 samples/s/p 4:16:54 } +2024-07-25 20:52:40,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 895/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 2.4624542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:40,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43721 samples/s/p 4:16:59 } +2024-07-25 20:52:43,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 897/ 1625], loss: 1.246, per_step_time: 1473ms, lr: 2.46197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:43,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.42913 samples/s/p 4:17:19 } +2024-07-25 20:52:46,567 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 899/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 2.4614856e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:46,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43317 samples/s/p 4:17:05 } +2024-07-25 20:52:49,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 901/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 2.461001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:49,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43264 samples/s/p 4:17:03 } +2024-07-25 20:52:52,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 903/ 1625], loss: 1.062, per_step_time: 1472ms, lr: 2.4605162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:52,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43114 samples/s/p 4:17:05 } +2024-07-25 20:52:55,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 905/ 1625], loss: 1.334, per_step_time: 1472ms, lr: 2.4600313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:55,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43237 samples/s/p 4:16:58 } +2024-07-25 20:52:58,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 907/ 1625], loss: 1.172, per_step_time: 1483ms, lr: 2.4595463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:58,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.39167 samples/s/p 4:18:52 } +2024-07-25 20:53:01,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 909/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.4590609e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:01,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43534 samples/s/p 4:16:44 } +2024-07-25 20:53:04,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 911/ 1625], loss: 1.374, per_step_time: 1473ms, lr: 2.4585755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:04,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.42994 samples/s/p 4:16:56 } +2024-07-25 20:53:07,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 913/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 2.45809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:07,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43334 samples/s/p 4:16:44 } +2024-07-25 20:53:10,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 915/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.4576042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:10,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43587 samples/s/p 4:16:34 } +2024-07-25 20:53:13,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 917/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 2.4571184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:13,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43199 samples/s/p 4:16:42 } +2024-07-25 20:53:16,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 919/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 2.4566321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:16,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 
5.43113 samples/s/p 4:16:41 } +2024-07-25 20:53:19,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 921/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 2.456146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:19,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43358 samples/s/p 4:16:31 } +2024-07-25 20:53:22,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 923/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 2.4556595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:22,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43682 samples/s/p 4:16:19 } +2024-07-25 20:53:24,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 925/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.4551731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:24,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43554 samples/s/p 4:16:20 } +2024-07-25 20:53:27,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 927/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 2.4546864e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:27,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43822 samples/s/p 4:16:09 } +2024-07-25 20:53:30,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 929/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 2.4541992e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:30,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43893 samples/s/p 4:16:04 } +2024-07-25 20:53:33,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 931/ 
1625], loss: 1.181, per_step_time: 1469ms, lr: 2.4537121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:33,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.44235 samples/s/p 4:15:52 } +2024-07-25 20:53:36,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 933/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 2.453225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:36,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43788 samples/s/p 4:16:01 } +2024-07-25 20:53:39,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 935/ 1625], loss: 1.415, per_step_time: 1471ms, lr: 2.4527375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:39,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43487 samples/s/p 4:16:07 } +2024-07-25 20:53:42,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 937/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 2.45225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:42,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43309 samples/s/p 4:16:09 } +2024-07-25 20:53:45,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 939/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.4517623e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:45,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43296 samples/s/p 4:16:06 } +2024-07-25 20:53:48,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 941/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 2.4512745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:48,564 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43659 samples/s/p 4:15:53 } +2024-07-25 20:53:51,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 943/ 1625], loss: 1.144, per_step_time: 1470ms, lr: 2.450786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:51,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.44084 samples/s/p 4:15:38 } +2024-07-25 20:53:54,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 945/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 2.4502982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:54,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43233 samples/s/p 4:15:59 } +2024-07-25 20:53:57,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 947/ 1625], loss: 1.227, per_step_time: 1470ms, lr: 2.4498098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:57,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43859 samples/s/p 4:15:39 } +2024-07-25 20:54:00,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 949/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.449321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:00,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43314 samples/s/p 4:15:51 } +2024-07-25 20:54:03,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 951/ 1625], loss: 1.191, per_step_time: 1473ms, lr: 2.4488325e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:03,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43083 samples/s/p 4:15:55 } +2024-07-25 20:54:06,269 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 953/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.4483435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:06,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43500 samples/s/p 4:15:40 } +2024-07-25 20:54:09,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 955/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 2.4478544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:09,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43292 samples/s/p 4:15:43 } +2024-07-25 20:54:12,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 957/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.4473653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:12,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43741 samples/s/p 4:15:27 } +2024-07-25 20:54:15,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 959/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 2.4468758e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:15,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43679 samples/s/p 4:15:26 } +2024-07-25 20:54:18,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 961/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.4463863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:18,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43337 samples/s/p 4:15:33 } +2024-07-25 20:54:21,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 963/ 1625], loss: 1.204, per_step_time: 1473ms, lr: 
2.4458963e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:21,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43069 samples/s/p 4:15:38 } +2024-07-25 20:54:23,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 965/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 2.4454064e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:23,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.42969 samples/s/p 4:15:37 } +2024-07-25 20:54:26,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 967/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 2.4449166e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:26,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.42769 samples/s/p 4:15:40 } +2024-07-25 20:54:29,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 969/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 2.444426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:29,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.43201 samples/s/p 4:15:25 } +2024-07-25 20:54:32,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 971/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 2.443936e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:32,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.43439 samples/s/p 4:15:15 } +2024-07-25 20:54:35,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 973/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 2.4434456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:35,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% 
|█████████████████ | 5.42800 samples/s/p 4:15:30 } +2024-07-25 20:54:38,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 975/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.4429548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:38,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.43749 samples/s/p 4:15:01 } +2024-07-25 20:54:41,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 977/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 2.4424635e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:41,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.44186 samples/s/p 4:14:45 } +2024-07-25 20:54:44,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 979/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 2.4419727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:44,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.43072 samples/s/p 4:15:14 } +2024-07-25 20:54:47,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 981/ 1625], loss: 1.095, per_step_time: 1469ms, lr: 2.4414816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:47,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.44337 samples/s/p 4:14:35 } +2024-07-25 20:54:50,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 983/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 2.4409901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:50,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.43993 samples/s/p 4:14:42 } +2024-07-25 20:54:53,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 4/ 10], step:[ 985/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 2.4404984e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:53,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43518 samples/s/p 4:14:52 } +2024-07-25 20:54:56,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 987/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 2.440007e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:56,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43570 samples/s/p 4:14:48 } +2024-07-25 20:54:59,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 989/ 1625], loss: 1.269, per_step_time: 1471ms, lr: 2.4395149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:59,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43512 samples/s/p 4:14:47 } +2024-07-25 20:55:02,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 991/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.4390229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:02,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43670 samples/s/p 4:14:39 } +2024-07-25 20:55:05,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 993/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.4385306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:05,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43641 samples/s/p 4:14:37 } +2024-07-25 20:55:08,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 995/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 2.4380382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
20:55:08,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43227 samples/s/p 4:14:46 } +2024-07-25 20:55:11,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 997/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 2.4375458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:11,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43265 samples/s/p 4:14:42 } +2024-07-25 20:55:14,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 999/ 1625], loss: 1.207, per_step_time: 1473ms, lr: 2.437053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:14,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.42819 samples/s/p 4:14:52 } +2024-07-25 20:55:17,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1001/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 2.4365601e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:17,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43297 samples/s/p 4:14:35 } +2024-07-25 20:55:20,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1003/ 1625], loss: 0.955, per_step_time: 1471ms, lr: 2.4360672e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:20,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43541 samples/s/p 4:14:25 } +2024-07-25 20:55:23,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1005/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.4355739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:23,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43343 samples/s/p 4:14:28 } 
+2024-07-25 20:55:25,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1007/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 2.4350806e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:25,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43473 samples/s/p 4:14:21 } +2024-07-25 20:55:28,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1009/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.434587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:28,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43123 samples/s/p 4:14:28 } +2024-07-25 20:55:31,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1011/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 2.4340932e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:31,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43902 samples/s/p 4:14:03 } +2024-07-25 20:55:34,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1013/ 1625], loss: 1.297, per_step_time: 1474ms, lr: 2.4335995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:34,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.42579 samples/s/p 4:14:38 } +2024-07-25 20:55:37,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1015/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 2.4331055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:37,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43514 samples/s/p 4:14:08 } +2024-07-25 20:55:40,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1017/ 1625], loss: 1.134, 
per_step_time: 1471ms, lr: 2.4326111e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:40,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43587 samples/s/p 4:14:03 } +2024-07-25 20:55:43,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1019/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 2.432117e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:43,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43204 samples/s/p 4:14:11 } +2024-07-25 20:55:46,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1021/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 2.4316225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:46,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43168 samples/s/p 4:14:09 } +2024-07-25 20:55:49,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1023/ 1625], loss: 1.379, per_step_time: 1471ms, lr: 2.431128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:49,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43796 samples/s/p 4:13:49 } +2024-07-25 20:55:52,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1025/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 2.4306331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:52,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43623 samples/s/p 4:13:51 } +2024-07-25 20:55:55,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1027/ 1625], loss: 1.276, per_step_time: 1472ms, lr: 2.430138e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:55,471 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43149 samples/s/p 4:14:01 } +2024-07-25 20:55:58,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1029/ 1625], loss: 1.533, per_step_time: 1472ms, lr: 2.4296429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:58,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43471 samples/s/p 4:13:49 } +2024-07-25 20:56:01,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1031/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 2.4291478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:01,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43659 samples/s/p 4:13:41 } +2024-07-25 20:56:04,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1033/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 2.428652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:04,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.43523 samples/s/p 4:13:42 } +2024-07-25 20:56:07,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1035/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 2.4281568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:07,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.43837 samples/s/p 4:13:30 } +2024-07-25 20:56:10,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1037/ 1625], loss: 1.027, per_step_time: 1471ms, lr: 2.427661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:10,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.43601 samples/s/p 4:13:34 } +2024-07-25 20:56:13,177 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1039/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 2.4271649e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:13,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.42773 samples/s/p 4:13:54 } +2024-07-25 20:56:16,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1041/ 1625], loss: 1.168, per_step_time: 1473ms, lr: 2.4266688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:16,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.42880 samples/s/p 4:13:48 } +2024-07-25 20:56:19,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1043/ 1625], loss: 1.024, per_step_time: 1471ms, lr: 2.4261724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:19,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.43511 samples/s/p 4:13:27 } +2024-07-25 20:56:22,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1045/ 1625], loss: 1.225, per_step_time: 1470ms, lr: 2.425676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:22,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.43969 samples/s/p 4:13:12 } +2024-07-25 20:56:24,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1047/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 2.4251794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:24,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.42820 samples/s/p 4:13:41 } +2024-07-25 20:56:27,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1049/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 
2.4246825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:27,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43943 samples/s/p 4:13:06 } +2024-07-25 20:56:30,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1051/ 1625], loss: 0.981, per_step_time: 1472ms, lr: 2.4241855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:30,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43142 samples/s/p 4:13:26 } +2024-07-25 20:56:33,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1053/ 1625], loss: 1.028, per_step_time: 1471ms, lr: 2.4236884e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:33,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43531 samples/s/p 4:13:12 } +2024-07-25 20:56:36,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1055/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.4231913e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:36,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43556 samples/s/p 4:13:08 } +2024-07-25 20:56:39,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1057/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 2.422694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:39,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43678 samples/s/p 4:13:02 } +2024-07-25 20:56:42,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1059/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.4221965e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:42,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
36.5% |██████████████████ | 5.43528 samples/s/p 4:13:03 } +2024-07-25 20:56:45,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1061/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 2.421699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:45,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43577 samples/s/p 4:12:59 } +2024-07-25 20:56:48,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1063/ 1625], loss: 1.396, per_step_time: 1470ms, lr: 2.421201e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:48,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43916 samples/s/p 4:12:47 } +2024-07-25 20:56:51,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1065/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 2.4207025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:51,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43212 samples/s/p 4:13:03 } +2024-07-25 20:56:54,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1067/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 2.4202047e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:54,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43239 samples/s/p 4:13:00 } +2024-07-25 20:56:57,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1069/ 1625], loss: 1.090, per_step_time: 1470ms, lr: 2.4197063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:57,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43885 samples/s/p 4:12:39 } +2024-07-25 20:57:00,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 4/ 10], step:[ 1071/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 2.4192077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:00,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43747 samples/s/p 4:12:39 } +2024-07-25 20:57:03,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1073/ 1625], loss: 1.272, per_step_time: 1470ms, lr: 2.418709e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:03,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43917 samples/s/p 4:12:32 } +2024-07-25 20:57:06,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1075/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.4182102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:06,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43195 samples/s/p 4:12:49 } +2024-07-25 20:57:09,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1077/ 1625], loss: 1.091, per_step_time: 1482ms, lr: 2.4177112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:09,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.39485 samples/s/p 4:14:30 } +2024-07-25 20:57:12,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1079/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.417212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:12,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43321 samples/s/p 4:12:40 } +2024-07-25 20:57:15,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1081/ 1625], loss: 1.162, per_step_time: 1469ms, lr: 2.4167124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
20:57:15,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.44289 samples/s/p 4:12:10 } +2024-07-25 20:57:18,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1083/ 1625], loss: 1.202, per_step_time: 1470ms, lr: 2.4162131e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:18,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43891 samples/s/p 4:12:18 } +2024-07-25 20:57:21,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1085/ 1625], loss: 1.123, per_step_time: 1470ms, lr: 2.4157134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:21,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.44117 samples/s/p 4:12:09 } +2024-07-25 20:57:24,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1087/ 1625], loss: 1.035, per_step_time: 1471ms, lr: 2.4152136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:24,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43818 samples/s/p 4:12:14 } +2024-07-25 20:57:26,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1089/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 2.4147135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:26,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43262 samples/s/p 4:12:27 } +2024-07-25 20:57:29,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1091/ 1625], loss: 0.914, per_step_time: 1473ms, lr: 2.4142133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:29,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43066 samples/s/p 4:12:29 } 
+2024-07-25 20:57:32,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1093/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 2.413713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:32,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43386 samples/s/p 4:12:17 } +2024-07-25 20:57:35,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1095/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 2.4132125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:35,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43778 samples/s/p 4:12:03 } +2024-07-25 20:57:38,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1097/ 1625], loss: 1.011, per_step_time: 1472ms, lr: 2.412712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:38,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43444 samples/s/p 4:12:10 } +2024-07-25 20:57:41,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1099/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.4122113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:41,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43348 samples/s/p 4:12:09 } +2024-07-25 20:57:44,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1101/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 2.4117102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:44,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43976 samples/s/p 4:11:49 } +2024-07-25 20:57:47,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1103/ 1625], loss: 0.950, 
per_step_time: 1471ms, lr: 2.4112092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:47,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43783 samples/s/p 4:11:51 } +2024-07-25 20:57:50,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1105/ 1625], loss: 1.175, per_step_time: 1473ms, lr: 2.410708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:50,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43003 samples/s/p 4:12:10 } +2024-07-25 20:57:53,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1107/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 2.4102066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:53,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.44060 samples/s/p 4:11:38 } +2024-07-25 20:57:56,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1109/ 1625], loss: 1.166, per_step_time: 1475ms, lr: 2.409705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:56,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.42246 samples/s/p 4:12:25 } +2024-07-25 20:57:59,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1111/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.4092036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:59,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43314 samples/s/p 4:11:53 } +2024-07-25 20:58:02,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1113/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 2.4087014e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:02,377 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43716 samples/s/p 4:11:39 } +2024-07-25 20:58:05,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1115/ 1625], loss: 1.393, per_step_time: 1471ms, lr: 2.4081994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:05,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.43613 samples/s/p 4:11:38 } +2024-07-25 20:58:08,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1117/ 1625], loss: 1.232, per_step_time: 1484ms, lr: 2.4076973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:08,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.39070 samples/s/p 4:13:43 } +2024-07-25 20:58:11,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1119/ 1625], loss: 1.217, per_step_time: 1473ms, lr: 2.407195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:11,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.42997 samples/s/p 4:11:50 } +2024-07-25 20:58:14,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1121/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.4066921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:14,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.43306 samples/s/p 4:11:38 } +2024-07-25 20:58:17,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1123/ 1625], loss: 1.187, per_step_time: 1473ms, lr: 2.40619e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:17,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.43021 samples/s/p 4:11:43 } +2024-07-25 20:58:20,115 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1125/ 1625], loss: 1.255, per_step_time: 1473ms, lr: 2.4056868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:20,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.42868 samples/s/p 4:11:44 } +2024-07-25 20:58:23,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1127/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 2.4051838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:23,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.43539 samples/s/p 4:11:23 } +2024-07-25 20:58:26,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1129/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 2.4046809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:26,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.44102 samples/s/p 4:11:04 } +2024-07-25 20:58:28,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1131/ 1625], loss: 1.193, per_step_time: 1471ms, lr: 2.4041776e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:28,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43702 samples/s/p 4:11:12 } +2024-07-25 20:58:31,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1133/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 2.4036739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:31,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43544 samples/s/p 4:11:14 } +2024-07-25 20:58:34,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1135/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 
2.4031702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:34,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.44182 samples/s/p 4:10:53 } +2024-07-25 20:58:37,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1137/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 2.4026664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:37,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43932 samples/s/p 4:10:57 } +2024-07-25 20:58:40,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1139/ 1625], loss: 1.038, per_step_time: 1470ms, lr: 2.4021625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:40,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43938 samples/s/p 4:10:54 } +2024-07-25 20:58:43,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1141/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 2.4016585e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:43,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43772 samples/s/p 4:10:56 } +2024-07-25 20:58:46,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1143/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.4011542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:46,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43333 samples/s/p 4:11:05 } +2024-07-25 20:58:49,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1145/ 1625], loss: 1.056, per_step_time: 1471ms, lr: 2.40065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:49,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
37.0% |██████████████████ | 5.43789 samples/s/p 4:10:49 } +2024-07-25 20:58:52,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1147/ 1625], loss: 1.273, per_step_time: 1472ms, lr: 2.4001452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:52,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43192 samples/s/p 4:11:03 } +2024-07-25 20:58:55,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1149/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.3996405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:55,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43657 samples/s/p 4:10:47 } +2024-07-25 20:58:58,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1151/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 2.3991359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:58,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43094 samples/s/p 4:11:00 } +2024-07-25 20:59:01,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1153/ 1625], loss: 1.233, per_step_time: 1470ms, lr: 2.3986307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:01,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.44018 samples/s/p 4:10:31 } +2024-07-25 20:59:04,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1155/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.3981253e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:04,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43356 samples/s/p 4:10:47 } +2024-07-25 20:59:07,316 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 4/ 10], step:[ 1157/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 2.3976201e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:07,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43291 samples/s/p 4:10:46 } +2024-07-25 20:59:10,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1159/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 2.3971146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:10,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43903 samples/s/p 4:10:26 } +2024-07-25 20:59:13,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1161/ 1625], loss: 1.137, per_step_time: 1473ms, lr: 2.3966091e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:13,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43096 samples/s/p 4:10:45 } +2024-07-25 20:59:16,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1163/ 1625], loss: 0.920, per_step_time: 1473ms, lr: 2.396103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:16,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.42835 samples/s/p 4:10:49 } +2024-07-25 20:59:19,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1165/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 2.3955972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:19,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43549 samples/s/p 4:10:27 } +2024-07-25 20:59:22,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1167/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 2.3950912e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 20:59:22,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43675 samples/s/p 4:10:20 } +2024-07-25 20:59:25,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1169/ 1625], loss: 0.966, per_step_time: 1470ms, lr: 2.3945848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:25,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.44067 samples/s/p 4:10:06 } +2024-07-25 20:59:27,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1171/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 2.3940784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:27,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.44115 samples/s/p 4:10:02 } +2024-07-25 20:59:30,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1173/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 2.3935718e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:30,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43761 samples/s/p 4:10:09 } +2024-07-25 20:59:33,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1175/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.393065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:33,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43324 samples/s/p 4:10:18 } +2024-07-25 20:59:36,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1177/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 2.3925579e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43795 samples/s/p 
4:10:02 } +2024-07-25 20:59:39,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1179/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 2.392051e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:39,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43490 samples/s/p 4:10:08 } +2024-07-25 20:59:42,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1181/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.3915436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:42,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43459 samples/s/p 4:10:06 } +2024-07-25 20:59:45,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1183/ 1625], loss: 1.230, per_step_time: 1473ms, lr: 2.3910365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:45,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.42938 samples/s/p 4:10:17 } +2024-07-25 20:59:48,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1185/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 2.3905288e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:48,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43755 samples/s/p 4:09:52 } +2024-07-25 20:59:51,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1187/ 1625], loss: 1.158, per_step_time: 1470ms, lr: 2.3900211e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:51,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43929 samples/s/p 4:09:44 } +2024-07-25 20:59:54,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1189/ 1625], loss: 
1.161, per_step_time: 1470ms, lr: 2.3895132e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:54,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43939 samples/s/p 4:09:41 } +2024-07-25 20:59:57,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1191/ 1625], loss: 1.297, per_step_time: 1473ms, lr: 2.3890052e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:57,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.42764 samples/s/p 4:10:10 } +2024-07-25 21:00:00,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1193/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 2.3884972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:00,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43601 samples/s/p 4:09:44 } +2024-07-25 21:00:03,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1195/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 2.3879888e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:03,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43828 samples/s/p 4:09:35 } +2024-07-25 21:00:06,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1197/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 2.3874802e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:06,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43733 samples/s/p 4:09:34 } +2024-07-25 21:00:09,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1199/ 1625], loss: 1.037, per_step_time: 1471ms, lr: 2.3869716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:09,278 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43676 samples/s/p 4:09:33 } +2024-07-25 21:00:12,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1201/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 2.3864632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:12,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43167 samples/s/p 4:09:44 } +2024-07-25 21:00:15,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1203/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.3859538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:15,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43672 samples/s/p 4:09:27 } +2024-07-25 21:00:18,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1205/ 1625], loss: 1.304, per_step_time: 1471ms, lr: 2.3854449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:18,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43575 samples/s/p 4:09:27 } +2024-07-25 21:00:21,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1207/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.3849358e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:21,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43327 samples/s/p 4:09:31 } +2024-07-25 21:00:24,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1209/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 2.3844266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:24,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43618 samples/s/p 4:09:20 } +2024-07-25 
21:00:26,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1211/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 2.3839166e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:26,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43740 samples/s/p 4:09:14 } +2024-07-25 21:00:29,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1213/ 1625], loss: 1.367, per_step_time: 1472ms, lr: 2.3834073e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:29,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43158 samples/s/p 4:09:27 } +2024-07-25 21:00:32,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1215/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.3828976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:32,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43515 samples/s/p 4:09:14 } +2024-07-25 21:00:35,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1217/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 2.3823872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:35,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43438 samples/s/p 4:09:13 } +2024-07-25 21:00:38,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1219/ 1625], loss: 1.324, per_step_time: 1470ms, lr: 2.3818773e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:38,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.44016 samples/s/p 4:08:54 } +2024-07-25 21:00:41,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1221/ 1625], loss: 1.435, per_step_time: 
1473ms, lr: 2.3813669e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:41,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43054 samples/s/p 4:09:18 } +2024-07-25 21:00:44,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1223/ 1625], loss: 1.302, per_step_time: 1470ms, lr: 2.3808565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:44,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43863 samples/s/p 4:08:53 } +2024-07-25 21:00:47,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1225/ 1625], loss: 1.394, per_step_time: 1472ms, lr: 2.3803459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:47,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43352 samples/s/p 4:09:04 } +2024-07-25 21:00:50,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1227/ 1625], loss: 1.141, per_step_time: 1470ms, lr: 2.3798351e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:50,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.44192 samples/s/p 4:08:38 } +2024-07-25 21:00:53,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1229/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 2.379324e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:53,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43262 samples/s/p 4:09:00 } +2024-07-25 21:00:56,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1231/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.378813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:56,489 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 37.6% |██████████████████ | 5.43500 samples/s/p 4:08:51 } +2024-07-25 21:00:59,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1233/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 2.3783017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:59,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43937 samples/s/p 4:08:36 } +2024-07-25 21:01:02,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1235/ 1625], loss: 1.003, per_step_time: 1470ms, lr: 2.3777904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:02,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43922 samples/s/p 4:08:33 } +2024-07-25 21:01:05,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1237/ 1625], loss: 1.076, per_step_time: 1470ms, lr: 2.3772787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:05,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.44038 samples/s/p 4:08:27 } +2024-07-25 21:01:08,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1239/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 2.3767674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:08,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.44192 samples/s/p 4:08:20 } +2024-07-25 21:01:11,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1241/ 1625], loss: 1.252, per_step_time: 1470ms, lr: 2.3762554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:11,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43870 samples/s/p 4:08:26 } +2024-07-25 21:01:14,182 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1243/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.3757435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:14,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43360 samples/s/p 4:08:37 } +2024-07-25 21:01:17,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1245/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.3752315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:17,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.42975 samples/s/p 4:08:45 } +2024-07-25 21:01:20,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1247/ 1625], loss: 1.100, per_step_time: 1474ms, lr: 2.374719e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:20,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.42699 samples/s/p 4:08:49 } +2024-07-25 21:01:23,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1249/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.3742066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:23,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.43276 samples/s/p 4:08:31 } +2024-07-25 21:01:25,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1251/ 1625], loss: 1.154, per_step_time: 1470ms, lr: 2.373694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:25,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.44142 samples/s/p 4:08:04 } +2024-07-25 21:01:28,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1253/ 1625], loss: 1.289, per_step_time: 1472ms, lr: 
2.3731813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:28,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.43420 samples/s/p 4:08:21 } +2024-07-25 21:01:31,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1255/ 1625], loss: 1.197, per_step_time: 1469ms, lr: 2.3726683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:31,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.44391 samples/s/p 4:07:51 } +2024-07-25 21:01:34,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1257/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 2.3721554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:34,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.43814 samples/s/p 4:08:04 } +2024-07-25 21:01:37,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1259/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.371642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:37,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.43503 samples/s/p 4:08:10 } +2024-07-25 21:01:40,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1261/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 2.3711285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:40,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.43916 samples/s/p 4:07:55 } +2024-07-25 21:01:43,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1263/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 2.3706152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:43,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
37.8% |██████████████████ | 5.43233 samples/s/p 4:08:11 } +2024-07-25 21:01:46,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1265/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 2.3701015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:46,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.43325 samples/s/p 4:08:06 } +2024-07-25 21:01:49,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1267/ 1625], loss: 1.050, per_step_time: 1474ms, lr: 2.3695877e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:49,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.42471 samples/s/p 4:08:26 } +2024-07-25 21:01:52,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1269/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.3690738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:52,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.43331 samples/s/p 4:08:00 } +2024-07-25 21:01:55,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1271/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.3685594e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:55,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.43376 samples/s/p 4:07:55 } +2024-07-25 21:01:58,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1273/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 2.3680452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:58,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.43154 samples/s/p 4:07:59 } +2024-07-25 21:02:01,402 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 4/ 10], step:[ 1275/ 1625], loss: 0.887, per_step_time: 1470ms, lr: 2.3675308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:01,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.44060 samples/s/p 4:07:31 } +2024-07-25 21:02:04,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1277/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 2.3670162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:04,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43061 samples/s/p 4:07:55 } +2024-07-25 21:02:07,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1279/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.3665016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:07,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43841 samples/s/p 4:07:31 } +2024-07-25 21:02:10,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1281/ 1625], loss: 1.345, per_step_time: 1471ms, lr: 2.3659866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:10,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43694 samples/s/p 4:07:32 } +2024-07-25 21:02:13,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1283/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 2.3654715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:13,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43394 samples/s/p 4:07:37 } +2024-07-25 21:02:16,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1285/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.3649563e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:02:16,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43808 samples/s/p 4:07:23 } +2024-07-25 21:02:19,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1287/ 1625], loss: 1.379, per_step_time: 1472ms, lr: 2.364441e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:19,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43314 samples/s/p 4:07:34 } +2024-07-25 21:02:22,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1289/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 2.3639259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:22,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43578 samples/s/p 4:07:23 } +2024-07-25 21:02:25,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1291/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 2.36341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:25,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43786 samples/s/p 4:07:15 } +2024-07-25 21:02:27,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1293/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 2.3628942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:27,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.43985 samples/s/p 4:07:06 } +2024-07-25 21:02:30,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1295/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.3623785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:30,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.43645 samples/s/p 4:07:13 
} +2024-07-25 21:02:33,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1297/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 2.3618622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:33,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.43380 samples/s/p 4:07:17 } +2024-07-25 21:02:36,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1299/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.3613458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:36,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.43522 samples/s/p 4:07:10 } +2024-07-25 21:02:39,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1301/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.3608296e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:39,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.43178 samples/s/p 4:07:17 } +2024-07-25 21:02:42,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1303/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 2.3603132e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:42,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.43269 samples/s/p 4:07:11 } +2024-07-25 21:02:45,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1305/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 2.3597966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:45,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.43206 samples/s/p 4:07:10 } +2024-07-25 21:02:48,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1307/ 1625], loss: 
1.249, per_step_time: 1473ms, lr: 2.3592798e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:48,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.42773 samples/s/p 4:07:19 } +2024-07-25 21:02:51,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1309/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 2.3587627e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:51,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43462 samples/s/p 4:06:57 } +2024-07-25 21:02:54,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1311/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 2.3582457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:54,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43323 samples/s/p 4:06:58 } +2024-07-25 21:02:57,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1313/ 1625], loss: 1.143, per_step_time: 1473ms, lr: 2.3577282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:57,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43034 samples/s/p 4:07:03 } +2024-07-25 21:03:00,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1315/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.3572107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:00,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43639 samples/s/p 4:06:43 } +2024-07-25 21:03:03,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1317/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.3566932e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:03,379 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43412 samples/s/p 4:06:47 } +2024-07-25 21:03:06,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1319/ 1625], loss: 1.265, per_step_time: 1473ms, lr: 2.3561757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:06,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.42887 samples/s/p 4:06:58 } +2024-07-25 21:03:09,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1321/ 1625], loss: 1.175, per_step_time: 1470ms, lr: 2.3556577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:09,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43855 samples/s/p 4:06:29 } +2024-07-25 21:03:12,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1323/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 2.35514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:12,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43439 samples/s/p 4:06:37 } +2024-07-25 21:03:15,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1325/ 1625], loss: 0.985, per_step_time: 1472ms, lr: 2.3546214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:15,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43356 samples/s/p 4:06:36 } +2024-07-25 21:03:18,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1327/ 1625], loss: 1.278, per_step_time: 1474ms, lr: 2.3541032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:18,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.42394 samples/s/p 4:07:00 } +2024-07-25 
21:03:21,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1329/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.353585e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:21,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43337 samples/s/p 4:06:31 } +2024-07-25 21:03:24,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1331/ 1625], loss: 1.386, per_step_time: 1471ms, lr: 2.3530665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:24,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43798 samples/s/p 4:06:16 } +2024-07-25 21:03:26,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1333/ 1625], loss: 1.254, per_step_time: 1470ms, lr: 2.3525474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:26,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43872 samples/s/p 4:06:11 } +2024-07-25 21:03:29,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1335/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.3520286e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:29,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43342 samples/s/p 4:06:22 } +2024-07-25 21:03:32,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1337/ 1625], loss: 1.373, per_step_time: 1471ms, lr: 2.3515096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:32,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43602 samples/s/p 4:06:12 } +2024-07-25 21:03:35,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1339/ 1625], loss: 1.259, 
per_step_time: 1472ms, lr: 2.3509905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:35,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43369 samples/s/p 4:06:15 } +2024-07-25 21:03:38,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1341/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 2.350471e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:38,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43713 samples/s/p 4:06:03 } +2024-07-25 21:03:41,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1343/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.3499517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:41,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43468 samples/s/p 4:06:07 } +2024-07-25 21:03:44,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1345/ 1625], loss: 1.059, per_step_time: 1475ms, lr: 2.3494318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:44,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.42348 samples/s/p 4:06:34 } +2024-07-25 21:03:47,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1347/ 1625], loss: 1.173, per_step_time: 1470ms, lr: 2.3489121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:47,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43941 samples/s/p 4:05:48 } +2024-07-25 21:03:50,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1349/ 1625], loss: 0.962, per_step_time: 1472ms, lr: 2.348392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:50,605 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43164 samples/s/p 4:06:06 } +2024-07-25 21:03:53,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1351/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 2.347872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:53,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43391 samples/s/p 4:05:57 } +2024-07-25 21:03:56,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1353/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 2.3473518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:56,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.44018 samples/s/p 4:05:37 } +2024-07-25 21:03:59,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1355/ 1625], loss: 1.011, per_step_time: 1472ms, lr: 2.3468312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:59,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43192 samples/s/p 4:05:57 } +2024-07-25 21:04:02,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1357/ 1625], loss: 1.483, per_step_time: 1472ms, lr: 2.346311e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:02,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43464 samples/s/p 4:05:46 } +2024-07-25 21:04:05,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1359/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.3457902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:05,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43383 samples/s/p 4:05:46 } +2024-07-25 
21:04:08,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1361/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.3452694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:08,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43648 samples/s/p 4:05:36 } +2024-07-25 21:04:11,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1363/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.3447485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:11,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43557 samples/s/p 4:05:35 } +2024-07-25 21:04:14,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1365/ 1625], loss: 1.111, per_step_time: 1471ms, lr: 2.3442273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:14,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43545 samples/s/p 4:05:32 } +2024-07-25 21:04:17,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1367/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 2.343706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:17,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43176 samples/s/p 4:05:39 } +2024-07-25 21:04:20,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1369/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 2.3431845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:20,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.42840 samples/s/p 4:05:46 } +2024-07-25 21:04:23,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1371/ 1625], loss: 1.124, 
per_step_time: 1472ms, lr: 2.342663e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:23,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43279 samples/s/p 4:05:31 } +2024-07-25 21:04:26,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1373/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.3421413e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:26,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43140 samples/s/p 4:05:32 } +2024-07-25 21:04:28,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1375/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 2.3416194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:28,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.42781 samples/s/p 4:05:38 } +2024-07-25 21:04:31,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1377/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 2.3410974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:31,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.43950 samples/s/p 4:05:04 } +2024-07-25 21:04:34,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1379/ 1625], loss: 1.295, per_step_time: 1474ms, lr: 2.3405755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:34,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.42681 samples/s/p 4:05:35 } +2024-07-25 21:04:37,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1381/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 2.340053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:37,832 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.43884 samples/s/p 4:05:00 } +2024-07-25 21:04:40,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1383/ 1625], loss: 1.077, per_step_time: 1471ms, lr: 2.3395305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:40,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.43582 samples/s/p 4:05:05 } +2024-07-25 21:04:43,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1385/ 1625], loss: 1.235, per_step_time: 1470ms, lr: 2.3390083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:43,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.43933 samples/s/p 4:04:52 } +2024-07-25 21:04:46,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1387/ 1625], loss: 1.106, per_step_time: 1470ms, lr: 2.3384853e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:46,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.43937 samples/s/p 4:04:49 } +2024-07-25 21:04:49,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1389/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 2.3379625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:49,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.43050 samples/s/p 4:05:10 } +2024-07-25 21:04:52,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1391/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 2.3374394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:52,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43649 samples/s/p 4:04:51 } +2024-07-25 
21:04:55,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1393/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.3369164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:55,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43644 samples/s/p 4:04:49 } +2024-07-25 21:04:58,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1395/ 1625], loss: 1.203, per_step_time: 1473ms, lr: 2.336393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:58,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43056 samples/s/p 4:05:01 } +2024-07-25 21:05:01,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1397/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 2.3358696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:01,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43239 samples/s/p 4:04:54 } +2024-07-25 21:05:04,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1399/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 2.3353461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:04,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43571 samples/s/p 4:04:42 } +2024-07-25 21:05:07,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1401/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.334822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:07,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43065 samples/s/p 4:04:52 } +2024-07-25 21:05:10,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1403/ 1625], loss: 1.254, 
per_step_time: 1474ms, lr: 2.3342984e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:10,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.42724 samples/s/p 4:04:59 } +2024-07-25 21:05:13,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1405/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 2.3337743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:13,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43088 samples/s/p 4:04:46 } +2024-07-25 21:05:16,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1407/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.3332504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:16,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43185 samples/s/p 4:04:40 } +2024-07-25 21:05:19,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1409/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.3327257e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:19,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43292 samples/s/p 4:04:34 } +2024-07-25 21:05:22,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1411/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 2.3322013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:22,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43618 samples/s/p 4:04:23 } +2024-07-25 21:05:25,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1413/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 2.3316768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:25,059 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43210 samples/s/p 4:04:31 } +2024-07-25 21:05:28,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1415/ 1625], loss: 1.025, per_step_time: 1470ms, lr: 2.3311522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:28,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.44108 samples/s/p 4:04:04 } +2024-07-25 21:05:30,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1417/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.3306273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:30,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43232 samples/s/p 4:04:24 } +2024-07-25 21:05:33,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1419/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 2.3301021e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:33,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.44016 samples/s/p 4:04:00 } +2024-07-25 21:05:36,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1421/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 2.329577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:36,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43128 samples/s/p 4:04:21 } +2024-07-25 21:05:39,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1423/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 2.3290517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:39,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43798 samples/s/p 4:04:00 } +2024-07-25 
21:05:42,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1425/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 2.3285264e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:42,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43811 samples/s/p 4:03:57 } +2024-07-25 21:05:45,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1427/ 1625], loss: 1.306, per_step_time: 1473ms, lr: 2.3280007e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:45,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.42972 samples/s/p 4:04:17 } +2024-07-25 21:05:48,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1429/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 2.3274748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:48,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43512 samples/s/p 4:03:59 } +2024-07-25 21:05:51,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1431/ 1625], loss: 1.180, per_step_time: 1474ms, lr: 2.326949e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:51,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.42461 samples/s/p 4:04:25 } +2024-07-25 21:05:54,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1433/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 2.3264229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:54,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43415 samples/s/p 4:03:56 } +2024-07-25 21:05:57,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1435/ 1625], loss: 1.253, 
per_step_time: 1471ms, lr: 2.3258966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:57,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43566 samples/s/p 4:03:49 } +2024-07-25 21:06:00,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1437/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.3253704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:00,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43202 samples/s/p 4:03:56 } +2024-07-25 21:06:03,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1439/ 1625], loss: 1.168, per_step_time: 1473ms, lr: 2.324844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:03,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43002 samples/s/p 4:03:58 } +2024-07-25 21:06:06,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1441/ 1625], loss: 1.043, per_step_time: 1471ms, lr: 2.324317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:06,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43494 samples/s/p 4:03:42 } +2024-07-25 21:06:09,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1443/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.3237904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:09,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43347 samples/s/p 4:03:43 } +2024-07-25 21:06:12,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1445/ 1625], loss: 1.178, per_step_time: 1474ms, lr: 2.3232637e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:12,286 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.42698 samples/s/p 4:03:57 } +2024-07-25 21:06:15,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1447/ 1625], loss: 1.206, per_step_time: 1472ms, lr: 2.3227365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:15,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43385 samples/s/p 4:03:36 } +2024-07-25 21:06:18,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1449/ 1625], loss: 1.026, per_step_time: 1472ms, lr: 2.3222094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:18,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43117 samples/s/p 4:03:40 } +2024-07-25 21:06:21,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1451/ 1625], loss: 1.352, per_step_time: 1472ms, lr: 2.321682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:21,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43250 samples/s/p 4:03:34 } +2024-07-25 21:06:24,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1453/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 2.3211544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:24,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43335 samples/s/p 4:03:29 } +2024-07-25 21:06:27,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1455/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.3206267e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:27,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43247 samples/s/p 4:03:28 } +2024-07-25 
21:06:29,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1457/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 2.3200992e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:29,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43451 samples/s/p 4:03:20 } +2024-07-25 21:06:32,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1459/ 1625], loss: 1.048, per_step_time: 1473ms, lr: 2.3195713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:32,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43084 samples/s/p 4:03:26 } +2024-07-25 21:06:35,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1461/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.319043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:35,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43530 samples/s/p 4:03:12 } +2024-07-25 21:06:38,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1463/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 2.3185148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:38,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43714 samples/s/p 4:03:04 } +2024-07-25 21:06:41,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1465/ 1625], loss: 1.114, per_step_time: 1469ms, lr: 2.3179866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:41,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.44243 samples/s/p 4:02:47 } +2024-07-25 21:06:44,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1467/ 1625], loss: 1.149, 
per_step_time: 1472ms, lr: 2.317458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:44,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43381 samples/s/p 4:03:07 } +2024-07-25 21:06:47,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1469/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 2.3169294e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:47,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43361 samples/s/p 4:03:04 } +2024-07-25 21:06:50,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1471/ 1625], loss: 1.056, per_step_time: 1472ms, lr: 2.3164008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:50,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43458 samples/s/p 4:02:59 } +2024-07-25 21:06:53,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1473/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.3158722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:53,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43721 samples/s/p 4:02:49 } +2024-07-25 21:06:56,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1475/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.3153427e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:56,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43194 samples/s/p 4:03:00 } +2024-07-25 21:06:59,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1477/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.3148137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:59,505 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43523 samples/s/p 4:02:48 } +2024-07-25 21:07:02,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1479/ 1625], loss: 1.247, per_step_time: 1473ms, lr: 2.3142846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:02,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.42888 samples/s/p 4:03:02 } +2024-07-25 21:07:05,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1481/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 2.313755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:05,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43457 samples/s/p 4:02:44 } +2024-07-25 21:07:08,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1483/ 1625], loss: 0.946, per_step_time: 1470ms, lr: 2.3132252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:08,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43921 samples/s/p 4:02:29 } +2024-07-25 21:07:11,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1485/ 1625], loss: 1.296, per_step_time: 1471ms, lr: 2.3126957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:11,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43821 samples/s/p 4:02:28 } +2024-07-25 21:07:14,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1487/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 2.3121658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:14,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43083 samples/s/p 4:02:45 } +2024-07-25 
21:07:17,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1489/ 1625], loss: 0.995, per_step_time: 1472ms, lr: 2.3116358e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:17,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43183 samples/s/p 4:02:40 } +2024-07-25 21:07:20,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1491/ 1625], loss: 1.212, per_step_time: 1472ms, lr: 2.3111055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:20,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43295 samples/s/p 4:02:34 } +2024-07-25 21:07:23,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1493/ 1625], loss: 0.977, per_step_time: 1473ms, lr: 2.3105753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:23,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43108 samples/s/p 4:02:36 } +2024-07-25 21:07:26,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1495/ 1625], loss: 1.279, per_step_time: 1471ms, lr: 2.310045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:26,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43840 samples/s/p 4:02:13 } +2024-07-25 21:07:29,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1497/ 1625], loss: 0.863, per_step_time: 1473ms, lr: 2.3095143e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:29,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.42826 samples/s/p 4:02:37 } +2024-07-25 21:07:31,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1499/ 1625], loss: 1.197, 
per_step_time: 1472ms, lr: 2.3089835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:31,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43476 samples/s/p 4:02:17 } +2024-07-25 21:07:34,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1501/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.3084529e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:34,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43528 samples/s/p 4:02:13 } +2024-07-25 21:07:37,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1503/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.307922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:37,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43684 samples/s/p 4:02:06 } +2024-07-25 21:07:40,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1505/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 2.3073904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:40,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43425 samples/s/p 4:02:10 } +2024-07-25 21:07:43,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1507/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 2.3068595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:43,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43826 samples/s/p 4:01:56 } +2024-07-25 21:07:46,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1509/ 1625], loss: 1.186, per_step_time: 1473ms, lr: 2.306328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:46,729 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43064 samples/s/p 4:02:13 } +2024-07-25 21:07:49,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1511/ 1625], loss: 1.307, per_step_time: 1470ms, lr: 2.3057966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:49,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43923 samples/s/p 4:01:47 } +2024-07-25 21:07:52,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1513/ 1625], loss: 1.062, per_step_time: 1473ms, lr: 2.3052648e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:52,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.42934 samples/s/p 4:02:11 } +2024-07-25 21:07:55,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1515/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 2.3047329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:55,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43245 samples/s/p 4:02:00 } +2024-07-25 21:07:58,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1517/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.3042008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:58,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43322 samples/s/p 4:01:55 } +2024-07-25 21:08:01,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1519/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.3036688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:01,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43189 samples/s/p 4:01:55 } +2024-07-25 
21:08:04,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1521/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.3031364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:04,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43770 samples/s/p 4:01:37 } +2024-07-25 21:08:07,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1523/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 2.302604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:07,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43666 samples/s/p 4:01:37 } +2024-07-25 21:08:10,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1525/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.3020715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:10,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43753 samples/s/p 4:01:31 } +2024-07-25 21:08:13,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1527/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 2.301539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:13,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43564 samples/s/p 4:01:33 } +2024-07-25 21:08:16,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1529/ 1625], loss: 1.072, per_step_time: 1473ms, lr: 2.301006e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:16,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43022 samples/s/p 4:01:45 } +2024-07-25 21:08:19,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1531/ 1625], loss: 1.217, 
per_step_time: 1472ms, lr: 2.300473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:19,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43470 samples/s/p 4:01:30 } +2024-07-25 21:08:22,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1533/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 2.29994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:22,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43116 samples/s/p 4:01:37 } +2024-07-25 21:08:25,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1535/ 1625], loss: 1.288, per_step_time: 1471ms, lr: 2.2994067e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:25,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43530 samples/s/p 4:01:23 } +2024-07-25 21:08:28,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1537/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 2.2988734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:28,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43818 samples/s/p 4:01:12 } +2024-07-25 21:08:30,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1539/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 2.2983397e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:30,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43740 samples/s/p 4:01:11 } +2024-07-25 21:08:33,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1541/ 1625], loss: 1.210, per_step_time: 1474ms, lr: 2.2978062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:33,952 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.42679 samples/s/p 4:01:36 } +2024-07-25 21:08:36,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1543/ 1625], loss: 1.156, per_step_time: 1473ms, lr: 2.2972723e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:36,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43091 samples/s/p 4:01:23 } +2024-07-25 21:08:39,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1545/ 1625], loss: 1.297, per_step_time: 1472ms, lr: 2.2967384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:39,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43316 samples/s/p 4:01:14 } +2024-07-25 21:08:42,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1547/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 2.2962042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:42,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43784 samples/s/p 4:00:58 } +2024-07-25 21:08:45,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1549/ 1625], loss: 1.301, per_step_time: 1471ms, lr: 2.2956701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:45,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43589 samples/s/p 4:01:00 } +2024-07-25 21:08:48,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1551/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 2.2951357e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:48,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43780 samples/s/p 4:00:52 } +2024-07-25 
21:08:51,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1553/ 1625], loss: 1.106, per_step_time: 1474ms, lr: 2.2946011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:51,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.42593 samples/s/p 4:01:21 } +2024-07-25 21:08:54,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1555/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.2940667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:54,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43342 samples/s/p 4:00:58 } +2024-07-25 21:08:57,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1557/ 1625], loss: 1.210, per_step_time: 1471ms, lr: 2.2935319e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:57,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43673 samples/s/p 4:00:46 } +2024-07-25 21:09:00,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1559/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.2929971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:00,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43333 samples/s/p 4:00:53 } +2024-07-25 21:09:03,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1561/ 1625], loss: 1.404, per_step_time: 1473ms, lr: 2.292462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:03,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43049 samples/s/p 4:00:57 } +2024-07-25 21:09:06,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1563/ 1625], loss: 1.004, 
per_step_time: 1472ms, lr: 2.2919272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:06,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43453 samples/s/p 4:00:43 } +2024-07-25 21:09:09,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1565/ 1625], loss: 1.079, per_step_time: 1471ms, lr: 2.2913915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:09,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43491 samples/s/p 4:00:39 } +2024-07-25 21:09:12,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1567/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 2.2908564e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:12,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43443 samples/s/p 4:00:38 } +2024-07-25 21:09:15,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1569/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 2.2903208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:15,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43228 samples/s/p 4:00:41 } +2024-07-25 21:09:18,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1571/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 2.2897852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:18,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43207 samples/s/p 4:00:38 } +2024-07-25 21:09:21,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1573/ 1625], loss: 1.202, per_step_time: 1472ms, lr: 2.2892493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:21,179 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43352 samples/s/p 4:00:31 } +2024-07-25 21:09:24,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1575/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 2.288713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:24,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43784 samples/s/p 4:00:17 } +2024-07-25 21:09:27,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1577/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.2881772e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:27,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43577 samples/s/p 4:00:20 } +2024-07-25 21:09:30,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1579/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 2.2876407e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:30,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43228 samples/s/p 4:00:26 } +2024-07-25 21:09:32,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1581/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 2.2871045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:32,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43068 samples/s/p 4:00:27 } +2024-07-25 21:09:35,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1583/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 2.286568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:35,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43333 samples/s/p 4:00:17 } +2024-07-25 
21:09:38,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1585/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.2860315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:38,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43557 samples/s/p 4:00:08 } +2024-07-25 21:09:41,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1587/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 2.2854943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:41,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43629 samples/s/p 4:00:03 } +2024-07-25 21:09:44,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1589/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.2849577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:44,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.42994 samples/s/p 4:00:17 } +2024-07-25 21:09:47,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1591/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.2844208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:47,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43759 samples/s/p 3:59:54 } +2024-07-25 21:09:50,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1593/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.2838836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:50,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43623 samples/s/p 3:59:55 } +2024-07-25 21:09:53,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1595/ 1625], loss: 1.215, 
per_step_time: 1470ms, lr: 2.283346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:53,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43915 samples/s/p 3:59:44 } +2024-07-25 21:09:56,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1597/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 2.2828086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:56,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43402 samples/s/p 3:59:55 } +2024-07-25 21:09:59,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1599/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 2.282271e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:59,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.44040 samples/s/p 3:59:35 } +2024-07-25 21:10:02,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1601/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 2.2817332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:02,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43703 samples/s/p 3:59:41 } +2024-07-25 21:10:05,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1603/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.2811953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:05,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43642 samples/s/p 3:59:40 } +2024-07-25 21:10:08,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1605/ 1625], loss: 1.096, per_step_time: 1470ms, lr: 2.2806575e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:08,387 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43892 samples/s/p 3:59:30 } +2024-07-25 21:10:11,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1607/ 1625], loss: 1.006, per_step_time: 1472ms, lr: 2.2801192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:11,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43417 samples/s/p 3:59:40 } +2024-07-25 21:10:14,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1609/ 1625], loss: 1.211, per_step_time: 1470ms, lr: 2.279581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:14,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.44061 samples/s/p 3:59:20 } +2024-07-25 21:10:17,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1611/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 2.2790426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:17,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43152 samples/s/p 3:59:41 } +2024-07-25 21:10:20,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1613/ 1625], loss: 1.236, per_step_time: 1476ms, lr: 2.278504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:20,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.41952 samples/s/p 4:00:10 } +2024-07-25 21:10:23,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1615/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.2779652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:23,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43663 samples/s/p 3:59:21 } +2024-07-25 
21:10:26,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1617/ 1625], loss: 0.985, per_step_time: 1472ms, lr: 2.2774264e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:26,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.43395 samples/s/p 3:59:25 } +2024-07-25 21:10:29,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1619/ 1625], loss: 1.268, per_step_time: 1470ms, lr: 2.2768874e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:29,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.43977 samples/s/p 3:59:07 } +2024-07-25 21:10:32,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1621/ 1625], loss: 1.014, per_step_time: 1472ms, lr: 2.2763483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:32,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.43454 samples/s/p 3:59:18 } +2024-07-25 21:10:34,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1623/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 2.2758091e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:34,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.43466 samples/s/p 3:59:15 } +2024-07-25 21:10:37,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1625/ 1625], loss: 1.401, per_step_time: 1470ms, lr: 2.2752696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:37,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.43901 samples/s/p 3:59:00 } +2024-07-25 21:10:40,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 2/ 1625], loss: 1.101, 
per_step_time: 1471ms, lr: 2.2747303e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:40,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.43498 samples/s/p 3:59:08 } +2024-07-25 21:10:43,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 4/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 2.2741906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:43,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.43450 samples/s/p 3:59:06 } +2024-07-25 21:10:46,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 6/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 2.2736509e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:46,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.42847 samples/s/p 3:59:19 } +2024-07-25 21:10:49,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 8/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 2.2731108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:49,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.43493 samples/s/p 3:58:59 } +2024-07-25 21:10:52,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 10/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.2725708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:52,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.43797 samples/s/p 3:58:48 } +2024-07-25 21:10:55,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 12/ 1625], loss: 1.227, per_step_time: 1478ms, lr: 2.2720307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:55,621 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.41163 samples/s/p 3:59:55 } +2024-07-25 21:10:58,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 14/ 1625], loss: 1.080, per_step_time: 1472ms, lr: 2.2714903e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:58,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.43421 samples/s/p 3:58:52 } +2024-07-25 21:11:01,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 16/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 2.27095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:01,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.42853 samples/s/p 3:59:04 } +2024-07-25 21:11:04,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 18/ 1625], loss: 1.031, per_step_time: 1471ms, lr: 2.2704093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:04,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.43515 samples/s/p 3:58:44 } +2024-07-25 21:11:07,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 20/ 1625], loss: 1.209, per_step_time: 1473ms, lr: 2.2698687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:07,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.42828 samples/s/p 3:58:59 } +2024-07-25 21:11:10,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 22/ 1625], loss: 1.210, per_step_time: 1469ms, lr: 2.2693279e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:10,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.44221 samples/s/p 3:58:20 } +2024-07-25 
21:11:13,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 24/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 2.268787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:13,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.43235 samples/s/p 3:58:43 } +2024-07-25 21:11:16,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 26/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 2.2682461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:16,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.44212 samples/s/p 3:58:14 } +2024-07-25 21:11:19,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 28/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 2.2677044e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:19,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43543 samples/s/p 3:58:29 } +2024-07-25 21:11:22,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 30/ 1625], loss: 1.344, per_step_time: 1474ms, lr: 2.2671631e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:22,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.42646 samples/s/p 3:58:49 } +2024-07-25 21:11:25,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 32/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.2666221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:25,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43314 samples/s/p 3:58:29 } +2024-07-25 21:11:28,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 34/ 1625], loss: 1.310, per_step_time: 
1472ms, lr: 2.2660804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:28,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43145 samples/s/p 3:58:30 } +2024-07-25 21:11:31,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 36/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.2655384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:31,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43533 samples/s/p 3:58:17 } +2024-07-25 21:11:33,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 38/ 1625], loss: 1.247, per_step_time: 1473ms, lr: 2.2649967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:33,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43046 samples/s/p 3:58:27 } +2024-07-25 21:11:36,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 40/ 1625], loss: 1.410, per_step_time: 1471ms, lr: 2.2644546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:36,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43787 samples/s/p 3:58:05 } +2024-07-25 21:11:39,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 42/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.2639124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:39,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43531 samples/s/p 3:58:08 } +2024-07-25 21:11:42,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 44/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 2.2633702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:42,842 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43942 samples/s/p 3:57:55 } +2024-07-25 21:11:45,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 46/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 2.2628277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:45,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43930 samples/s/p 3:57:52 } +2024-07-25 21:11:48,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 48/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 2.2622855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:48,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43602 samples/s/p 3:57:58 } +2024-07-25 21:11:51,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 50/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.2617425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:51,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.42901 samples/s/p 3:58:13 } +2024-07-25 21:11:54,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 52/ 1625], loss: 1.160, per_step_time: 1473ms, lr: 2.2611997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:54,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.42744 samples/s/p 3:58:14 } +2024-07-25 21:11:57,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 54/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.2606571e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:57,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43671 samples/s/p 3:57:47 } +2024-07-25 
21:12:00,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 56/ 1625], loss: 1.319, per_step_time: 1472ms, lr: 2.260114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:00,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43312 samples/s/p 3:57:53 } +2024-07-25 21:12:03,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 58/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 2.2595706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:03,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43596 samples/s/p 3:57:43 } +2024-07-25 21:12:06,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 60/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.2590275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:06,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43297 samples/s/p 3:57:48 } +2024-07-25 21:12:09,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 62/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.258484e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:09,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43387 samples/s/p 3:57:43 } +2024-07-25 21:12:12,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 64/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 2.2579403e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:12,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43669 samples/s/p 3:57:32 } +2024-07-25 21:12:15,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 66/ 1625], loss: 1.032, per_step_time: 
1471ms, lr: 2.2573966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:15,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43669 samples/s/p 3:57:29 } +2024-07-25 21:12:18,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 68/ 1625], loss: 1.121, per_step_time: 1477ms, lr: 2.2568527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:18,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.41612 samples/s/p 3:58:21 } +2024-07-25 21:12:21,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 70/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 2.2563088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:21,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43373 samples/s/p 3:57:31 } +2024-07-25 21:12:24,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 72/ 1625], loss: 1.486, per_step_time: 1471ms, lr: 2.2557646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:24,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43522 samples/s/p 3:57:24 } +2024-07-25 21:12:27,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 74/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 2.2552204e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:27,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43131 samples/s/p 3:57:32 } +2024-07-25 21:12:30,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 76/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 2.254676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:30,073 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43554 samples/s/p 3:57:18 } +2024-07-25 21:12:33,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 78/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.2541315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:33,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43760 samples/s/p 3:57:09 } +2024-07-25 21:12:35,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 80/ 1625], loss: 1.175, per_step_time: 1473ms, lr: 2.2535869e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:35,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43085 samples/s/p 3:57:24 } +2024-07-25 21:12:38,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 82/ 1625], loss: 1.286, per_step_time: 1471ms, lr: 2.2530421e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:38,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43666 samples/s/p 3:57:06 } +2024-07-25 21:12:41,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 84/ 1625], loss: 0.951, per_step_time: 1472ms, lr: 2.2524971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:41,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43297 samples/s/p 3:57:13 } +2024-07-25 21:12:44,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 86/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 2.2519522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:44,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43348 samples/s/p 3:57:08 } +2024-07-25 
21:12:47,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 88/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 2.251407e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:47,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.42781 samples/s/p 3:57:20 } +2024-07-25 21:12:50,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 90/ 1625], loss: 1.149, per_step_time: 1474ms, lr: 2.2508617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:50,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.42388 samples/s/p 3:57:28 } +2024-07-25 21:12:53,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 92/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 2.2503164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:53,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.44034 samples/s/p 3:56:42 } +2024-07-25 21:12:56,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 94/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 2.2497707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:56,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43417 samples/s/p 3:56:55 } +2024-07-25 21:12:59,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 96/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.2492251e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:59,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43568 samples/s/p 3:56:48 } +2024-07-25 21:13:02,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 98/ 1625], loss: 1.096, per_step_time: 
1471ms, lr: 2.2486793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:02,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43608 samples/s/p 3:56:44 } +2024-07-25 21:13:05,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 100/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 2.2481334e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:05,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43488 samples/s/p 3:56:44 } +2024-07-25 21:13:08,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 102/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.2475871e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:08,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43602 samples/s/p 3:56:38 } +2024-07-25 21:13:11,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 104/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 2.247041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:11,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.44187 samples/s/p 3:56:20 } +2024-07-25 21:13:14,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 106/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 2.2464947e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:14,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43878 samples/s/p 3:56:25 } +2024-07-25 21:13:17,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 108/ 1625], loss: 1.106, per_step_time: 1470ms, lr: 2.245948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:17,287 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.44191 samples/s/p 3:56:14 } +2024-07-25 21:13:20,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 110/ 1625], loss: 1.275, per_step_time: 1473ms, lr: 2.2454016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:20,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.42948 samples/s/p 3:56:43 } +2024-07-25 21:13:23,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 112/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.2448548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:23,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43779 samples/s/p 3:56:19 } +2024-07-25 21:13:26,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 114/ 1625], loss: 0.954, per_step_time: 1470ms, lr: 2.244308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:26,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43880 samples/s/p 3:56:13 } +2024-07-25 21:13:29,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 116/ 1625], loss: 1.193, per_step_time: 1473ms, lr: 2.2437613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:29,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.42976 samples/s/p 3:56:34 } +2024-07-25 21:13:32,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 118/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 2.243214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:32,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43011 samples/s/p 3:56:30 } +2024-07-25 
21:13:34,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 120/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 2.242667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:34,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43192 samples/s/p 3:56:22 } +2024-07-25 21:13:37,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 122/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 2.2421198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:37,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43316 samples/s/p 3:56:16 } +2024-07-25 21:13:40,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 124/ 1625], loss: 1.312, per_step_time: 1470ms, lr: 2.2415721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:40,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43934 samples/s/p 3:55:57 } +2024-07-25 21:13:43,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 126/ 1625], loss: 1.092, per_step_time: 1473ms, lr: 2.2410246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:43,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.42896 samples/s/p 3:56:21 } +2024-07-25 21:13:46,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 128/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.2404767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:46,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43281 samples/s/p 3:56:08 } +2024-07-25 21:13:49,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 130/ 1625], loss: 1.086, 
per_step_time: 1473ms, lr: 2.239929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:49,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.42826 samples/s/p 3:56:17 } +2024-07-25 21:13:52,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 132/ 1625], loss: 1.271, per_step_time: 1470ms, lr: 2.2393811e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:52,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43882 samples/s/p 3:55:47 } +2024-07-25 21:13:55,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 134/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.2388327e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:55,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43703 samples/s/p 3:55:48 } +2024-07-25 21:13:58,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 136/ 1625], loss: 1.397, per_step_time: 1472ms, lr: 2.2382847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:58,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43230 samples/s/p 3:55:58 } +2024-07-25 21:14:01,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 138/ 1625], loss: 1.244, per_step_time: 1471ms, lr: 2.2377366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:01,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43691 samples/s/p 3:55:43 } +2024-07-25 21:14:04,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 140/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 2.2371878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:04,508 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.44180 samples/s/p 3:55:27 } +2024-07-25 21:14:07,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 142/ 1625], loss: 1.356, per_step_time: 1473ms, lr: 2.2366394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:07,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43060 samples/s/p 3:55:53 } +2024-07-25 21:14:10,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 144/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.2360906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:10,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43338 samples/s/p 3:55:43 } +2024-07-25 21:14:13,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 146/ 1625], loss: 1.073, per_step_time: 1472ms, lr: 2.2355418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:13,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43453 samples/s/p 3:55:37 } +2024-07-25 21:14:16,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 148/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.2349928e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:16,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43364 samples/s/p 3:55:37 } +2024-07-25 21:14:19,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 150/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.2344437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:19,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43706 samples/s/p 3:55:25 } +2024-07-25 
21:14:22,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 152/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.2338943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:22,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43219 samples/s/p 3:55:34 } +2024-07-25 21:14:25,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 154/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 2.233345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:25,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43780 samples/s/p 3:55:17 } +2024-07-25 21:14:28,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 156/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.2327955e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:28,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43279 samples/s/p 3:55:27 } +2024-07-25 21:14:31,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 158/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 2.232246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:31,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.42936 samples/s/p 3:55:33 } +2024-07-25 21:14:34,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 160/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 2.2316963e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:34,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43532 samples/s/p 3:55:15 } +2024-07-25 21:14:36,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 162/ 1625], loss: 1.231, 
per_step_time: 1472ms, lr: 2.2311464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:36,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43421 samples/s/p 3:55:15 } +2024-07-25 21:14:39,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 164/ 1625], loss: 1.055, per_step_time: 1469ms, lr: 2.2305963e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:39,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.44309 samples/s/p 3:54:49 } +2024-07-25 21:14:42,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 166/ 1625], loss: 1.024, per_step_time: 1472ms, lr: 2.230046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:42,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43244 samples/s/p 3:55:13 } +2024-07-25 21:14:45,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 168/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 2.229496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:45,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43008 samples/s/p 3:55:16 } +2024-07-25 21:14:48,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 170/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.2289454e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:48,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43670 samples/s/p 3:54:56 } +2024-07-25 21:14:51,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 172/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 2.2283948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:51,731 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.43019 samples/s/p 3:55:10 } +2024-07-25 21:14:54,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 174/ 1625], loss: 1.076, per_step_time: 1470ms, lr: 2.2278444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:54,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.44035 samples/s/p 3:54:41 } +2024-07-25 21:14:57,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 176/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 2.2272936e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:57,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.43352 samples/s/p 3:54:56 } +2024-07-25 21:15:00,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 178/ 1625], loss: 1.280, per_step_time: 1471ms, lr: 2.2267428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:00,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.43550 samples/s/p 3:54:48 } +2024-07-25 21:15:03,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 180/ 1625], loss: 1.200, per_step_time: 1469ms, lr: 2.2261916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:03,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.44247 samples/s/p 3:54:27 } +2024-07-25 21:15:06,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 182/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.2256405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:06,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.43673 samples/s/p 3:54:39 } +2024-07-25 
21:15:09,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 184/ 1625], loss: 1.067, per_step_time: 1471ms, lr: 2.2250892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:09,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.43592 samples/s/p 3:54:38 } +2024-07-25 21:15:12,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 186/ 1625], loss: 1.024, per_step_time: 1470ms, lr: 2.2245378e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:12,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.44175 samples/s/p 3:54:20 } +2024-07-25 21:15:15,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 188/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 2.2239865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:15,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43733 samples/s/p 3:54:28 } +2024-07-25 21:15:18,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 190/ 1625], loss: 1.009, per_step_time: 1469ms, lr: 2.2234346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:18,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.44343 samples/s/p 3:54:09 } +2024-07-25 21:15:21,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 192/ 1625], loss: 1.009, per_step_time: 1471ms, lr: 2.2228829e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:21,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43544 samples/s/p 3:54:27 } +2024-07-25 21:15:24,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 194/ 1625], loss: 1.187, 
per_step_time: 1472ms, lr: 2.222331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:24,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43185 samples/s/p 3:54:34 } +2024-07-25 21:15:27,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 196/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.2217791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:27,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43286 samples/s/p 3:54:28 } +2024-07-25 21:15:30,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 198/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 2.2212269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:30,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43739 samples/s/p 3:54:13 } +2024-07-25 21:15:33,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 200/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 2.2206747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:33,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43429 samples/s/p 3:54:18 } +2024-07-25 21:15:35,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 202/ 1625], loss: 1.181, per_step_time: 1473ms, lr: 2.2201222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:35,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43059 samples/s/p 3:54:25 } +2024-07-25 21:15:38,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 204/ 1625], loss: 1.290, per_step_time: 1473ms, lr: 2.21957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:38,935 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43022 samples/s/p 3:54:23 } +2024-07-25 21:15:41,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 206/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 2.2190172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:41,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.44163 samples/s/p 3:53:51 } +2024-07-25 21:15:44,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 208/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 2.2184644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:44,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43419 samples/s/p 3:54:07 } +2024-07-25 21:15:47,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 210/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 2.2179118e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:47,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43198 samples/s/p 3:54:10 } +2024-07-25 21:15:50,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 212/ 1625], loss: 1.039, per_step_time: 1471ms, lr: 2.2173588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:50,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43667 samples/s/p 3:53:55 } +2024-07-25 21:15:53,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 214/ 1625], loss: 1.273, per_step_time: 1473ms, lr: 2.2168053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:53,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.42940 samples/s/p 3:54:10 } +2024-07-25 
21:15:56,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 216/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.2162525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:56,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43515 samples/s/p 3:53:53 } +2024-07-25 21:15:59,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 218/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 2.2156992e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:59,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43658 samples/s/p 3:53:46 } +2024-07-25 21:16:02,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 220/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 2.2151457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:02,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43709 samples/s/p 3:53:42 } +2024-07-25 21:16:05,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 222/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.214592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:05,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43643 samples/s/p 3:53:40 } +2024-07-25 21:16:08,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 224/ 1625], loss: 0.893, per_step_time: 1471ms, lr: 2.2140382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:08,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43693 samples/s/p 3:53:36 } +2024-07-25 21:16:11,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 226/ 1625], loss: 1.085, 
per_step_time: 1470ms, lr: 2.2134847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:11,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43954 samples/s/p 3:53:27 } +2024-07-25 21:16:14,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 228/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.2129307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:14,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43430 samples/s/p 3:53:37 } +2024-07-25 21:16:17,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 230/ 1625], loss: 0.865, per_step_time: 1471ms, lr: 2.2123762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:17,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43519 samples/s/p 3:53:32 } +2024-07-25 21:16:20,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 232/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 2.2118224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:20,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43245 samples/s/p 3:53:36 } +2024-07-25 21:16:23,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 234/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 2.211268e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:23,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43263 samples/s/p 3:53:33 } +2024-07-25 21:16:26,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 236/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 2.2107135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:26,149 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43335 samples/s/p 3:53:28 } +2024-07-25 21:16:29,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 238/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.210159e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:29,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43640 samples/s/p 3:53:17 } +2024-07-25 21:16:32,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 240/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 2.2096043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:32,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43613 samples/s/p 3:53:15 } +2024-07-25 21:16:34,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 242/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 2.2090495e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:34,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43604 samples/s/p 3:53:12 } +2024-07-25 21:16:37,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 244/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.2084943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:37,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43772 samples/s/p 3:53:05 } +2024-07-25 21:16:40,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 246/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.2079394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:40,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43550 samples/s/p 3:53:08 } +2024-07-25 
21:16:43,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 248/ 1625], loss: 1.072, per_step_time: 1472ms, lr: 2.2073842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:43,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43208 samples/s/p 3:53:13 } +2024-07-25 21:16:46,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 250/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 2.2068289e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:46,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43473 samples/s/p 3:53:04 } +2024-07-25 21:16:49,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 252/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 2.2062733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:49,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.44057 samples/s/p 3:52:46 } +2024-07-25 21:16:52,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 254/ 1625], loss: 1.130, per_step_time: 1473ms, lr: 2.2057178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:52,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.42927 samples/s/p 3:53:12 } +2024-07-25 21:16:55,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 256/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 2.2051621e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:55,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43233 samples/s/p 3:53:01 } +2024-07-25 21:16:58,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 258/ 1625], loss: 1.149, 
per_step_time: 1473ms, lr: 2.2046064e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:58,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.42895 samples/s/p 3:53:07 } +2024-07-25 21:17:01,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 260/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.2040504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:01,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43579 samples/s/p 3:52:46 } +2024-07-25 21:17:04,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 262/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 2.2034943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:04,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43380 samples/s/p 3:52:48 } +2024-07-25 21:17:07,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 264/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 2.2029382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:07,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43031 samples/s/p 3:52:54 } +2024-07-25 21:17:10,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 266/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 2.2023818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:10,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43202 samples/s/p 3:52:47 } +2024-07-25 21:17:13,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 268/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 2.2018256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:13,368 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.44045 samples/s/p 3:52:22 } +2024-07-25 21:17:16,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 270/ 1625], loss: 1.085, per_step_time: 1473ms, lr: 2.201269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:16,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43002 samples/s/p 3:52:46 } +2024-07-25 21:17:19,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 272/ 1625], loss: 1.076, per_step_time: 1470ms, lr: 2.2007122e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:19,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43949 samples/s/p 3:52:19 } +2024-07-25 21:17:22,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 274/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 2.2001554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:22,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43840 samples/s/p 3:52:19 } +2024-07-25 21:17:25,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 276/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 2.1995987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:25,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.44170 samples/s/p 3:52:07 } +2024-07-25 21:17:28,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 278/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 2.1990416e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:28,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43634 samples/s/p 3:52:18 } +2024-07-25 
21:17:31,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 280/ 1625], loss: 1.223, per_step_time: 1470ms, lr: 2.1984844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:31,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.44083 samples/s/p 3:52:04 } +2024-07-25 21:17:34,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 282/ 1625], loss: 1.264, per_step_time: 1472ms, lr: 2.1979271e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:34,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43268 samples/s/p 3:52:22 } +2024-07-25 21:17:36,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 284/ 1625], loss: 1.397, per_step_time: 1470ms, lr: 2.19737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:36,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43912 samples/s/p 3:52:02 } +2024-07-25 21:17:39,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 286/ 1625], loss: 1.279, per_step_time: 1475ms, lr: 2.1968124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:39,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.42161 samples/s/p 3:52:44 } +2024-07-25 21:17:42,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 288/ 1625], loss: 1.129, per_step_time: 1473ms, lr: 2.1962549e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:42,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43080 samples/s/p 3:52:18 } +2024-07-25 21:17:45,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 290/ 1625], loss: 1.272, 
per_step_time: 1471ms, lr: 2.195697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:45,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43771 samples/s/p 3:51:57 } +2024-07-25 21:17:48,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 292/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 2.1951395e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:48,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43846 samples/s/p 3:51:52 } +2024-07-25 21:17:51,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 294/ 1625], loss: 1.277, per_step_time: 1472ms, lr: 2.1945816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:51,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43200 samples/s/p 3:52:06 } +2024-07-25 21:17:54,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 296/ 1625], loss: 1.111, per_step_time: 1473ms, lr: 2.1940232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:54,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.42929 samples/s/p 3:52:10 } +2024-07-25 21:17:57,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 298/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 2.1934653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:57,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43671 samples/s/p 3:51:48 } +2024-07-25 21:18:00,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 300/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 2.192907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:00,583 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43526 samples/s/p 3:51:49 } +2024-07-25 21:18:03,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 302/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.1923484e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:03,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.43542 samples/s/p 3:51:45 } +2024-07-25 21:18:06,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 304/ 1625], loss: 1.182, per_step_time: 1473ms, lr: 2.1917898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:06,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.42845 samples/s/p 3:52:00 } +2024-07-25 21:18:09,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 306/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 2.1912314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:09,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.43218 samples/s/p 3:51:48 } +2024-07-25 21:18:12,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 308/ 1625], loss: 1.331, per_step_time: 1473ms, lr: 2.1906724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:12,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.42832 samples/s/p 3:51:55 } +2024-07-25 21:18:15,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 310/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 2.1901134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:15,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.43417 samples/s/p 3:51:37 } +2024-07-25 
21:18:18,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 312/ 1625], loss: 1.112, per_step_time: 1474ms, lr: 2.1895545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:18,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.42732 samples/s/p 3:51:51 } +2024-07-25 21:18:21,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 314/ 1625], loss: 1.071, per_step_time: 1477ms, lr: 2.1889953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:21,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.41480 samples/s/p 3:52:21 } +2024-07-25 21:18:24,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 316/ 1625], loss: 1.104, per_step_time: 1470ms, lr: 2.1884363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:24,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.44101 samples/s/p 3:51:10 } +2024-07-25 21:18:27,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 318/ 1625], loss: 1.022, per_step_time: 1472ms, lr: 2.1878766e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:27,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.43395 samples/s/p 3:51:26 } +2024-07-25 21:18:30,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 320/ 1625], loss: 1.065, per_step_time: 1473ms, lr: 2.1873175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:30,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.43020 samples/s/p 3:51:32 } +2024-07-25 21:18:33,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 322/ 1625], loss: 1.218, 
per_step_time: 1473ms, lr: 2.186758e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:33,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.42967 samples/s/p 3:51:31 } +2024-07-25 21:18:36,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 324/ 1625], loss: 0.832, per_step_time: 1471ms, lr: 2.1861983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:36,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.43503 samples/s/p 3:51:14 } +2024-07-25 21:18:38,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 326/ 1625], loss: 1.284, per_step_time: 1470ms, lr: 2.1856382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:38,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.43956 samples/s/p 3:50:59 } +2024-07-25 21:18:41,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 328/ 1625], loss: 1.301, per_step_time: 1470ms, lr: 2.1850783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:41,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.43849 samples/s/p 3:50:59 } +2024-07-25 21:18:44,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 330/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.1845182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:44,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.43426 samples/s/p 3:51:07 } +2024-07-25 21:18:47,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 332/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 2.183958e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:47,821 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.43478 samples/s/p 3:51:03 } +2024-07-25 21:18:50,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 334/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.1833976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:50,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43619 samples/s/p 3:50:56 } +2024-07-25 21:18:53,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 336/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 2.1828373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:53,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43984 samples/s/p 3:50:44 } +2024-07-25 21:18:56,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 338/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 2.1822767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:56,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43831 samples/s/p 3:50:45 } +2024-07-25 21:18:59,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 340/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 2.1817159e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:59,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43397 samples/s/p 3:50:53 } +2024-07-25 21:19:02,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 342/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 2.1811553e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:02,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43886 samples/s/p 3:50:38 } 
+2024-07-25 21:19:05,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 344/ 1625], loss: 1.367, per_step_time: 1471ms, lr: 2.1805943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:05,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43644 samples/s/p 3:50:41 } +2024-07-25 21:19:08,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 346/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 2.1800332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:08,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43523 samples/s/p 3:50:41 } +2024-07-25 21:19:11,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 348/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 2.1794722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:11,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43882 samples/s/p 3:50:29 } +2024-07-25 21:19:14,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 350/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 2.1789108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:14,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43871 samples/s/p 3:50:26 } +2024-07-25 21:19:17,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 352/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 2.1783495e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:17,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43435 samples/s/p 3:50:34 } +2024-07-25 21:19:20,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 354/ 1625], loss: 
1.221, per_step_time: 1471ms, lr: 2.177788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:20,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43790 samples/s/p 3:50:22 } +2024-07-25 21:19:23,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 356/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 2.1772265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:23,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.44075 samples/s/p 3:50:12 } +2024-07-25 21:19:26,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 358/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 2.1766646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:26,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43362 samples/s/p 3:50:27 } +2024-07-25 21:19:29,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 360/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 2.1761029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:29,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43503 samples/s/p 3:50:21 } +2024-07-25 21:19:32,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 362/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 2.1755408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:32,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43061 samples/s/p 3:50:29 } +2024-07-25 21:19:35,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 364/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 2.1749787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:35,020 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.44024 samples/s/p 3:50:02 } +2024-07-25 21:19:37,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 366/ 1625], loss: 1.285, per_step_time: 1471ms, lr: 2.1744167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:37,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43536 samples/s/p 3:50:11 } +2024-07-25 21:19:40,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 368/ 1625], loss: 1.078, per_step_time: 1470ms, lr: 2.1738544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:40,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.44143 samples/s/p 3:49:53 } +2024-07-25 21:19:43,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 370/ 1625], loss: 1.036, per_step_time: 1471ms, lr: 2.173292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:43,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43540 samples/s/p 3:50:05 } +2024-07-25 21:19:46,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 372/ 1625], loss: 0.984, per_step_time: 1469ms, lr: 2.1727295e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:46,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.44471 samples/s/p 3:49:39 } +2024-07-25 21:19:49,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 374/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.1721668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:49,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43608 samples/s/p 3:49:58 } 
+2024-07-25 21:19:52,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 376/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 2.1716038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:52,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43321 samples/s/p 3:50:02 } +2024-07-25 21:19:55,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 378/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.171041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:55,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43374 samples/s/p 3:49:58 } +2024-07-25 21:19:58,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 380/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.170478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:58,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43743 samples/s/p 3:49:45 } +2024-07-25 21:20:01,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 382/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 2.1699154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:01,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43188 samples/s/p 3:49:57 } +2024-07-25 21:20:04,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 384/ 1625], loss: 1.186, per_step_time: 1469ms, lr: 2.169352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:04,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.44387 samples/s/p 3:49:23 } +2024-07-25 21:20:07,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 386/ 1625], loss: 
1.215, per_step_time: 1474ms, lr: 2.1687883e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:07,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.42613 samples/s/p 3:50:05 } +2024-07-25 21:20:10,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 388/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.1682252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:10,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43562 samples/s/p 3:49:38 } +2024-07-25 21:20:13,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 390/ 1625], loss: 1.114, per_step_time: 1473ms, lr: 2.1676618e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:13,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.42971 samples/s/p 3:49:50 } +2024-07-25 21:20:16,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 392/ 1625], loss: 1.020, per_step_time: 1473ms, lr: 2.1670981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:16,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.42944 samples/s/p 3:49:48 } +2024-07-25 21:20:19,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 394/ 1625], loss: 1.016, per_step_time: 1473ms, lr: 2.1665343e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:19,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43042 samples/s/p 3:49:43 } +2024-07-25 21:20:22,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 396/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 2.1659704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:22,234 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43845 samples/s/p 3:49:19 } +2024-07-25 21:20:25,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 398/ 1625], loss: 1.132, per_step_time: 1473ms, lr: 2.1654067e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:25,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43009 samples/s/p 3:49:38 } +2024-07-25 21:20:28,140 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 400/ 1625], loss: 1.293, per_step_time: 1473ms, lr: 2.1648422e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:28,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.43079 samples/s/p 3:49:33 } +2024-07-25 21:20:31,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 402/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 2.164278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:31,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.43423 samples/s/p 3:49:21 } +2024-07-25 21:20:34,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 404/ 1625], loss: 1.232, per_step_time: 1474ms, lr: 2.1637139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:34,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.42424 samples/s/p 3:49:44 } +2024-07-25 21:20:36,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 406/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 2.1631497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:36,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.44036 samples/s/p 3:49:00 } 
+2024-07-25 21:20:39,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 408/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 2.1625845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:39,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.43156 samples/s/p 3:49:19 } +2024-07-25 21:20:42,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 410/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.1620202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:42,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.43559 samples/s/p 3:49:06 } +2024-07-25 21:20:45,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 412/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 2.1614554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:45,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.44015 samples/s/p 3:48:51 } +2024-07-25 21:20:48,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 414/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.1608905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:48,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.42988 samples/s/p 3:49:14 } +2024-07-25 21:20:51,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 416/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 2.1603255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:51,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43937 samples/s/p 3:48:48 } +2024-07-25 21:20:54,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 418/ 1625], loss: 
1.063, per_step_time: 1471ms, lr: 2.1597603e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:54,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43786 samples/s/p 3:48:48 } +2024-07-25 21:20:57,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 420/ 1625], loss: 1.136, per_step_time: 1473ms, lr: 2.159195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:57,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.42833 samples/s/p 3:49:10 } +2024-07-25 21:21:00,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 422/ 1625], loss: 1.040, per_step_time: 1471ms, lr: 2.1586296e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:00,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43687 samples/s/p 3:48:45 } +2024-07-25 21:21:03,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 424/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.1580643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:03,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43785 samples/s/p 3:48:40 } +2024-07-25 21:21:06,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 426/ 1625], loss: 1.124, per_step_time: 1470ms, lr: 2.1574986e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:06,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.44180 samples/s/p 3:48:27 } +2024-07-25 21:21:09,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 428/ 1625], loss: 1.040, per_step_time: 1470ms, lr: 2.1569329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:09,450 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43879 samples/s/p 3:48:31 } +2024-07-25 21:21:12,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 430/ 1625], loss: 1.228, per_step_time: 1470ms, lr: 2.1563672e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:12,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43995 samples/s/p 3:48:26 } +2024-07-25 21:21:15,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 432/ 1625], loss: 1.040, per_step_time: 1470ms, lr: 2.1558013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:15,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.44165 samples/s/p 3:48:18 } +2024-07-25 21:21:18,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 434/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 2.1552352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:18,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.43334 samples/s/p 3:48:36 } +2024-07-25 21:21:21,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 436/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 2.1546688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:21,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.43675 samples/s/p 3:48:25 } +2024-07-25 21:21:24,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 438/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 2.1541025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:24,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.42827 samples/s/p 3:48:43 } 
+2024-07-25 21:21:27,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 440/ 1625], loss: 1.314, per_step_time: 1472ms, lr: 2.1535363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:27,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.43399 samples/s/p 3:48:26 } +2024-07-25 21:21:30,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 442/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.1529699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:30,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.43477 samples/s/p 3:48:21 } +2024-07-25 21:21:33,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 444/ 1625], loss: 1.197, per_step_time: 1473ms, lr: 2.1524032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:33,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.42940 samples/s/p 3:48:32 } +2024-07-25 21:21:36,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 446/ 1625], loss: 1.057, per_step_time: 1469ms, lr: 2.1518365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:36,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.44262 samples/s/p 3:47:55 } +2024-07-25 21:21:38,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 448/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 2.1512697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:38,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43464 samples/s/p 3:48:12 } +2024-07-25 21:21:41,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 450/ 1625], loss: 
1.106, per_step_time: 1472ms, lr: 2.1507029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:41,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43159 samples/s/p 3:48:17 } +2024-07-25 21:21:44,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 452/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 2.1501357e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:44,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43309 samples/s/p 3:48:10 } +2024-07-25 21:21:47,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 454/ 1625], loss: 1.194, per_step_time: 1474ms, lr: 2.1495687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:47,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.42579 samples/s/p 3:48:26 } +2024-07-25 21:21:50,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 456/ 1625], loss: 1.305, per_step_time: 1471ms, lr: 2.1490014e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:50,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43509 samples/s/p 3:47:59 } +2024-07-25 21:21:53,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 458/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.148434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:53,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43179 samples/s/p 3:48:05 } +2024-07-25 21:21:56,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 460/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 2.1478665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:56,670 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43751 samples/s/p 3:47:48 } +2024-07-25 21:21:59,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 462/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.147299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:59,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43629 samples/s/p 3:47:48 } +2024-07-25 21:22:02,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 464/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.1467313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:02,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43457 samples/s/p 3:47:49 } +2024-07-25 21:22:05,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 466/ 1625], loss: 0.995, per_step_time: 1473ms, lr: 2.1461634e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:05,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.42969 samples/s/p 3:47:58 } +2024-07-25 21:22:08,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 468/ 1625], loss: 1.279, per_step_time: 1471ms, lr: 2.1455955e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:08,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43480 samples/s/p 3:47:43 } +2024-07-25 21:22:11,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 470/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 2.1450276e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:11,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43652 samples/s/p 3:47:35 } 
+2024-07-25 21:22:14,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 472/ 1625], loss: 0.970, per_step_time: 1472ms, lr: 2.1444595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:14,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43352 samples/s/p 3:47:40 } +2024-07-25 21:22:17,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 474/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 2.143891e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:17,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.44131 samples/s/p 3:47:17 } +2024-07-25 21:22:20,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 476/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 2.1433229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:20,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43530 samples/s/p 3:47:30 } +2024-07-25 21:22:23,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 478/ 1625], loss: 1.252, per_step_time: 1473ms, lr: 2.1427542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:23,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43098 samples/s/p 3:47:37 } +2024-07-25 21:22:26,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 480/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.1421858e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:26,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43618 samples/s/p 3:47:21 } +2024-07-25 21:22:29,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 482/ 1625], loss: 
1.258, per_step_time: 1470ms, lr: 2.141617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:29,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43877 samples/s/p 3:47:12 } +2024-07-25 21:22:32,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 484/ 1625], loss: 1.018, per_step_time: 1469ms, lr: 2.1410482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:32,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.44306 samples/s/p 3:46:58 } +2024-07-25 21:22:35,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 486/ 1625], loss: 1.282, per_step_time: 1468ms, lr: 2.1404794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:35,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.44695 samples/s/p 3:46:46 } +2024-07-25 21:22:37,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 488/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 2.1399102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:37,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43510 samples/s/p 3:47:12 } +2024-07-25 21:22:40,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 490/ 1625], loss: 1.232, per_step_time: 1470ms, lr: 2.139341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:40,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.44096 samples/s/p 3:46:55 } +2024-07-25 21:22:43,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 492/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.1387721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:43,868 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43381 samples/s/p 3:47:10 } +2024-07-25 21:22:46,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 494/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 2.1382028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:46,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43316 samples/s/p 3:47:08 } +2024-07-25 21:22:49,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 496/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 2.137633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:49,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43738 samples/s/p 3:46:55 } +2024-07-25 21:22:52,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 498/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 2.1370637e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:52,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43483 samples/s/p 3:46:58 } +2024-07-25 21:22:55,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 500/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.136494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:55,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43737 samples/s/p 3:46:49 } +2024-07-25 21:22:55,671 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 21:23:31,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 502/ 1625], loss: 1.250, per_step_time: 2789ms, lr: 2.1359243e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:31,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 2.86764 samples/s/p 7:09:59 } +2024-07-25 21:23:34,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 504/ 1625], loss: 1.230, per_step_time: 1475ms, lr: 2.1353544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:34,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.42043 samples/s/p 3:47:26 } +2024-07-25 21:23:37,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 506/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.1347843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:37,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43564 samples/s/p 3:46:45 } +2024-07-25 21:23:40,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 508/ 1625], loss: 1.331, per_step_time: 1473ms, lr: 2.1342143e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:40,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43064 samples/s/p 3:46:54 } +2024-07-25 21:23:43,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 510/ 1625], loss: 1.052, per_step_time: 1471ms, lr: 2.133644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:43,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43568 samples/s/p 3:46:39 } +2024-07-25 21:23:46,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 512/ 1625], loss: 
1.202, per_step_time: 1473ms, lr: 2.1330738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:46,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43039 samples/s/p 3:46:49 } +2024-07-25 21:23:49,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 514/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 2.1325033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:49,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43808 samples/s/p 3:46:27 } +2024-07-25 21:23:52,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 516/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 2.1319329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:52,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43230 samples/s/p 3:46:38 } +2024-07-25 21:23:54,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 518/ 1625], loss: 1.164, per_step_time: 1472ms, lr: 2.1313623e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:54,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43166 samples/s/p 3:46:37 } +2024-07-25 21:23:57,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 520/ 1625], loss: 1.310, per_step_time: 1473ms, lr: 2.1307915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:57,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43034 samples/s/p 3:46:37 } +2024-07-25 21:24:00,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 522/ 1625], loss: 1.320, per_step_time: 1471ms, lr: 2.1302207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:00,889 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43806 samples/s/p 3:46:15 } +2024-07-25 21:24:03,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 524/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 2.1296497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:03,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43635 samples/s/p 3:46:16 } +2024-07-25 21:24:06,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 526/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 2.1290785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:06,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43404 samples/s/p 3:46:19 } +2024-07-25 21:24:09,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 528/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.1285074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:09,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43742 samples/s/p 3:46:08 } +2024-07-25 21:24:12,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 530/ 1625], loss: 1.178, per_step_time: 1469ms, lr: 2.1279362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:12,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.44379 samples/s/p 3:45:49 } +2024-07-25 21:24:15,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 532/ 1625], loss: 1.005, per_step_time: 1470ms, lr: 2.1273649e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:15,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43922 samples/s/p 3:45:57 } 
+2024-07-25 21:24:18,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 534/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 2.1267933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:18,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43539 samples/s/p 3:46:04 } +2024-07-25 21:24:21,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 536/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 2.1262214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:21,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43552 samples/s/p 3:46:01 } +2024-07-25 21:24:24,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 538/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 2.1256501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:24,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43542 samples/s/p 3:45:58 } +2024-07-25 21:24:27,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 540/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 2.125078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:27,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43591 samples/s/p 3:45:54 } +2024-07-25 21:24:30,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 542/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 2.1245063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:30,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43615 samples/s/p 3:45:50 } +2024-07-25 21:24:33,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 544/ 1625], loss: 
1.255, per_step_time: 1472ms, lr: 2.1239342e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:33,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43305 samples/s/p 3:45:55 } +2024-07-25 21:24:36,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 546/ 1625], loss: 1.232, per_step_time: 1470ms, lr: 2.1233622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:36,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.44038 samples/s/p 3:45:34 } +2024-07-25 21:24:39,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 548/ 1625], loss: 1.336, per_step_time: 1472ms, lr: 2.12279e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:39,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43361 samples/s/p 3:45:48 } +2024-07-25 21:24:42,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 550/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 2.1222175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:42,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43890 samples/s/p 3:45:32 } +2024-07-25 21:24:45,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 552/ 1625], loss: 0.972, per_step_time: 1471ms, lr: 2.121645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:45,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43720 samples/s/p 3:45:33 } +2024-07-25 21:24:48,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 554/ 1625], loss: 0.905, per_step_time: 1470ms, lr: 2.1210728e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:48,085 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43894 samples/s/p 3:45:26 } +2024-07-25 21:24:51,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 556/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 2.1204998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:51,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43205 samples/s/p 3:45:40 } +2024-07-25 21:24:53,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 558/ 1625], loss: 1.230, per_step_time: 1470ms, lr: 2.119927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:53,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.44007 samples/s/p 3:45:17 } +2024-07-25 21:24:56,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 560/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.1193544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:56,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43360 samples/s/p 3:45:30 } +2024-07-25 21:24:59,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 562/ 1625], loss: 1.079, per_step_time: 1470ms, lr: 2.1187814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:59,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43858 samples/s/p 3:45:15 } +2024-07-25 21:25:02,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 564/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 2.118208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:02,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43885 samples/s/p 3:45:11 } +2024-07-25 
21:25:05,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 566/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 2.1176353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:05,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.44215 samples/s/p 3:45:00 } +2024-07-25 21:25:08,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 568/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 2.117062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:08,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43327 samples/s/p 3:45:19 } +2024-07-25 21:25:11,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 570/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 2.1164886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:11,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.42864 samples/s/p 3:45:28 } +2024-07-25 21:25:14,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 572/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 2.1159149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:14,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43281 samples/s/p 3:45:14 } +2024-07-25 21:25:17,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 574/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.1153413e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:17,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43417 samples/s/p 3:45:08 } +2024-07-25 21:25:20,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 576/ 1625], loss: 1.275, 
per_step_time: 1473ms, lr: 2.1147678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:20,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43104 samples/s/p 3:45:13 } +2024-07-25 21:25:23,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 578/ 1625], loss: 0.930, per_step_time: 1469ms, lr: 2.1141937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:23,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.44420 samples/s/p 3:44:37 } +2024-07-25 21:25:26,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 580/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 2.1136198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:26,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.43338 samples/s/p 3:45:01 } +2024-07-25 21:25:29,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 582/ 1625], loss: 1.226, per_step_time: 1475ms, lr: 2.113046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:29,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.42371 samples/s/p 3:45:22 } +2024-07-25 21:25:32,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 584/ 1625], loss: 1.101, per_step_time: 1473ms, lr: 2.1124719e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:32,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.42830 samples/s/p 3:45:08 } +2024-07-25 21:25:35,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 586/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.1118974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:35,305 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.43356 samples/s/p 3:44:52 } +2024-07-25 21:25:38,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 588/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.1113232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:38,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.43811 samples/s/p 3:44:38 } +2024-07-25 21:25:41,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 590/ 1625], loss: 1.181, per_step_time: 1473ms, lr: 2.110749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:41,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.42993 samples/s/p 3:44:55 } +2024-07-25 21:25:44,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 592/ 1625], loss: 1.174, per_step_time: 1473ms, lr: 2.1101741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:44,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.42855 samples/s/p 3:44:56 } +2024-07-25 21:25:47,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 594/ 1625], loss: 0.993, per_step_time: 1472ms, lr: 2.1095995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:47,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.43457 samples/s/p 3:44:38 } +2024-07-25 21:25:50,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 596/ 1625], loss: 1.296, per_step_time: 1471ms, lr: 2.1090249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:50,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.43575 samples/s/p 3:44:32 } 
+2024-07-25 21:25:53,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 598/ 1625], loss: 1.360, per_step_time: 1470ms, lr: 2.1084501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:53,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.44021 samples/s/p 3:44:18 } +2024-07-25 21:25:55,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 600/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 2.107875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:55,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.44031 samples/s/p 3:44:15 } +2024-07-25 21:25:58,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 602/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.1073e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:58,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.43669 samples/s/p 3:44:21 } +2024-07-25 21:26:01,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 604/ 1625], loss: 1.125, per_step_time: 1473ms, lr: 2.106725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:01,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.42800 samples/s/p 3:44:39 } +2024-07-25 21:26:04,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 606/ 1625], loss: 1.317, per_step_time: 1472ms, lr: 2.1061498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:04,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.43120 samples/s/p 3:44:28 } +2024-07-25 21:26:07,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 608/ 1625], loss: 
1.133, per_step_time: 1473ms, lr: 2.1055741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:07,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.42829 samples/s/p 3:44:33 } +2024-07-25 21:26:10,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 610/ 1625], loss: 1.201, per_step_time: 1470ms, lr: 2.104999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:10,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.44151 samples/s/p 3:43:57 } +2024-07-25 21:26:13,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 612/ 1625], loss: 1.081, per_step_time: 1469ms, lr: 2.1044234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:13,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.44354 samples/s/p 3:43:49 } +2024-07-25 21:26:16,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 614/ 1625], loss: 1.191, per_step_time: 1470ms, lr: 2.1038477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:16,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43919 samples/s/p 3:43:57 } +2024-07-25 21:26:19,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 616/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 2.1032718e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:19,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43484 samples/s/p 3:44:05 } +2024-07-25 21:26:22,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 618/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.1026959e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:22,517 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43303 samples/s/p 3:44:06 } +2024-07-25 21:26:25,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 620/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 2.1021202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:25,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43580 samples/s/p 3:43:56 } +2024-07-25 21:26:28,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 622/ 1625], loss: 1.302, per_step_time: 1472ms, lr: 2.101544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:28,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43468 samples/s/p 3:43:56 } +2024-07-25 21:26:31,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 624/ 1625], loss: 1.141, per_step_time: 1475ms, lr: 2.1009677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:31,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.42288 samples/s/p 3:44:22 } +2024-07-25 21:26:34,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 626/ 1625], loss: 1.191, per_step_time: 1474ms, lr: 2.1003914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:34,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.42392 samples/s/p 3:44:17 } +2024-07-25 21:26:37,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 628/ 1625], loss: 1.325, per_step_time: 1484ms, lr: 2.0998152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:37,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.38973 samples/s/p 3:45:39 } 
+2024-07-25 21:26:40,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 630/ 1625], loss: 0.967, per_step_time: 1469ms, lr: 2.0992386e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:40,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.44238 samples/s/p 3:43:25 } +2024-07-25 21:26:43,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 632/ 1625], loss: 1.023, per_step_time: 1470ms, lr: 2.0986621e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:43,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.44085 samples/s/p 3:43:26 } +2024-07-25 21:26:46,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 634/ 1625], loss: 1.285, per_step_time: 1477ms, lr: 2.0980855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:46,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.41382 samples/s/p 3:44:30 } +2024-07-25 21:26:49,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 636/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.0975087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:49,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.43825 samples/s/p 3:43:27 } +2024-07-25 21:26:52,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 638/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 2.0969317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:52,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.43610 samples/s/p 3:43:29 } +2024-07-25 21:26:55,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 640/ 1625], loss: 
1.043, per_step_time: 1472ms, lr: 2.0963547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:55,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.43469 samples/s/p 3:43:30 } +2024-07-25 21:26:57,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 642/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 2.0957777e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:57,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.43292 samples/s/p 3:43:31 } +2024-07-25 21:27:00,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 644/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.0952004e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:00,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.43155 samples/s/p 3:43:31 } +2024-07-25 21:27:03,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 646/ 1625], loss: 0.978, per_step_time: 1472ms, lr: 2.094623e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:03,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.43190 samples/s/p 3:43:28 } +2024-07-25 21:27:06,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 648/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.0940459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:06,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.43822 samples/s/p 3:43:09 } +2024-07-25 21:27:09,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 650/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 2.0934684e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:09,777 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.42986 samples/s/p 3:43:27 } +2024-07-25 21:27:12,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 652/ 1625], loss: 0.972, per_step_time: 1473ms, lr: 2.0928905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:12,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.43031 samples/s/p 3:43:23 } +2024-07-25 21:27:15,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 654/ 1625], loss: 1.386, per_step_time: 1470ms, lr: 2.0923131e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:15,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.43896 samples/s/p 3:42:59 } +2024-07-25 21:27:18,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 656/ 1625], loss: 0.980, per_step_time: 1473ms, lr: 2.0917352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:18,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.42914 samples/s/p 3:43:20 } +2024-07-25 21:27:21,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 658/ 1625], loss: 1.278, per_step_time: 1473ms, lr: 2.0911573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:21,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.42795 samples/s/p 3:43:20 } +2024-07-25 21:27:24,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 660/ 1625], loss: 1.027, per_step_time: 1482ms, lr: 2.0905793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:24,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.39482 samples/s/p 3:44:39 } 
+2024-07-25 21:27:27,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 662/ 1625], loss: 1.356, per_step_time: 1473ms, lr: 2.0900014e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:27,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.42851 samples/s/p 3:43:13 } +2024-07-25 21:27:30,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 664/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 2.0894231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:30,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43997 samples/s/p 3:42:41 } +2024-07-25 21:27:33,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 666/ 1625], loss: 1.173, per_step_time: 1470ms, lr: 2.0888447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:33,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43879 samples/s/p 3:42:41 } +2024-07-25 21:27:36,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 668/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.0882664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:36,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43563 samples/s/p 3:42:46 } +2024-07-25 21:27:39,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 670/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 2.087688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:39,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43372 samples/s/p 3:42:48 } +2024-07-25 21:27:42,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 672/ 1625], 
loss: 1.095, per_step_time: 1470ms, lr: 2.0871095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:42,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43908 samples/s/p 3:42:32 } +2024-07-25 21:27:45,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 674/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 2.0865305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:45,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43086 samples/s/p 3:42:49 } +2024-07-25 21:27:48,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 676/ 1625], loss: 0.871, per_step_time: 1471ms, lr: 2.085952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:48,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43777 samples/s/p 3:42:29 } +2024-07-25 21:27:51,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 678/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 2.085373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:51,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43681 samples/s/p 3:42:28 } +2024-07-25 21:27:54,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 680/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 2.0847941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:54,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43366 samples/s/p 3:42:33 } +2024-07-25 21:27:57,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 682/ 1625], loss: 1.056, per_step_time: 1473ms, lr: 2.084215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:57,024 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.42859 samples/s/p 3:42:43 } +2024-07-25 21:27:59,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 684/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 2.0836358e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:59,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43618 samples/s/p 3:42:21 } +2024-07-25 21:28:02,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 686/ 1625], loss: 1.146, per_step_time: 1470ms, lr: 2.0830565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:02,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.44163 samples/s/p 3:42:05 } +2024-07-25 21:28:05,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 688/ 1625], loss: 1.201, per_step_time: 1471ms, lr: 2.0824771e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:05,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43580 samples/s/p 3:42:16 } +2024-07-25 21:28:08,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 690/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 2.0818976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:08,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43609 samples/s/p 3:42:13 } +2024-07-25 21:28:11,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 692/ 1625], loss: 1.278, per_step_time: 1470ms, lr: 2.081318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:11,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43936 samples/s/p 3:42:02 } 
+2024-07-25 21:28:14,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 694/ 1625], loss: 1.112, per_step_time: 1469ms, lr: 2.0807383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:14,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.44226 samples/s/p 3:41:52 } +2024-07-25 21:28:17,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 696/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 2.0801584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:17,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43692 samples/s/p 3:42:02 } +2024-07-25 21:28:20,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 698/ 1625], loss: 1.093, per_step_time: 1474ms, lr: 2.0795787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:20,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.42678 samples/s/p 3:42:24 } +2024-07-25 21:28:23,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 700/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 2.0789988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:23,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43317 samples/s/p 3:42:05 } +2024-07-25 21:28:26,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 702/ 1625], loss: 0.915, per_step_time: 1471ms, lr: 2.0784188e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:26,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43491 samples/s/p 3:41:58 } +2024-07-25 21:28:29,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 704/ 1625], 
loss: 1.225, per_step_time: 1472ms, lr: 2.0778387e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:29,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43197 samples/s/p 3:42:02 } +2024-07-25 21:28:32,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 706/ 1625], loss: 1.000, per_step_time: 1471ms, lr: 2.0772584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:32,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43829 samples/s/p 3:41:44 } +2024-07-25 21:28:35,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 708/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 2.076678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:35,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43794 samples/s/p 3:41:42 } +2024-07-25 21:28:38,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 710/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.0760977e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:38,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43298 samples/s/p 3:41:51 } +2024-07-25 21:28:41,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 712/ 1625], loss: 1.262, per_step_time: 1472ms, lr: 2.075517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:41,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43158 samples/s/p 3:41:51 } +2024-07-25 21:28:44,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 714/ 1625], loss: 1.122, per_step_time: 1473ms, lr: 2.0749363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:44,237 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.42947 samples/s/p 3:41:54 } +2024-07-25 21:28:47,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 716/ 1625], loss: 1.010, per_step_time: 1472ms, lr: 2.0743557e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:47,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43164 samples/s/p 3:41:45 } +2024-07-25 21:28:50,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 718/ 1625], loss: 1.174, per_step_time: 1474ms, lr: 2.0737749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:50,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.42466 samples/s/p 3:41:59 } +2024-07-25 21:28:53,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 720/ 1625], loss: 1.335, per_step_time: 1472ms, lr: 2.0731939e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:53,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43243 samples/s/p 3:41:37 } +2024-07-25 21:28:56,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 722/ 1625], loss: 0.934, per_step_time: 1471ms, lr: 2.0726127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:56,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43630 samples/s/p 3:41:25 } +2024-07-25 21:28:58,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 724/ 1625], loss: 1.010, per_step_time: 1471ms, lr: 2.0720316e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:58,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43623 samples/s/p 3:41:22 } 
+2024-07-25 21:29:01,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 726/ 1625], loss: 1.059, per_step_time: 1471ms, lr: 2.0714504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:01,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43748 samples/s/p 3:41:16 } +2024-07-25 21:29:04,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 728/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 2.070869e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:04,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43113 samples/s/p 3:41:29 } +2024-07-25 21:29:07,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 730/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.0702877e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:07,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43176 samples/s/p 3:41:24 } +2024-07-25 21:29:10,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 732/ 1625], loss: 1.021, per_step_time: 1471ms, lr: 2.0697064e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:10,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43626 samples/s/p 3:41:10 } +2024-07-25 21:29:13,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 734/ 1625], loss: 1.251, per_step_time: 1470ms, lr: 2.0691246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:13,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43948 samples/s/p 3:41:00 } +2024-07-25 21:29:16,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 736/ 1625], 
loss: 1.297, per_step_time: 1473ms, lr: 2.0685427e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:16,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.42862 samples/s/p 3:41:23 } +2024-07-25 21:29:19,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 738/ 1625], loss: 1.010, per_step_time: 1471ms, lr: 2.067961e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:19,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43671 samples/s/p 3:41:00 } +2024-07-25 21:29:22,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 740/ 1625], loss: 0.985, per_step_time: 1471ms, lr: 2.0673793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:22,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43799 samples/s/p 3:40:54 } +2024-07-25 21:29:25,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 742/ 1625], loss: 1.292, per_step_time: 1473ms, lr: 2.066797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:25,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43087 samples/s/p 3:41:09 } +2024-07-25 21:29:28,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 744/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.0662152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:28,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43404 samples/s/p 3:40:58 } +2024-07-25 21:29:31,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 746/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.0656329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:31,461 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43718 samples/s/p 3:40:48 } +2024-07-25 21:29:34,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 748/ 1625], loss: 1.234, per_step_time: 1473ms, lr: 2.0650506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:34,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43062 samples/s/p 3:41:01 } +2024-07-25 21:29:37,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 750/ 1625], loss: 1.084, per_step_time: 1470ms, lr: 2.0644682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:37,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43949 samples/s/p 3:40:36 } +2024-07-25 21:29:40,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 752/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.0638858e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:40,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43254 samples/s/p 3:40:50 } +2024-07-25 21:29:43,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 754/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.0633033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:43,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43140 samples/s/p 3:40:50 } +2024-07-25 21:29:46,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 756/ 1625], loss: 1.096, per_step_time: 1470ms, lr: 2.0627205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:46,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43877 samples/s/p 3:40:29 } 
+2024-07-25 21:29:49,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 758/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 2.0621379e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:49,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43653 samples/s/p 3:40:31 } +2024-07-25 21:29:52,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 760/ 1625], loss: 1.150, per_step_time: 1469ms, lr: 2.061555e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:52,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.44306 samples/s/p 3:40:13 } +2024-07-25 21:29:55,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 762/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 2.0609721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:55,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43699 samples/s/p 3:40:24 } +2024-07-25 21:29:58,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 764/ 1625], loss: 1.228, per_step_time: 1470ms, lr: 2.060389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:58,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43976 samples/s/p 3:40:15 } +2024-07-25 21:30:00,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 766/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 2.0598058e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:00,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43507 samples/s/p 3:40:23 } +2024-07-25 21:30:03,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 768/ 1625], 
loss: 1.248, per_step_time: 1470ms, lr: 2.0592226e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:03,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.44010 samples/s/p 3:40:08 } +2024-07-25 21:30:06,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 770/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 2.0586393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:06,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.44176 samples/s/p 3:40:01 } +2024-07-25 21:30:09,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 772/ 1625], loss: 1.294, per_step_time: 1473ms, lr: 2.0580559e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:09,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43029 samples/s/p 3:40:26 } +2024-07-25 21:30:12,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 774/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 2.0574724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:12,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43150 samples/s/p 3:40:20 } +2024-07-25 21:30:15,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 776/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 2.056889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:15,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43115 samples/s/p 3:40:18 } +2024-07-25 21:30:18,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 778/ 1625], loss: 1.016, per_step_time: 1471ms, lr: 2.0563051e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:18,668 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43574 samples/s/p 3:40:04 } +2024-07-25 21:30:21,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 780/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.0557212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:21,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43731 samples/s/p 3:39:57 } +2024-07-25 21:30:24,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 782/ 1625], loss: 1.120, per_step_time: 1470ms, lr: 2.0551375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:24,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.44142 samples/s/p 3:39:44 } +2024-07-25 21:30:27,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 784/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.0545536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:27,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43459 samples/s/p 3:39:58 } +2024-07-25 21:30:30,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 786/ 1625], loss: 0.979, per_step_time: 1470ms, lr: 2.0539694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:30,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.44064 samples/s/p 3:39:40 } +2024-07-25 21:30:33,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 788/ 1625], loss: 1.204, per_step_time: 1470ms, lr: 2.0533853e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:33,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.44113 samples/s/p 3:39:36 } 
+2024-07-25 21:30:36,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 790/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 2.052801e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:36,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43806 samples/s/p 3:39:41 } +2024-07-25 21:30:39,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 792/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 2.0522168e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:39,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43761 samples/s/p 3:39:39 } +2024-07-25 21:30:42,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 794/ 1625], loss: 1.101, per_step_time: 1473ms, lr: 2.0516321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:42,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.42933 samples/s/p 3:39:56 } +2024-07-25 21:30:45,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 796/ 1625], loss: 1.198, per_step_time: 1470ms, lr: 2.0510477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:45,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43923 samples/s/p 3:39:29 } +2024-07-25 21:30:48,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 798/ 1625], loss: 1.084, per_step_time: 1472ms, lr: 2.0504633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:48,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43429 samples/s/p 3:39:38 } +2024-07-25 21:30:51,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 800/ 1625], 
loss: 1.069, per_step_time: 1471ms, lr: 2.0498783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:51,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43844 samples/s/p 3:39:25 } +2024-07-25 21:30:54,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 802/ 1625], loss: 1.080, per_step_time: 1473ms, lr: 2.0492935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:54,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43060 samples/s/p 3:39:41 } +2024-07-25 21:30:57,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 804/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 2.0487088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:57,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43293 samples/s/p 3:39:32 } +2024-07-25 21:30:59,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 806/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 2.0481237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:59,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43817 samples/s/p 3:39:17 } +2024-07-25 21:31:02,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 808/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 2.0475385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:02,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43438 samples/s/p 3:39:23 } +2024-07-25 21:31:05,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 810/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 2.0469535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:05,875 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.42994 samples/s/p 3:39:31 } +2024-07-25 21:31:08,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 812/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.0463682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:08,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43195 samples/s/p 3:39:23 } +2024-07-25 21:31:11,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 814/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.0457828e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:11,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43565 samples/s/p 3:39:11 } +2024-07-25 21:31:14,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 816/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 2.0451973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:14,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43373 samples/s/p 3:39:13 } +2024-07-25 21:31:17,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 818/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 2.044612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:17,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43273 samples/s/p 3:39:12 } +2024-07-25 21:31:20,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 820/ 1625], loss: 1.078, per_step_time: 1470ms, lr: 2.0440262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:20,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43866 samples/s/p 3:38:55 } 
+2024-07-25 21:31:23,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 822/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.0434405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:23,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43225 samples/s/p 3:39:08 } +2024-07-25 21:31:26,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 824/ 1625], loss: 1.036, per_step_time: 1476ms, lr: 2.0428546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:26,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.41909 samples/s/p 3:39:37 } +2024-07-25 21:31:29,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 826/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.0422689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:29,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43313 samples/s/p 3:39:00 } +2024-07-25 21:31:32,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 828/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.0416826e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:32,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43248 samples/s/p 3:38:58 } +2024-07-25 21:31:35,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 830/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 2.0410966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:35,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43628 samples/s/p 3:38:46 } +2024-07-25 21:31:38,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 832/ 1625], 
loss: 1.395, per_step_time: 1473ms, lr: 2.0405107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:38,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.42969 samples/s/p 3:38:59 } +2024-07-25 21:31:41,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 834/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 2.0399242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:41,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.44026 samples/s/p 3:38:31 } +2024-07-25 21:31:44,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 836/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 2.039338e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:44,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43601 samples/s/p 3:38:38 } +2024-07-25 21:31:47,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 838/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 2.0387515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:47,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.42921 samples/s/p 3:38:51 } +2024-07-25 21:31:50,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 840/ 1625], loss: 0.995, per_step_time: 1473ms, lr: 2.0381647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:50,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.43049 samples/s/p 3:38:45 } +2024-07-25 21:31:53,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 842/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 2.037578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:53,104 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.44139 samples/s/p 3:38:16 } +2024-07-25 21:31:56,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 844/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 2.0369915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:56,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.43445 samples/s/p 3:38:30 } +2024-07-25 21:31:59,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 846/ 1625], loss: 1.166, per_step_time: 1470ms, lr: 2.0364047e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:59,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.44173 samples/s/p 3:38:09 } +2024-07-25 21:32:01,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 848/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 2.035818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:01,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.43316 samples/s/p 3:38:27 } +2024-07-25 21:32:04,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 850/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.0352309e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:04,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.43472 samples/s/p 3:38:20 } +2024-07-25 21:32:07,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 852/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.0346435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:07,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.43434 samples/s/p 3:38:18 } 
+2024-07-25 21:32:10,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 854/ 1625], loss: 0.939, per_step_time: 1472ms, lr: 2.0340565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:10,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43401 samples/s/p 3:38:16 } +2024-07-25 21:32:13,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 856/ 1625], loss: 1.208, per_step_time: 1470ms, lr: 2.0334694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:13,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43966 samples/s/p 3:38:00 } +2024-07-25 21:32:16,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 858/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 2.032882e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:16,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43809 samples/s/p 3:38:01 } +2024-07-25 21:32:19,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 860/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 2.0322945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:19,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43343 samples/s/p 3:38:09 } +2024-07-25 21:32:22,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 862/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 2.031707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:22,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43365 samples/s/p 3:38:05 } +2024-07-25 21:32:25,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 864/ 1625], 
loss: 1.254, per_step_time: 1471ms, lr: 2.0311192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:25,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43668 samples/s/p 3:37:55 } +2024-07-25 21:32:28,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 866/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 2.0305315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:28,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43254 samples/s/p 3:38:02 } +2024-07-25 21:32:31,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 868/ 1625], loss: 1.173, per_step_time: 1473ms, lr: 2.0299438e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:31,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43048 samples/s/p 3:38:04 } +2024-07-25 21:32:34,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 870/ 1625], loss: 1.496, per_step_time: 1473ms, lr: 2.0293563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:34,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43082 samples/s/p 3:38:00 } +2024-07-25 21:32:37,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 872/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 2.0287682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:37,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43875 samples/s/p 3:37:38 } +2024-07-25 21:32:40,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 874/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.0281801e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:40,322 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.42865 samples/s/p 3:38:00 } +2024-07-25 21:32:43,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 876/ 1625], loss: 1.132, per_step_time: 1469ms, lr: 2.0275918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:43,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.44448 samples/s/p 3:37:19 } +2024-07-25 21:32:46,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 878/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.0270036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:46,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43447 samples/s/p 3:37:40 } +2024-07-25 21:32:49,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 880/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 2.0264153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:49,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43801 samples/s/p 3:37:28 } +2024-07-25 21:32:52,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 882/ 1625], loss: 1.227, per_step_time: 1470ms, lr: 2.0258269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:52,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.44117 samples/s/p 3:37:18 } +2024-07-25 21:32:55,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 884/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 2.0252384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:55,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43782 samples/s/p 3:37:23 } 
+2024-07-25 21:32:58,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 886/ 1625], loss: 1.130, per_step_time: 1474ms, lr: 2.0246498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:58,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.42611 samples/s/p 3:37:48 } +2024-07-25 21:33:00,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 888/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 2.0240614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:00,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43385 samples/s/p 3:37:27 } +2024-07-25 21:33:03,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 890/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.0234722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:03,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43113 samples/s/p 3:37:30 } +2024-07-25 21:33:06,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 892/ 1625], loss: 1.001, per_step_time: 1471ms, lr: 2.0228836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:06,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43520 samples/s/p 3:37:17 } +2024-07-25 21:33:09,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 894/ 1625], loss: 1.260, per_step_time: 1470ms, lr: 2.0222948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:09,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43880 samples/s/p 3:37:06 } +2024-07-25 21:33:12,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 896/ 1625], 
loss: 1.188, per_step_time: 1471ms, lr: 2.0217056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:12,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43513 samples/s/p 3:37:12 } +2024-07-25 21:33:15,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 898/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 2.0211166e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:15,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43813 samples/s/p 3:37:02 } +2024-07-25 21:33:18,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 900/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 2.0205272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:18,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43705 samples/s/p 3:37:01 } +2024-07-25 21:33:21,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 902/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 2.019938e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:21,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43519 samples/s/p 3:37:03 } +2024-07-25 21:33:24,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 904/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 2.0193487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:24,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43554 samples/s/p 3:36:59 } +2024-07-25 21:33:27,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 906/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 2.0187592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:27,527 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43434 samples/s/p 3:36:59 } +2024-07-25 21:33:30,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 908/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 2.0181697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:30,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.42743 samples/s/p 3:37:13 } +2024-07-25 21:33:33,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 910/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 2.0175801e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:33,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43619 samples/s/p 3:36:49 } +2024-07-25 21:33:36,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 912/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 2.0169902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:36,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43682 samples/s/p 3:36:44 } +2024-07-25 21:33:39,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 914/ 1625], loss: 1.225, per_step_time: 1470ms, lr: 2.0164005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:39,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43918 samples/s/p 3:36:36 } +2024-07-25 21:33:42,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 916/ 1625], loss: 1.342, per_step_time: 1472ms, lr: 2.0158106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:42,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43384 samples/s/p 3:36:45 } 
+2024-07-25 21:33:45,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 918/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.0152207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:45,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43392 samples/s/p 3:36:42 } +2024-07-25 21:33:48,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 920/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 2.0146306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:48,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43774 samples/s/p 3:36:30 } +2024-07-25 21:33:51,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 922/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.0140405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:51,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43483 samples/s/p 3:36:34 } +2024-07-25 21:33:54,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 924/ 1625], loss: 1.096, per_step_time: 1473ms, lr: 2.0134501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:54,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43031 samples/s/p 3:36:42 } +2024-07-25 21:33:57,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 926/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.0128598e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:57,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43175 samples/s/p 3:36:36 } +2024-07-25 21:33:59,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 928/ 1625], 
loss: 1.233, per_step_time: 1472ms, lr: 2.0122696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:59,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43353 samples/s/p 3:36:28 } +2024-07-25 21:34:02,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 930/ 1625], loss: 1.146, per_step_time: 1474ms, lr: 2.011679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:02,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.42459 samples/s/p 3:36:47 } +2024-07-25 21:34:05,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 932/ 1625], loss: 1.030, per_step_time: 1470ms, lr: 2.0110887e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:05,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43851 samples/s/p 3:36:11 } +2024-07-25 21:34:08,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 934/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.0104979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:08,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43393 samples/s/p 3:36:19 } +2024-07-25 21:34:11,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 936/ 1625], loss: 1.020, per_step_time: 1472ms, lr: 2.009907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:11,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43445 samples/s/p 3:36:15 } +2024-07-25 21:34:14,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 938/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.0093163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:14,752 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43534 samples/s/p 3:36:09 } +2024-07-25 21:34:17,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 940/ 1625], loss: 1.311, per_step_time: 1471ms, lr: 2.0087255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:17,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43742 samples/s/p 3:36:02 } +2024-07-25 21:34:20,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 942/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 2.0081343e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:20,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43347 samples/s/p 3:36:08 } +2024-07-25 21:34:23,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 944/ 1625], loss: 1.009, per_step_time: 1471ms, lr: 2.0075433e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:23,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43518 samples/s/p 3:36:01 } +2024-07-25 21:34:26,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 946/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 2.0069521e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:26,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43545 samples/s/p 3:35:57 } +2024-07-25 21:34:29,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 948/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 2.0063608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:29,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43313 samples/s/p 3:36:00 } 
+2024-07-25 21:34:32,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 950/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.0057694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:32,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43464 samples/s/p 3:35:53 } +2024-07-25 21:34:35,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 952/ 1625], loss: 1.193, per_step_time: 1473ms, lr: 2.005178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:35,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43057 samples/s/p 3:36:00 } +2024-07-25 21:34:38,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 954/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.0045867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:38,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43471 samples/s/p 3:35:47 } +2024-07-25 21:34:41,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 956/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 2.003995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:41,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43004 samples/s/p 3:35:56 } +2024-07-25 21:34:44,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 958/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 2.0034033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:44,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43517 samples/s/p 3:35:40 } +2024-07-25 21:34:47,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 960/ 1625], 
loss: 1.185, per_step_time: 1469ms, lr: 2.0028117e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:47,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.44296 samples/s/p 3:35:19 } +2024-07-25 21:34:50,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 962/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 2.0022198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:50,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43763 samples/s/p 3:35:29 } +2024-07-25 21:34:53,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 964/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 2.0016278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:53,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43511 samples/s/p 3:35:32 } +2024-07-25 21:34:56,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 966/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.0010359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:56,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43179 samples/s/p 3:35:37 } +2024-07-25 21:34:59,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 968/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.0004436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:59,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.43649 samples/s/p 3:35:23 } +2024-07-25 21:35:01,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 970/ 1625], loss: 1.516, per_step_time: 1473ms, lr: 1.9998517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:01,968 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.43094 samples/s/p 3:35:33 } +2024-07-25 21:35:04,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 972/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 1.9992593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:04,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.43249 samples/s/p 3:35:26 } +2024-07-25 21:35:07,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 974/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 1.998667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:07,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.43168 samples/s/p 3:35:25 } +2024-07-25 21:35:10,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 976/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 1.9980747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:10,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.43590 samples/s/p 3:35:12 } +2024-07-25 21:35:13,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 978/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 1.997482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:13,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.43620 samples/s/p 3:35:09 } +2024-07-25 21:35:16,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 980/ 1625], loss: 1.328, per_step_time: 1473ms, lr: 1.9968895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:16,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.42958 samples/s/p 3:35:21 } 
+2024-07-25 21:35:19,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 982/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 1.9962969e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:19,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.43626 samples/s/p 3:35:02 } +2024-07-25 21:35:22,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 984/ 1625], loss: 1.296, per_step_time: 1472ms, lr: 1.9957042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:22,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43318 samples/s/p 3:35:07 } +2024-07-25 21:35:25,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 986/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 1.995111e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:25,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.42873 samples/s/p 3:35:14 } +2024-07-25 21:35:28,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 988/ 1625], loss: 1.168, per_step_time: 1475ms, lr: 1.9945184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:28,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.42229 samples/s/p 3:35:27 } +2024-07-25 21:35:31,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 990/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 1.9939254e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:31,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.42753 samples/s/p 3:35:11 } +2024-07-25 21:35:34,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 992/ 
1625], loss: 1.309, per_step_time: 1472ms, lr: 1.9933323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:34,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43214 samples/s/p 3:34:58 } +2024-07-25 21:35:37,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 994/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.992739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:37,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43327 samples/s/p 3:34:52 } +2024-07-25 21:35:40,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 996/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 1.992146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:40,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43945 samples/s/p 3:34:34 } +2024-07-25 21:35:43,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 998/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.9915527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:43,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43659 samples/s/p 3:34:38 } +2024-07-25 21:35:46,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1000/ 1625], loss: 1.265, per_step_time: 1470ms, lr: 1.9909592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:46,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.44161 samples/s/p 3:34:23 } +2024-07-25 21:35:49,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1002/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 1.9903657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:49,195 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.44092 samples/s/p 3:34:22 } +2024-07-25 21:35:52,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1004/ 1625], loss: 1.021, per_step_time: 1472ms, lr: 1.9897721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:52,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43429 samples/s/p 3:34:35 } +2024-07-25 21:35:55,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1006/ 1625], loss: 1.312, per_step_time: 1470ms, lr: 1.9891784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:55,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.44044 samples/s/p 3:34:17 } +2024-07-25 21:35:58,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1008/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.9885845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:58,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43359 samples/s/p 3:34:31 } +2024-07-25 21:36:00,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1010/ 1625], loss: 1.281, per_step_time: 1470ms, lr: 1.987991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:00,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43864 samples/s/p 3:34:16 } +2024-07-25 21:36:03,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1012/ 1625], loss: 1.063, per_step_time: 1472ms, lr: 1.987397e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:03,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43351 samples/s/p 
3:34:25 } +2024-07-25 21:36:06,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1014/ 1625], loss: 1.076, per_step_time: 1472ms, lr: 1.9868032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:06,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43210 samples/s/p 3:34:25 } +2024-07-25 21:36:09,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1016/ 1625], loss: 1.047, per_step_time: 1473ms, lr: 1.986209e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:09,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.42791 samples/s/p 3:34:32 } +2024-07-25 21:36:12,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1018/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 1.9856148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:12,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43319 samples/s/p 3:34:17 } +2024-07-25 21:36:15,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1020/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 1.9850208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:15,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43252 samples/s/p 3:34:15 } +2024-07-25 21:36:18,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1022/ 1625], loss: 1.033, per_step_time: 1473ms, lr: 1.9844263e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:18,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.42955 samples/s/p 3:34:20 } +2024-07-25 21:36:21,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], 
step:[ 1024/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 1.9838319e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:21,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43246 samples/s/p 3:34:10 } +2024-07-25 21:36:24,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1026/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 1.9832376e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:24,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43653 samples/s/p 3:33:57 } +2024-07-25 21:36:27,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1028/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.982643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:27,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43177 samples/s/p 3:34:05 } +2024-07-25 21:36:30,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1030/ 1625], loss: 1.205, per_step_time: 1473ms, lr: 1.9820483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:30,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43057 samples/s/p 3:34:05 } +2024-07-25 21:36:33,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1032/ 1625], loss: 1.327, per_step_time: 1472ms, lr: 1.9814537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:33,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43274 samples/s/p 3:33:57 } +2024-07-25 21:36:36,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1034/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.980859e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:36:36,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43751 samples/s/p 3:33:43 } +2024-07-25 21:36:39,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1036/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 1.9802641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:39,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43320 samples/s/p 3:33:50 } +2024-07-25 21:36:42,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1038/ 1625], loss: 1.288, per_step_time: 1470ms, lr: 1.9796691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:42,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43934 samples/s/p 3:33:33 } +2024-07-25 21:36:45,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1040/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 1.9790741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:45,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43219 samples/s/p 3:33:47 } +2024-07-25 21:36:48,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1042/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 1.978479e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:48,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43755 samples/s/p 3:33:31 } +2024-07-25 21:36:51,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1044/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 1.977884e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:51,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ 
| 5.43939 samples/s/p 3:33:24 } +2024-07-25 21:36:54,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1046/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 1.9772886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:54,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43343 samples/s/p 3:33:35 } +2024-07-25 21:36:57,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1048/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 1.9766934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:57,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43850 samples/s/p 3:33:20 } +2024-07-25 21:37:00,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1050/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 1.9760979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:00,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43669 samples/s/p 3:33:21 } +2024-07-25 21:37:02,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1052/ 1625], loss: 1.098, per_step_time: 1473ms, lr: 1.9755025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:02,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43007 samples/s/p 3:33:34 } +2024-07-25 21:37:05,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1054/ 1625], loss: 1.008, per_step_time: 1471ms, lr: 1.974907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:05,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43508 samples/s/p 3:33:19 } +2024-07-25 21:37:08,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 5/ 10], step:[ 1056/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.9743113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:08,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43288 samples/s/p 3:33:22 } +2024-07-25 21:37:11,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1058/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.9737156e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:11,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43246 samples/s/p 3:33:20 } +2024-07-25 21:37:14,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1060/ 1625], loss: 1.250, per_step_time: 1481ms, lr: 1.9731197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:14,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.40137 samples/s/p 3:34:30 } +2024-07-25 21:37:17,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1062/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 1.972524e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:17,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43348 samples/s/p 3:33:11 } +2024-07-25 21:37:20,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1064/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 1.9719278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:20,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.42884 samples/s/p 3:33:19 } +2024-07-25 21:37:23,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1066/ 1625], loss: 1.407, per_step_time: 1471ms, lr: 1.971332e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:37:23,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43624 samples/s/p 3:32:59 } +2024-07-25 21:37:26,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1068/ 1625], loss: 0.973, per_step_time: 1472ms, lr: 1.9707357e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:26,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43392 samples/s/p 3:33:01 } +2024-07-25 21:37:29,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1070/ 1625], loss: 1.111, per_step_time: 1473ms, lr: 1.9701396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:29,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.42763 samples/s/p 3:33:13 } +2024-07-25 21:37:32,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1072/ 1625], loss: 1.250, per_step_time: 1470ms, lr: 1.9695433e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:32,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43959 samples/s/p 3:32:42 } +2024-07-25 21:37:35,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1074/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 1.968947e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:35,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43696 samples/s/p 3:32:45 } +2024-07-25 21:37:38,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1076/ 1625], loss: 1.285, per_step_time: 1471ms, lr: 1.9683506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:38,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% 
|███████████████████████ | 5.43540 samples/s/p 3:32:46 } +2024-07-25 21:37:41,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1078/ 1625], loss: 1.221, per_step_time: 1473ms, lr: 1.967754e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:41,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43082 samples/s/p 3:32:54 } +2024-07-25 21:37:44,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1080/ 1625], loss: 1.211, per_step_time: 1470ms, lr: 1.9671574e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:44,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43852 samples/s/p 3:32:33 } +2024-07-25 21:37:47,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1082/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.966561e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:47,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43775 samples/s/p 3:32:32 } +2024-07-25 21:37:50,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1084/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 1.9659641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:50,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43298 samples/s/p 3:32:40 } +2024-07-25 21:37:53,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1086/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 1.9653671e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:53,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43537 samples/s/p 3:32:32 } +2024-07-25 21:37:56,118 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1088/ 1625], loss: 0.941, per_step_time: 1472ms, lr: 1.9647705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:56,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43317 samples/s/p 3:32:34 } +2024-07-25 21:37:59,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1090/ 1625], loss: 1.373, per_step_time: 1472ms, lr: 1.9641735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:59,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43282 samples/s/p 3:32:32 } +2024-07-25 21:38:02,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1092/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 1.9635765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:02,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.44000 samples/s/p 3:32:12 } +2024-07-25 21:38:04,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1094/ 1625], loss: 0.972, per_step_time: 1471ms, lr: 1.9629793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:04,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43788 samples/s/p 3:32:14 } +2024-07-25 21:38:07,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1096/ 1625], loss: 1.315, per_step_time: 1471ms, lr: 1.9623822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:07,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43499 samples/s/p 3:32:18 } +2024-07-25 21:38:10,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1098/ 1625], loss: 1.292, 
per_step_time: 1472ms, lr: 1.961785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:10,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43405 samples/s/p 3:32:17 } +2024-07-25 21:38:13,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1100/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 1.9611876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:13,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43001 samples/s/p 3:32:23 } +2024-07-25 21:38:16,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1102/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 1.9605903e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:16,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43440 samples/s/p 3:32:10 } +2024-07-25 21:38:19,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1104/ 1625], loss: 0.958, per_step_time: 1470ms, lr: 1.9599927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:19,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43894 samples/s/p 3:31:57 } +2024-07-25 21:38:22,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1106/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 1.9593952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:22,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43217 samples/s/p 3:32:10 } +2024-07-25 21:38:25,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1108/ 1625], loss: 1.193, per_step_time: 1469ms, lr: 1.9587973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:25,624 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.44399 samples/s/p 3:31:39 } +2024-07-25 21:38:28,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1110/ 1625], loss: 0.976, per_step_time: 1471ms, lr: 1.9581998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:28,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43537 samples/s/p 3:31:56 } +2024-07-25 21:38:31,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1112/ 1625], loss: 1.302, per_step_time: 1473ms, lr: 1.9576019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:31,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43065 samples/s/p 3:32:04 } +2024-07-25 21:38:34,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1114/ 1625], loss: 1.304, per_step_time: 1473ms, lr: 1.957004e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:34,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.42803 samples/s/p 3:32:07 } +2024-07-25 21:38:37,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1116/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.956406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:37,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43636 samples/s/p 3:31:45 } +2024-07-25 21:38:40,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1118/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 1.955808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:40,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43606 samples/s/p 
3:31:43 } +2024-07-25 21:38:43,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1120/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 1.95521e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:43,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.42991 samples/s/p 3:31:54 } +2024-07-25 21:38:46,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1122/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 1.954612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:46,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43621 samples/s/p 3:31:37 } +2024-07-25 21:38:49,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1124/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 1.9540135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:49,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43216 samples/s/p 3:31:43 } +2024-07-25 21:38:52,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1126/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 1.9534153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:52,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.42899 samples/s/p 3:31:48 } +2024-07-25 21:38:55,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1128/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 1.9528168e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:55,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43101 samples/s/p 3:31:40 } +2024-07-25 21:38:58,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], 
step:[ 1130/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 1.9522184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:58,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43976 samples/s/p 3:31:17 } +2024-07-25 21:39:01,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1132/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 1.95162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:01,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43481 samples/s/p 3:31:25 } +2024-07-25 21:39:03,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1134/ 1625], loss: 1.303, per_step_time: 1470ms, lr: 1.9510213e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:03,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43889 samples/s/p 3:31:13 } +2024-07-25 21:39:06,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1136/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 1.9504225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:06,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43604 samples/s/p 3:31:16 } +2024-07-25 21:39:09,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1138/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.9498239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:09,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43516 samples/s/p 3:31:15 } +2024-07-25 21:39:12,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1140/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 1.949225e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:39:12,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43667 samples/s/p 3:31:09 } +2024-07-25 21:39:15,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1142/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 1.948626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:15,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43656 samples/s/p 3:31:06 } +2024-07-25 21:39:18,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1144/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 1.948027e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:18,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43231 samples/s/p 3:31:13 } +2024-07-25 21:39:21,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1146/ 1625], loss: 1.294, per_step_time: 1471ms, lr: 1.947428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:21,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43669 samples/s/p 3:31:00 } +2024-07-25 21:39:24,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1148/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 1.9468289e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:24,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.42943 samples/s/p 3:31:14 } +2024-07-25 21:39:27,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1150/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 1.9462297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:27,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ 
| 5.43418 samples/s/p 3:31:00 } +2024-07-25 21:39:30,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1152/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.9456304e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:30,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43559 samples/s/p 3:30:54 } +2024-07-25 21:39:33,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1154/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 1.9450312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:33,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43727 samples/s/p 3:30:47 } +2024-07-25 21:39:36,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1156/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 1.9444315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:36,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43541 samples/s/p 3:30:48 } +2024-07-25 21:39:39,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1158/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.9438321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:39,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43786 samples/s/p 3:30:40 } +2024-07-25 21:39:42,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1160/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 1.9432326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:42,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43984 samples/s/p 3:30:32 } +2024-07-25 21:39:45,299 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 5/ 10], step:[ 1162/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 1.942633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:45,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.44143 samples/s/p 3:30:26 } +2024-07-25 21:39:48,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1164/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 1.942033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:48,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43117 samples/s/p 3:30:46 } +2024-07-25 21:39:51,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1166/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.9414336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:51,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43710 samples/s/p 3:30:30 } +2024-07-25 21:39:54,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1168/ 1625], loss: 1.320, per_step_time: 1470ms, lr: 1.9408335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:54,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43935 samples/s/p 3:30:22 } +2024-07-25 21:39:57,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1170/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.9402336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:57,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43453 samples/s/p 3:30:30 } +2024-07-25 21:40:00,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1172/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 1.9396337e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:40:00,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43011 samples/s/p 3:30:37 } +2024-07-25 21:40:03,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1174/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 1.9390336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:03,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43055 samples/s/p 3:30:33 } +2024-07-25 21:40:05,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1176/ 1625], loss: 1.285, per_step_time: 1471ms, lr: 1.9384335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:05,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43682 samples/s/p 3:30:16 } +2024-07-25 21:40:08,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1178/ 1625], loss: 1.039, per_step_time: 1474ms, lr: 1.9378333e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:08,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.42586 samples/s/p 3:30:38 } +2024-07-25 21:40:11,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1180/ 1625], loss: 1.450, per_step_time: 1471ms, lr: 1.9372328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:11,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43501 samples/s/p 3:30:14 } +2024-07-25 21:40:14,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1182/ 1625], loss: 1.337, per_step_time: 1471ms, lr: 1.9366327e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:14,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% 
|███████████████████████ | 5.43842 samples/s/p 3:30:03 } +2024-07-25 21:40:17,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1184/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 1.9360323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:17,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43473 samples/s/p 3:30:09 } +2024-07-25 21:40:20,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1186/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 1.9354316e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:20,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43756 samples/s/p 3:29:59 } +2024-07-25 21:40:23,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1188/ 1625], loss: 1.164, per_step_time: 1469ms, lr: 1.934831e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:23,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.44564 samples/s/p 3:29:38 } +2024-07-25 21:40:26,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1190/ 1625], loss: 1.341, per_step_time: 1472ms, lr: 1.9342304e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:26,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43422 samples/s/p 3:30:01 } +2024-07-25 21:40:29,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1192/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.9336298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:29,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43721 samples/s/p 3:29:51 } +2024-07-25 21:40:32,513 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1194/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 1.933029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:32,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43292 samples/s/p 3:29:58 } +2024-07-25 21:40:35,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1196/ 1625], loss: 1.097, per_step_time: 1473ms, lr: 1.9324281e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:35,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43105 samples/s/p 3:30:00 } +2024-07-25 21:40:38,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1198/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 1.9318273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:38,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43272 samples/s/p 3:29:53 } +2024-07-25 21:40:41,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1200/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 1.9312261e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:41,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43286 samples/s/p 3:29:50 } +2024-07-25 21:40:44,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1202/ 1625], loss: 1.060, per_step_time: 1470ms, lr: 1.930625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:44,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.44036 samples/s/p 3:29:29 } +2024-07-25 21:40:47,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1204/ 1625], loss: 1.120, 
per_step_time: 1473ms, lr: 1.930024e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:47,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.42913 samples/s/p 3:29:52 } +2024-07-25 21:40:50,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1206/ 1625], loss: 1.134, per_step_time: 1470ms, lr: 1.9294228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:50,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.44207 samples/s/p 3:29:19 } +2024-07-25 21:40:53,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1208/ 1625], loss: 0.975, per_step_time: 1469ms, lr: 1.9288214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:53,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.44301 samples/s/p 3:29:14 } +2024-07-25 21:40:56,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1210/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 1.92822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:56,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43478 samples/s/p 3:29:30 } +2024-07-25 21:40:59,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1212/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 1.9276187e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:59,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.44153 samples/s/p 3:29:12 } +2024-07-25 21:41:02,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1214/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 1.9270172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:02,017 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43366 samples/s/p 3:29:27 } +2024-07-25 21:41:04,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1216/ 1625], loss: 1.033, per_step_time: 1472ms, lr: 1.9264156e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:04,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43410 samples/s/p 3:29:23 } +2024-07-25 21:41:07,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1218/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 1.925814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:07,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43495 samples/s/p 3:29:18 } +2024-07-25 21:41:10,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1220/ 1625], loss: 1.007, per_step_time: 1473ms, lr: 1.9252126e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:10,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.42899 samples/s/p 3:29:29 } +2024-07-25 21:41:13,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1222/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.9246108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:13,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43599 samples/s/p 3:29:10 } +2024-07-25 21:41:16,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1224/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.9240086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:16,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43840 samples/s/p 
3:29:01 } +2024-07-25 21:41:19,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1226/ 1625], loss: 1.275, per_step_time: 1469ms, lr: 1.9234069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:19,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.44264 samples/s/p 3:28:49 } +2024-07-25 21:41:22,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1228/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 1.922805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:22,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43488 samples/s/p 3:29:04 } +2024-07-25 21:41:25,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1230/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 1.9222029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:25,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.44082 samples/s/p 3:28:47 } +2024-07-25 21:41:28,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1232/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.9216008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:28,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43819 samples/s/p 3:28:50 } +2024-07-25 21:41:31,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1234/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 1.9209985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:31,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43524 samples/s/p 3:28:54 } +2024-07-25 21:41:34,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], 
step:[ 1236/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 1.9203962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:34,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43641 samples/s/p 3:28:48 } +2024-07-25 21:41:37,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1238/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.919794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:37,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43761 samples/s/p 3:28:43 } +2024-07-25 21:41:40,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1240/ 1625], loss: 1.318, per_step_time: 1472ms, lr: 1.9191915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:40,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43404 samples/s/p 3:28:48 } +2024-07-25 21:41:43,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1242/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 1.918589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:43,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43401 samples/s/p 3:28:45 } +2024-07-25 21:41:46,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1244/ 1625], loss: 1.031, per_step_time: 1470ms, lr: 1.9179866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:46,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.44141 samples/s/p 3:28:25 } +2024-07-25 21:41:49,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1246/ 1625], loss: 1.304, per_step_time: 1472ms, lr: 1.917384e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:41:49,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43418 samples/s/p 3:28:39 } +2024-07-25 21:41:52,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1248/ 1625], loss: 1.049, per_step_time: 1472ms, lr: 1.9167815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:52,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43221 samples/s/p 3:28:40 } +2024-07-25 21:41:55,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1250/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 1.9161786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:55,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43905 samples/s/p 3:28:22 } +2024-07-25 21:41:58,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1252/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 1.915576e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:58,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43080 samples/s/p 3:28:38 } +2024-07-25 21:42:01,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1254/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 1.914973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:01,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43727 samples/s/p 3:28:20 } +2024-07-25 21:42:03,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1256/ 1625], loss: 1.296, per_step_time: 1473ms, lr: 1.9143701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:03,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ 
| 5.43066 samples/s/p 3:28:32 } +2024-07-25 21:42:06,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1258/ 1625], loss: 0.967, per_step_time: 1471ms, lr: 1.913767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:06,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43720 samples/s/p 3:28:14 } +2024-07-25 21:42:09,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1260/ 1625], loss: 1.028, per_step_time: 1470ms, lr: 1.9131641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:09,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.44203 samples/s/p 3:28:00 } +2024-07-25 21:42:12,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1262/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 1.9125608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:12,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43979 samples/s/p 3:28:02 } +2024-07-25 21:42:15,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1264/ 1625], loss: 1.270, per_step_time: 1473ms, lr: 1.9119578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:15,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.42923 samples/s/p 3:28:24 } +2024-07-25 21:42:18,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1266/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 1.9113546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:18,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43540 samples/s/p 3:28:07 } +2024-07-25 21:42:21,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 5/ 10], step:[ 1268/ 1625], loss: 0.899, per_step_time: 1470ms, lr: 1.910751e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:21,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43981 samples/s/p 3:27:53 } +2024-07-25 21:42:24,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1270/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 1.9101477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:24,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43514 samples/s/p 3:28:01 } +2024-07-25 21:42:27,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1272/ 1625], loss: 1.277, per_step_time: 1471ms, lr: 1.9095443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:27,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43623 samples/s/p 3:27:56 } +2024-07-25 21:42:30,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1274/ 1625], loss: 1.303, per_step_time: 1472ms, lr: 1.9089408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:30,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43409 samples/s/p 3:27:58 } +2024-07-25 21:42:33,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1276/ 1625], loss: 1.111, per_step_time: 1471ms, lr: 1.908337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:33,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.43672 samples/s/p 3:27:49 } +2024-07-25 21:42:36,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1278/ 1625], loss: 1.248, per_step_time: 1473ms, lr: 1.9077335e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:42:36,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.42897 samples/s/p 3:28:04 } +2024-07-25 21:42:39,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1280/ 1625], loss: 0.998, per_step_time: 1473ms, lr: 1.9071298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:39,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.42927 samples/s/p 3:28:00 } +2024-07-25 21:42:42,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1282/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.9065259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:42,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.43656 samples/s/p 3:27:40 } +2024-07-25 21:42:45,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1284/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 1.9059222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:45,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.43539 samples/s/p 3:27:40 } +2024-07-25 21:42:48,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1286/ 1625], loss: 1.057, per_step_time: 1470ms, lr: 1.9053183e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:48,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.44108 samples/s/p 3:27:24 } +2024-07-25 21:42:51,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1288/ 1625], loss: 0.966, per_step_time: 1471ms, lr: 1.9047144e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:51,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% 
|███████████████████████ | 5.43723 samples/s/p 3:27:30 } +2024-07-25 21:42:54,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1290/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.9041101e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:54,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.43789 samples/s/p 3:27:26 } +2024-07-25 21:42:57,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1292/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.9035058e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:57,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.43580 samples/s/p 3:27:27 } +2024-07-25 21:43:00,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1294/ 1625], loss: 1.284, per_step_time: 1474ms, lr: 1.902902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:00,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.42674 samples/s/p 3:27:45 } +2024-07-25 21:43:02,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1296/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 1.9022977e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:02,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.43981 samples/s/p 3:27:12 } +2024-07-25 21:43:05,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1298/ 1625], loss: 0.944, per_step_time: 1471ms, lr: 1.9016934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:05,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.43715 samples/s/p 3:27:15 } +2024-07-25 21:43:08,887 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1300/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.901089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:08,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.43373 samples/s/p 3:27:20 } +2024-07-25 21:43:11,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1302/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 1.9004845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:11,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.42912 samples/s/p 3:27:28 } +2024-07-25 21:43:14,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1304/ 1625], loss: 1.236, per_step_time: 1473ms, lr: 1.8998799e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:14,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.43072 samples/s/p 3:27:21 } +2024-07-25 21:43:17,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1306/ 1625], loss: 1.195, per_step_time: 1470ms, lr: 1.8992752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:17,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.44171 samples/s/p 3:26:53 } +2024-07-25 21:43:20,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1308/ 1625], loss: 1.009, per_step_time: 1472ms, lr: 1.8986706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:20,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.43178 samples/s/p 3:27:13 } +2024-07-25 21:43:23,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1310/ 1625], loss: 1.085, 
per_step_time: 1473ms, lr: 1.8980661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:23,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.42814 samples/s/p 3:27:18 } +2024-07-25 21:43:26,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1312/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 1.8974612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:26,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.43727 samples/s/p 3:26:55 } +2024-07-25 21:43:29,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1314/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 1.8968563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:29,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.43572 samples/s/p 3:26:55 } +2024-07-25 21:43:32,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1316/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 1.8962515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:32,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.42834 samples/s/p 3:27:09 } +2024-07-25 21:43:35,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1318/ 1625], loss: 1.258, per_step_time: 1471ms, lr: 1.8956465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:35,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.43625 samples/s/p 3:26:48 } +2024-07-25 21:43:38,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1320/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 1.8950414e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:38,406 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.43100 samples/s/p 3:26:57 } +2024-07-25 21:43:41,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1322/ 1625], loss: 1.007, per_step_time: 1472ms, lr: 1.8944364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:41,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.43256 samples/s/p 3:26:51 } +2024-07-25 21:43:44,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1324/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 1.8938314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:44,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.42893 samples/s/p 3:26:56 } +2024-07-25 21:43:47,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1326/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 1.8932262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:47,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.42925 samples/s/p 3:26:52 } +2024-07-25 21:43:50,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1328/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 1.8926208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:50,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.43190 samples/s/p 3:26:43 } +2024-07-25 21:43:53,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1330/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 1.8920155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:53,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.44125 
samples/s/p 3:26:19 } +2024-07-25 21:43:56,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1332/ 1625], loss: 1.164, per_step_time: 1474ms, lr: 1.8914103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:56,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.42681 samples/s/p 3:26:49 } +2024-07-25 21:43:59,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1334/ 1625], loss: 1.034, per_step_time: 1470ms, lr: 1.8908046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:59,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.44065 samples/s/p 3:26:14 } +2024-07-25 21:44:02,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1336/ 1625], loss: 0.987, per_step_time: 1470ms, lr: 1.890199e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:02,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.43897 samples/s/p 3:26:15 } +2024-07-25 21:44:04,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1338/ 1625], loss: 1.290, per_step_time: 1472ms, lr: 1.8895937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:04,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.43347 samples/s/p 3:26:25 } +2024-07-25 21:44:07,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1340/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.888988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:07,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.43112 samples/s/p 3:26:27 } +2024-07-25 21:44:10,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 5/ 10], step:[ 1342/ 1625], loss: 1.301, per_step_time: 1471ms, lr: 1.888382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:10,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43835 samples/s/p 3:26:08 } +2024-07-25 21:44:13,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1344/ 1625], loss: 1.011, per_step_time: 1472ms, lr: 1.8877763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:13,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43334 samples/s/p 3:26:16 } +2024-07-25 21:44:16,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1346/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 1.8871706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:16,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43304 samples/s/p 3:26:14 } +2024-07-25 21:44:19,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1348/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.8865647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:19,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43119 samples/s/p 3:26:15 } +2024-07-25 21:44:22,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1350/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 1.8859586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:22,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43646 samples/s/p 3:26:00 } +2024-07-25 21:44:25,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1352/ 1625], loss: 1.028, per_step_time: 1474ms, lr: 1.8853527e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:44:25,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.42565 samples/s/p 3:26:22 } +2024-07-25 21:44:28,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1354/ 1625], loss: 0.906, per_step_time: 1472ms, lr: 1.8847466e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:28,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43440 samples/s/p 3:25:59 } +2024-07-25 21:44:31,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1356/ 1625], loss: 1.156, per_step_time: 1473ms, lr: 1.8841405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:31,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.42764 samples/s/p 3:26:12 } +2024-07-25 21:44:34,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1358/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 1.883534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:34,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.43268 samples/s/p 3:25:57 } +2024-07-25 21:44:37,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1360/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 1.882928e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:37,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.43437 samples/s/p 3:25:51 } +2024-07-25 21:44:40,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1362/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 1.8823217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:40,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% 
|████████████████████████ | 5.43533 samples/s/p 3:25:45 } +2024-07-25 21:44:43,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1364/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 1.8817153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:43,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.43508 samples/s/p 3:25:43 } +2024-07-25 21:44:46,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1366/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 1.8811088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:46,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.42836 samples/s/p 3:25:55 } +2024-07-25 21:44:49,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1368/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 1.8805022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:49,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.43358 samples/s/p 3:25:41 } +2024-07-25 21:44:52,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1370/ 1625], loss: 1.189, per_step_time: 1470ms, lr: 1.8798957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:52,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.44030 samples/s/p 3:25:22 } +2024-07-25 21:44:55,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1372/ 1625], loss: 1.286, per_step_time: 1469ms, lr: 1.8792889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:55,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.44322 samples/s/p 3:25:13 } +2024-07-25 21:44:58,096 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1374/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.8786823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:58,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43503 samples/s/p 3:25:28 } +2024-07-25 21:45:01,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1376/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.8780756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:01,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43144 samples/s/p 3:25:34 } +2024-07-25 21:45:03,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1378/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 1.8774688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:03,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43778 samples/s/p 3:25:16 } +2024-07-25 21:45:06,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1380/ 1625], loss: 1.317, per_step_time: 1471ms, lr: 1.8768616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:06,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43733 samples/s/p 3:25:14 } +2024-07-25 21:45:09,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1382/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 1.876255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:09,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43288 samples/s/p 3:25:22 } +2024-07-25 21:45:12,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1384/ 1625], loss: 1.066, 
per_step_time: 1471ms, lr: 1.875648e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:12,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43775 samples/s/p 3:25:08 } +2024-07-25 21:45:15,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1386/ 1625], loss: 1.354, per_step_time: 1472ms, lr: 1.8750408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:15,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43188 samples/s/p 3:25:18 } +2024-07-25 21:45:18,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1388/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 1.8744337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:18,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43220 samples/s/p 3:25:14 } +2024-07-25 21:45:21,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1390/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 1.8738265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:21,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43443 samples/s/p 3:25:06 } +2024-07-25 21:45:24,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1392/ 1625], loss: 1.255, per_step_time: 1472ms, lr: 1.8732191e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:24,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43311 samples/s/p 3:25:06 } +2024-07-25 21:45:27,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1394/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.872612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:27,608 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43800 samples/s/p 3:24:52 } +2024-07-25 21:45:30,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1396/ 1625], loss: 1.383, per_step_time: 1472ms, lr: 1.8720046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:30,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43161 samples/s/p 3:25:04 } +2024-07-25 21:45:33,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1398/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.8713974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:33,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43220 samples/s/p 3:24:59 } +2024-07-25 21:45:36,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1400/ 1625], loss: 1.313, per_step_time: 1472ms, lr: 1.8707897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:36,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43112 samples/s/p 3:24:59 } +2024-07-25 21:45:39,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1402/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.870182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:39,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43453 samples/s/p 3:24:48 } +2024-07-25 21:45:42,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1404/ 1625], loss: 0.955, per_step_time: 1470ms, lr: 1.8695746e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:42,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.44142 
samples/s/p 3:24:30 } +2024-07-25 21:45:45,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1406/ 1625], loss: 1.150, per_step_time: 1473ms, lr: 1.8689669e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:45,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.42928 samples/s/p 3:24:54 } +2024-07-25 21:45:48,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1408/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 1.8683593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:48,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43360 samples/s/p 3:24:42 } +2024-07-25 21:45:51,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1410/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 1.8677512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:51,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43910 samples/s/p 3:24:26 } +2024-07-25 21:45:54,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1412/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 1.8671435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:54,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43390 samples/s/p 3:24:35 } +2024-07-25 21:45:57,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1414/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 1.8665356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:57,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43202 samples/s/p 3:24:36 } +2024-07-25 21:46:00,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 5/ 10], step:[ 1416/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 1.8659277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:00,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43706 samples/s/p 3:24:22 } +2024-07-25 21:46:03,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1418/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 1.8653196e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:03,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43009 samples/s/p 3:24:35 } +2024-07-25 21:46:05,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1420/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.8647115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:05,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43740 samples/s/p 3:24:15 } +2024-07-25 21:46:08,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1422/ 1625], loss: 1.319, per_step_time: 1473ms, lr: 1.8641036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:08,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43050 samples/s/p 3:24:28 } +2024-07-25 21:46:11,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1424/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.8634952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:11,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43782 samples/s/p 3:24:09 } +2024-07-25 21:46:14,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1426/ 1625], loss: 0.986, per_step_time: 1473ms, lr: 1.862887e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:46:14,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.42791 samples/s/p 3:24:28 } +2024-07-25 21:46:17,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1428/ 1625], loss: 1.176, per_step_time: 1474ms, lr: 1.8622788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:17,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.42621 samples/s/p 3:24:29 } +2024-07-25 21:46:20,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1430/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 1.8616704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:20,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43190 samples/s/p 3:24:13 } +2024-07-25 21:46:23,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1432/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 1.861062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:23,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43553 samples/s/p 3:24:02 } +2024-07-25 21:46:26,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1434/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 1.8604534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:26,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43523 samples/s/p 3:24:00 } +2024-07-25 21:46:29,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1436/ 1625], loss: 0.952, per_step_time: 1473ms, lr: 1.859845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:29,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% 
|████████████████████████ | 5.42988 samples/s/p 3:24:09 } +2024-07-25 21:46:32,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1438/ 1625], loss: 1.084, per_step_time: 1473ms, lr: 1.8592364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:32,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43086 samples/s/p 3:24:04 } +2024-07-25 21:46:35,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1440/ 1625], loss: 1.313, per_step_time: 1472ms, lr: 1.8586277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:35,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43394 samples/s/p 3:23:54 } +2024-07-25 21:46:38,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1442/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 1.858019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:38,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43684 samples/s/p 3:23:44 } +2024-07-25 21:46:41,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1444/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.8574103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:41,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43329 samples/s/p 3:23:49 } +2024-07-25 21:46:44,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1446/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 1.8568015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:44,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.44104 samples/s/p 3:23:29 } +2024-07-25 21:46:47,298 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1448/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 1.8561926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:47,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.44062 samples/s/p 3:23:27 } +2024-07-25 21:46:50,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1450/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 1.8555837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:50,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43323 samples/s/p 3:23:41 } +2024-07-25 21:46:53,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1452/ 1625], loss: 1.312, per_step_time: 1472ms, lr: 1.8549747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:53,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43365 samples/s/p 3:23:37 } +2024-07-25 21:46:56,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1454/ 1625], loss: 1.153, per_step_time: 1470ms, lr: 1.8543657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:56,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43861 samples/s/p 3:23:23 } +2024-07-25 21:46:59,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1456/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.8537567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:59,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43466 samples/s/p 3:23:29 } +2024-07-25 21:47:02,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1458/ 1625], loss: 1.175, 
per_step_time: 1472ms, lr: 1.8531473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:02,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43421 samples/s/p 3:23:27 } +2024-07-25 21:47:05,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1460/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 1.8525381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:05,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43890 samples/s/p 3:23:13 } +2024-07-25 21:47:07,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1462/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.8519288e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:07,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43744 samples/s/p 3:23:13 } +2024-07-25 21:47:10,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1464/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 1.8513196e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:10,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43690 samples/s/p 3:23:12 } +2024-07-25 21:47:13,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1466/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 1.8507104e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:13,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43752 samples/s/p 3:23:07 } +2024-07-25 21:47:16,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1468/ 1625], loss: 1.024, per_step_time: 1469ms, lr: 1.8501007e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:16,798 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.44466 samples/s/p 3:22:48 } +2024-07-25 21:47:19,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1470/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 1.8494913e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:19,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43764 samples/s/p 3:23:01 } +2024-07-25 21:47:22,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1472/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 1.8488818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:22,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.43142 samples/s/p 3:23:12 } +2024-07-25 21:47:25,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1474/ 1625], loss: 1.323, per_step_time: 1469ms, lr: 1.848272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:25,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.44268 samples/s/p 3:22:44 } +2024-07-25 21:47:28,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1476/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 1.8476625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:28,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.43218 samples/s/p 3:23:05 } +2024-07-25 21:47:31,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1478/ 1625], loss: 1.269, per_step_time: 1473ms, lr: 1.8470528e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:31,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.42938 
samples/s/p 3:23:08 } +2024-07-25 21:47:34,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1480/ 1625], loss: 1.130, per_step_time: 1473ms, lr: 1.846443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:34,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.43054 samples/s/p 3:23:02 } +2024-07-25 21:47:37,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1482/ 1625], loss: 1.064, per_step_time: 1470ms, lr: 1.8458331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:37,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.44164 samples/s/p 3:22:35 } +2024-07-25 21:47:40,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1484/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 1.8452232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:40,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.43622 samples/s/p 3:22:44 } +2024-07-25 21:47:43,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1486/ 1625], loss: 1.126, per_step_time: 1473ms, lr: 1.8446133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:43,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.43108 samples/s/p 3:22:52 } +2024-07-25 21:47:46,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1488/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 1.8440034e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:46,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43628 samples/s/p 3:22:38 } +2024-07-25 21:47:49,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 5/ 10], step:[ 1490/ 1625], loss: 1.207, per_step_time: 1474ms, lr: 1.8433933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:49,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.42691 samples/s/p 3:22:56 } +2024-07-25 21:47:52,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1492/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 1.8427832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:52,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43789 samples/s/p 3:22:28 } +2024-07-25 21:47:55,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1494/ 1625], loss: 1.010, per_step_time: 1471ms, lr: 1.8421732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:55,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43626 samples/s/p 3:22:29 } +2024-07-25 21:47:58,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1496/ 1625], loss: 1.187, per_step_time: 1470ms, lr: 1.841563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:58,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43888 samples/s/p 3:22:20 } +2024-07-25 21:48:01,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1498/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.8409528e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:01,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43713 samples/s/p 3:22:21 } +2024-07-25 21:48:04,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1500/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 1.8403425e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:48:04,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43472 samples/s/p 3:22:24 } +2024-07-25 21:48:06,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1502/ 1625], loss: 0.982, per_step_time: 1472ms, lr: 1.839732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:06,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43397 samples/s/p 3:22:22 } +2024-07-25 21:48:09,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1504/ 1625], loss: 1.385, per_step_time: 1473ms, lr: 1.8391216e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:09,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.42977 samples/s/p 3:22:29 } +2024-07-25 21:48:12,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1506/ 1625], loss: 1.153, per_step_time: 1470ms, lr: 1.8385112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:12,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.44121 samples/s/p 3:22:00 } +2024-07-25 21:48:15,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1508/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 1.8379005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:15,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.43607 samples/s/p 3:22:09 } +2024-07-25 21:48:18,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1510/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 1.8372903e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:18,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% 
|████████████████████████ | 5.43838 samples/s/p 3:22:01 } +2024-07-25 21:48:21,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1512/ 1625], loss: 1.319, per_step_time: 1472ms, lr: 1.8366794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:21,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.43373 samples/s/p 3:22:08 } +2024-07-25 21:48:24,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1514/ 1625], loss: 1.263, per_step_time: 1473ms, lr: 1.8360686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:24,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.42957 samples/s/p 3:22:15 } +2024-07-25 21:48:27,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1516/ 1625], loss: 1.070, per_step_time: 1470ms, lr: 1.8354582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:27,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.44193 samples/s/p 3:21:44 } +2024-07-25 21:48:30,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1518/ 1625], loss: 1.164, per_step_time: 1472ms, lr: 1.8348474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:30,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.43242 samples/s/p 3:22:02 } +2024-07-25 21:48:33,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1520/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.8342364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:33,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43730 samples/s/p 3:21:48 } +2024-07-25 21:48:36,467 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1522/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 1.8336255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:36,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43550 samples/s/p 3:21:50 } +2024-07-25 21:48:39,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1524/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 1.8330145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:39,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43671 samples/s/p 3:21:44 } +2024-07-25 21:48:42,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1526/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.8324039e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:42,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43718 samples/s/p 3:21:40 } +2024-07-25 21:48:45,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1528/ 1625], loss: 1.280, per_step_time: 1472ms, lr: 1.8317924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:45,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43397 samples/s/p 3:21:44 } +2024-07-25 21:48:48,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1530/ 1625], loss: 1.245, per_step_time: 1471ms, lr: 1.8311814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:48,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43548 samples/s/p 3:21:38 } +2024-07-25 21:48:51,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1532/ 1625], loss: 1.274, 
per_step_time: 1471ms, lr: 1.8305704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:51,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43790 samples/s/p 3:21:29 } +2024-07-25 21:48:54,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1534/ 1625], loss: 0.995, per_step_time: 1470ms, lr: 1.8299592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:54,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.44191 samples/s/p 3:21:18 } +2024-07-25 21:48:57,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1536/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 1.8293478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:57,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43734 samples/s/p 3:21:25 } +2024-07-25 21:49:00,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1538/ 1625], loss: 1.015, per_step_time: 1471ms, lr: 1.8287366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:00,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43694 samples/s/p 3:21:23 } +2024-07-25 21:49:03,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1540/ 1625], loss: 1.409, per_step_time: 1472ms, lr: 1.8281251e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:03,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43162 samples/s/p 3:21:32 } +2024-07-25 21:49:05,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1542/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 1.8275137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:05,969 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43510 samples/s/p 3:21:21 } +2024-07-25 21:49:08,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1544/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 1.8269022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:08,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43493 samples/s/p 3:21:18 } +2024-07-25 21:49:11,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1546/ 1625], loss: 1.053, per_step_time: 1472ms, lr: 1.8262908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:11,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43448 samples/s/p 3:21:16 } +2024-07-25 21:49:14,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1548/ 1625], loss: 1.337, per_step_time: 1472ms, lr: 1.8256795e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:14,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43128 samples/s/p 3:21:21 } +2024-07-25 21:49:17,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1550/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 1.8250676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:17,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43227 samples/s/p 3:21:15 } +2024-07-25 21:49:20,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1552/ 1625], loss: 0.950, per_step_time: 1470ms, lr: 1.824456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:20,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.44074 
samples/s/p 3:20:54 } +2024-07-25 21:49:23,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1554/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 1.8238445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:23,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43425 samples/s/p 3:21:05 } +2024-07-25 21:49:26,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1556/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.8232326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:26,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43592 samples/s/p 3:20:59 } +2024-07-25 21:49:29,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1558/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.8226207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:29,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43182 samples/s/p 3:21:05 } +2024-07-25 21:49:32,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1560/ 1625], loss: 1.035, per_step_time: 1471ms, lr: 1.822009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:32,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43741 samples/s/p 3:20:49 } +2024-07-25 21:49:35,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1562/ 1625], loss: 0.939, per_step_time: 1471ms, lr: 1.8213968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:35,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43594 samples/s/p 3:20:50 } +2024-07-25 21:49:38,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 5/ 10], step:[ 1564/ 1625], loss: 1.295, per_step_time: 1474ms, lr: 1.820785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:38,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.42738 samples/s/p 3:21:06 } +2024-07-25 21:49:41,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1566/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 1.8201728e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:41,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43352 samples/s/p 3:20:49 } +2024-07-25 21:49:44,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1568/ 1625], loss: 1.305, per_step_time: 1470ms, lr: 1.8195607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:44,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.44209 samples/s/p 3:20:27 } +2024-07-25 21:49:47,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1570/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 1.8189487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:47,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43646 samples/s/p 3:20:37 } +2024-07-25 21:49:50,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1572/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 1.8183366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:50,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43240 samples/s/p 3:20:43 } +2024-07-25 21:49:53,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1574/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.8177245e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:49:53,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43342 samples/s/p 3:20:38 } +2024-07-25 21:49:56,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1576/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 1.8171122e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:56,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43471 samples/s/p 3:20:32 } +2024-07-25 21:49:59,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1578/ 1625], loss: 0.957, per_step_time: 1471ms, lr: 1.8165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:59,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43655 samples/s/p 3:20:25 } +2024-07-25 21:50:02,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1580/ 1625], loss: 1.067, per_step_time: 1470ms, lr: 1.8158873e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:02,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43856 samples/s/p 3:20:17 } +2024-07-25 21:50:04,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1582/ 1625], loss: 1.251, per_step_time: 1470ms, lr: 1.815275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:04,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.44024 samples/s/p 3:20:11 } +2024-07-25 21:50:07,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1584/ 1625], loss: 1.024, per_step_time: 1471ms, lr: 1.8146626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:07,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% 
|████████████████████████ | 5.43586 samples/s/p 3:20:17 } +2024-07-25 21:50:10,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1586/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 1.8140501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:10,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43929 samples/s/p 3:20:07 } +2024-07-25 21:50:13,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1588/ 1625], loss: 1.242, per_step_time: 1473ms, lr: 1.8134375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:13,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43017 samples/s/p 3:20:24 } +2024-07-25 21:50:16,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1590/ 1625], loss: 1.226, per_step_time: 1469ms, lr: 1.8128248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:16,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.44317 samples/s/p 3:19:53 } +2024-07-25 21:50:19,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1592/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 1.8122122e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:19,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43748 samples/s/p 3:20:02 } +2024-07-25 21:50:22,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1594/ 1625], loss: 1.348, per_step_time: 1472ms, lr: 1.8115996e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:22,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43365 samples/s/p 3:20:08 } +2024-07-25 21:50:25,635 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1596/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 1.8109868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:25,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43473 samples/s/p 3:20:02 } +2024-07-25 21:50:28,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1598/ 1625], loss: 1.319, per_step_time: 1471ms, lr: 1.8103741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:28,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43484 samples/s/p 3:19:59 } +2024-07-25 21:50:31,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1600/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 1.8097613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:31,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43170 samples/s/p 3:20:03 } +2024-07-25 21:50:34,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1602/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 1.8091481e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:34,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43435 samples/s/p 3:19:54 } +2024-07-25 21:50:37,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1604/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 1.8085353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:37,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43346 samples/s/p 3:19:53 } +2024-07-25 21:50:40,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1606/ 1625], loss: 1.076, 
per_step_time: 1471ms, lr: 1.8079225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:40,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43793 samples/s/p 3:19:41 } +2024-07-25 21:50:43,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1608/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.8073093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:43,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43592 samples/s/p 3:19:42 } +2024-07-25 21:50:46,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1610/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 1.8066961e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:46,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43789 samples/s/p 3:19:35 } +2024-07-25 21:50:49,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1612/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 1.8060831e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:49,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43586 samples/s/p 3:19:36 } +2024-07-25 21:50:52,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1614/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 1.8054698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:52,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43779 samples/s/p 3:19:29 } +2024-07-25 21:50:55,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1616/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.8048568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:55,144 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43339 samples/s/p 3:19:36 } +2024-07-25 21:50:58,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1618/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 1.8042434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:58,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.43388 samples/s/p 3:19:32 } +2024-07-25 21:51:01,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1620/ 1625], loss: 1.042, per_step_time: 1470ms, lr: 1.8036299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:01,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.44183 samples/s/p 3:19:11 } +2024-07-25 21:51:03,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1622/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 1.8030169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:03,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.43362 samples/s/p 3:19:26 } +2024-07-25 21:51:06,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1624/ 1625], loss: 0.980, per_step_time: 1469ms, lr: 1.8024031e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:06,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.44246 samples/s/p 3:19:04 } +2024-07-25 21:51:09,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 1.80179e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:09,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.43598 samples/s/p 
3:19:15 } +2024-07-25 21:51:12,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 3/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.8011764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:12,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.43709 samples/s/p 3:19:10 } +2024-07-25 21:51:15,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 5/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 1.8005629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:15,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.43180 samples/s/p 3:19:19 } +2024-07-25 21:51:18,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 7/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 1.7999491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:18,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.43900 samples/s/p 3:19:00 } +2024-07-25 21:51:21,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 9/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 1.7993356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:21,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43363 samples/s/p 3:19:09 } +2024-07-25 21:51:24,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 11/ 1625], loss: 1.096, per_step_time: 1469ms, lr: 1.7987217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:24,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.44266 samples/s/p 3:18:46 } +2024-07-25 21:51:27,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], 
step:[ 13/ 1625], loss: 1.056, per_step_time: 1475ms, lr: 1.798108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:27,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.42037 samples/s/p 3:19:32 } +2024-07-25 21:51:30,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 15/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 1.7974944e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:30,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43326 samples/s/p 3:19:01 } +2024-07-25 21:51:33,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 17/ 1625], loss: 0.984, per_step_time: 1471ms, lr: 1.7968803e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:33,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43834 samples/s/p 3:18:47 } +2024-07-25 21:51:36,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 19/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 1.7962668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:36,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.42985 samples/s/p 3:19:02 } +2024-07-25 21:51:39,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 21/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 1.7956525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:39,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43831 samples/s/p 3:18:41 } +2024-07-25 21:51:42,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 23/ 1625], loss: 1.355, per_step_time: 1471ms, lr: 1.7950388e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:51:42,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43616 samples/s/p 3:18:43 } +2024-07-25 21:51:45,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 25/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 1.7944249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:45,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43719 samples/s/p 3:18:37 } +2024-07-25 21:51:48,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 27/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 1.7938106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:48,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43928 samples/s/p 3:18:30 } +2024-07-25 21:51:51,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 29/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 1.7931965e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:51,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43446 samples/s/p 3:18:38 } +2024-07-25 21:51:54,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 31/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 1.7925824e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:54,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43391 samples/s/p 3:18:36 } +2024-07-25 21:51:57,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 33/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.7919681e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:57,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% 
|█████████████████████████ | 5.43170 samples/s/p 3:18:38 } +2024-07-25 21:52:00,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 35/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 1.7913539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:00,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43059 samples/s/p 3:18:37 } +2024-07-25 21:52:03,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 37/ 1625], loss: 1.025, per_step_time: 1473ms, lr: 1.7907396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:03,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43099 samples/s/p 3:18:33 } +2024-07-25 21:52:05,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 39/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 1.7901253e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:05,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43403 samples/s/p 3:18:24 } +2024-07-25 21:52:08,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 41/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 1.789511e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:08,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.43454 samples/s/p 3:18:20 } +2024-07-25 21:52:11,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 43/ 1625], loss: 1.354, per_step_time: 1470ms, lr: 1.7888964e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:11,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.44173 samples/s/p 3:18:01 } +2024-07-25 21:52:14,812 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 45/ 1625], loss: 1.080, per_step_time: 1470ms, lr: 1.788282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:14,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.43992 samples/s/p 3:18:02 } +2024-07-25 21:52:17,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 47/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 1.7876677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:17,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.43248 samples/s/p 3:18:15 } +2024-07-25 21:52:20,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 49/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.787053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:20,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.43562 samples/s/p 3:18:06 } +2024-07-25 21:52:23,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 51/ 1625], loss: 1.256, per_step_time: 1474ms, lr: 1.7864384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:23,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.42377 samples/s/p 3:18:29 } +2024-07-25 21:52:26,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 53/ 1625], loss: 1.194, per_step_time: 1469ms, lr: 1.7858238e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:26,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.44572 samples/s/p 3:17:38 } +2024-07-25 21:52:29,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 55/ 1625], loss: 1.111, 
per_step_time: 1472ms, lr: 1.7852091e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:29,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.43384 samples/s/p 3:18:01 } +2024-07-25 21:52:32,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 57/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.7845947e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:32,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43581 samples/s/p 3:17:53 } +2024-07-25 21:52:35,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 59/ 1625], loss: 1.319, per_step_time: 1472ms, lr: 1.7839797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:35,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43148 samples/s/p 3:18:00 } +2024-07-25 21:52:38,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 61/ 1625], loss: 1.065, per_step_time: 1473ms, lr: 1.7833649e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:38,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.42852 samples/s/p 3:18:03 } +2024-07-25 21:52:41,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 63/ 1625], loss: 1.351, per_step_time: 1473ms, lr: 1.78275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:41,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43086 samples/s/p 3:17:55 } +2024-07-25 21:52:44,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 65/ 1625], loss: 1.109, per_step_time: 1470ms, lr: 1.7821352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:44,328 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43974 samples/s/p 3:17:33 } +2024-07-25 21:52:47,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 67/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 1.78152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:47,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43787 samples/s/p 3:17:34 } +2024-07-25 21:52:50,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 69/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 1.7809052e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:50,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43727 samples/s/p 3:17:33 } +2024-07-25 21:52:53,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 71/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 1.7802902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:53,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43816 samples/s/p 3:17:28 } +2024-07-25 21:52:56,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 73/ 1625], loss: 1.242, per_step_time: 1482ms, lr: 1.7796752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:56,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.39665 samples/s/p 3:18:56 } +2024-07-25 21:52:59,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 75/ 1625], loss: 0.993, per_step_time: 1470ms, lr: 1.77906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:59,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43963 samples/s/p 
3:17:19 } +2024-07-25 21:53:02,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 77/ 1625], loss: 0.873, per_step_time: 1470ms, lr: 1.7784449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:02,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.44149 samples/s/p 3:17:12 } +2024-07-25 21:53:04,991 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 79/ 1625], loss: 1.275, per_step_time: 1470ms, lr: 1.7778299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:04,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43929 samples/s/p 3:17:13 } +2024-07-25 21:53:07,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 81/ 1625], loss: 1.112, per_step_time: 1469ms, lr: 1.7772145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:07,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.44342 samples/s/p 3:17:01 } +2024-07-25 21:53:10,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 83/ 1625], loss: 1.101, per_step_time: 1470ms, lr: 1.7765991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:10,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43850 samples/s/p 3:17:09 } +2024-07-25 21:53:13,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 85/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 1.775984e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:13,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43394 samples/s/p 3:17:16 } +2024-07-25 21:53:16,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], 
step:[ 87/ 1625], loss: 1.158, per_step_time: 1469ms, lr: 1.7753686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:16,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.44372 samples/s/p 3:16:52 } +2024-07-25 21:53:19,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 89/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 1.774753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:19,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43326 samples/s/p 3:17:12 } +2024-07-25 21:53:22,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 91/ 1625], loss: 1.184, per_step_time: 1469ms, lr: 1.7741377e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:22,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.44290 samples/s/p 3:16:48 } +2024-07-25 21:53:25,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 93/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 1.7735223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:25,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43422 samples/s/p 3:17:04 } +2024-07-25 21:53:28,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 95/ 1625], loss: 1.079, per_step_time: 1472ms, lr: 1.7729066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:28,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43280 samples/s/p 3:17:04 } +2024-07-25 21:53:31,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 97/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 1.772291e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:53:31,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43098 samples/s/p 3:17:05 } +2024-07-25 21:53:34,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 99/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 1.7716755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:34,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43067 samples/s/p 3:17:03 } +2024-07-25 21:53:37,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 101/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 1.77106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:37,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43871 samples/s/p 3:16:42 } +2024-07-25 21:53:40,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 103/ 1625], loss: 1.210, per_step_time: 1471ms, lr: 1.7704442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:40,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43725 samples/s/p 3:16:43 } +2024-07-25 21:53:43,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 105/ 1625], loss: 1.068, per_step_time: 1472ms, lr: 1.7698285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:43,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43452 samples/s/p 3:16:46 } +2024-07-25 21:53:46,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 107/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 1.7692128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:46,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% 
|█████████████████████████ | 5.43970 samples/s/p 3:16:31 } +2024-07-25 21:53:49,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 109/ 1625], loss: 1.241, per_step_time: 1470ms, lr: 1.768597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:49,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43920 samples/s/p 3:16:29 } +2024-07-25 21:53:52,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 111/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 1.767981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:52,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43456 samples/s/p 3:16:37 } +2024-07-25 21:53:55,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 113/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 1.7673652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:55,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43542 samples/s/p 3:16:32 } +2024-07-25 21:53:58,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 115/ 1625], loss: 1.137, per_step_time: 1473ms, lr: 1.7667493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:58,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43004 samples/s/p 3:16:41 } +2024-07-25 21:54:01,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 117/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 1.7661332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:01,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43237 samples/s/p 3:16:33 } +2024-07-25 21:54:03,999 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 119/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.7655173e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:03,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43408 samples/s/p 3:16:26 } +2024-07-25 21:54:06,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 121/ 1625], loss: 1.184, per_step_time: 1473ms, lr: 1.764901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:06,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.42948 samples/s/p 3:16:33 } +2024-07-25 21:54:09,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 123/ 1625], loss: 1.144, per_step_time: 1472ms, lr: 1.7642853e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:09,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43111 samples/s/p 3:16:26 } +2024-07-25 21:54:12,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 125/ 1625], loss: 1.249, per_step_time: 1473ms, lr: 1.763669e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:12,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43050 samples/s/p 3:16:25 } +2024-07-25 21:54:15,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 127/ 1625], loss: 1.226, per_step_time: 1470ms, lr: 1.7630528e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:15,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43857 samples/s/p 3:16:04 } +2024-07-25 21:54:18,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 129/ 1625], loss: 1.178, 
per_step_time: 1473ms, lr: 1.7624367e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:18,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43099 samples/s/p 3:16:18 } +2024-07-25 21:54:21,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 131/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.7618206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:21,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43167 samples/s/p 3:16:13 } +2024-07-25 21:54:24,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 133/ 1625], loss: 1.187, per_step_time: 1473ms, lr: 1.761204e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:24,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.42939 samples/s/p 3:16:15 } +2024-07-25 21:54:27,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 135/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 1.7605877e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:27,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43304 samples/s/p 3:16:05 } +2024-07-25 21:54:30,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 137/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 1.7599716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:30,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43164 samples/s/p 3:16:05 } +2024-07-25 21:54:33,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 139/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.759355e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:33,522 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43769 samples/s/p 3:15:49 } +2024-07-25 21:54:36,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 141/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 1.7587385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:36,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43766 samples/s/p 3:15:46 } +2024-07-25 21:54:39,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 143/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.7581222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:39,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43667 samples/s/p 3:15:45 } +2024-07-25 21:54:42,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 145/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 1.7575056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:42,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43761 samples/s/p 3:15:40 } +2024-07-25 21:54:45,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 147/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 1.756889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:45,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43426 samples/s/p 3:15:44 } +2024-07-25 21:54:48,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 149/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 1.7562725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:48,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43531 
samples/s/p 3:15:39 } +2024-07-25 21:54:51,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 151/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 1.7556558e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:51,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43564 samples/s/p 3:15:35 } +2024-07-25 21:54:54,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 153/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 1.7550392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:54,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43738 samples/s/p 3:15:29 } +2024-07-25 21:54:57,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 155/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 1.7544224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:57,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43263 samples/s/p 3:15:36 } +2024-07-25 21:55:00,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 157/ 1625], loss: 1.088, per_step_time: 1476ms, lr: 1.7538056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:00,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.41711 samples/s/p 3:16:07 } +2024-07-25 21:55:03,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 159/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 1.753189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:03,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43743 samples/s/p 3:15:20 } +2024-07-25 21:55:05,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 6/ 10], step:[ 161/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.7525721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:05,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43303 samples/s/p 3:15:26 } +2024-07-25 21:55:08,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 163/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 1.7519553e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:08,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43432 samples/s/p 3:15:21 } +2024-07-25 21:55:11,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 165/ 1625], loss: 0.986, per_step_time: 1471ms, lr: 1.7513383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:11,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43726 samples/s/p 3:15:11 } +2024-07-25 21:55:14,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 167/ 1625], loss: 1.230, per_step_time: 1473ms, lr: 1.7507215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:14,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43025 samples/s/p 3:15:23 } +2024-07-25 21:55:17,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 169/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.7501043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:17,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43328 samples/s/p 3:15:14 } +2024-07-25 21:55:20,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 171/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.7494875e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:55:20,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.43455 samples/s/p 3:15:08 } +2024-07-25 21:55:23,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 173/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 1.7488705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:23,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.43545 samples/s/p 3:15:03 } +2024-07-25 21:55:26,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 175/ 1625], loss: 1.275, per_step_time: 1469ms, lr: 1.7482535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:26,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.44280 samples/s/p 3:14:45 } +2024-07-25 21:55:29,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 177/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 1.7476359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:29,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.43517 samples/s/p 3:14:58 } +2024-07-25 21:55:32,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 179/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 1.747019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:32,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.42801 samples/s/p 3:15:11 } +2024-07-25 21:55:35,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 181/ 1625], loss: 1.304, per_step_time: 1472ms, lr: 1.7464017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:35,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% 
|█████████████████████████ | 5.43208 samples/s/p 3:14:59 } +2024-07-25 21:55:38,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 183/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 1.7457845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:38,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.43572 samples/s/p 3:14:48 } +2024-07-25 21:55:41,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 185/ 1625], loss: 1.223, per_step_time: 1474ms, lr: 1.7451674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:41,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.42554 samples/s/p 3:15:07 } +2024-07-25 21:55:44,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 187/ 1625], loss: 1.056, per_step_time: 1472ms, lr: 1.74455e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:44,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43272 samples/s/p 3:14:49 } +2024-07-25 21:55:47,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 189/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 1.7439326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:47,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43745 samples/s/p 3:14:36 } +2024-07-25 21:55:50,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 191/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.7433153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:50,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43780 samples/s/p 3:14:32 } +2024-07-25 21:55:53,208 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 193/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 1.7426979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:53,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43379 samples/s/p 3:14:38 } +2024-07-25 21:55:56,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 195/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.7420805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:56,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43664 samples/s/p 3:14:28 } +2024-07-25 21:55:59,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 197/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 1.741463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:59,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.44038 samples/s/p 3:14:18 } +2024-07-25 21:56:02,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 199/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 1.7408454e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:02,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43571 samples/s/p 3:14:25 } +2024-07-25 21:56:05,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 201/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 1.740228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:05,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43203 samples/s/p 3:14:30 } +2024-07-25 21:56:07,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 203/ 1625], loss: 1.177, 
per_step_time: 1470ms, lr: 1.7396103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:07,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.44071 samples/s/p 3:14:08 } +2024-07-25 21:56:10,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 205/ 1625], loss: 1.142, per_step_time: 1473ms, lr: 1.7389928e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:10,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.42973 samples/s/p 3:14:29 } +2024-07-25 21:56:13,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 207/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.7383752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:13,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43590 samples/s/p 3:14:12 } +2024-07-25 21:56:16,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 209/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 1.7377573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:16,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43658 samples/s/p 3:14:08 } +2024-07-25 21:56:19,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 211/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 1.7371396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:19,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43294 samples/s/p 3:14:13 } +2024-07-25 21:56:22,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 213/ 1625], loss: 1.324, per_step_time: 1473ms, lr: 1.7365219e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:22,717 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43098 samples/s/p 3:14:14 } +2024-07-25 21:56:25,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 215/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 1.735904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:25,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43332 samples/s/p 3:14:06 } +2024-07-25 21:56:28,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 217/ 1625], loss: 1.055, per_step_time: 1473ms, lr: 1.7352862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:28,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43098 samples/s/p 3:14:08 } +2024-07-25 21:56:31,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 219/ 1625], loss: 1.014, per_step_time: 1472ms, lr: 1.7346685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:31,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43476 samples/s/p 3:13:57 } +2024-07-25 21:56:34,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 221/ 1625], loss: 1.076, per_step_time: 1473ms, lr: 1.7340506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:34,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.42896 samples/s/p 3:14:07 } +2024-07-25 21:56:37,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 223/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 1.7334327e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:37,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43343 
samples/s/p 3:13:54 } +2024-07-25 21:56:40,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 225/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 1.7328146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:40,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43854 samples/s/p 3:13:40 } +2024-07-25 21:56:43,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 227/ 1625], loss: 1.229, per_step_time: 1474ms, lr: 1.7321967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:43,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.42566 samples/s/p 3:14:05 } +2024-07-25 21:56:46,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 229/ 1625], loss: 0.899, per_step_time: 1472ms, lr: 1.7315788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:46,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43442 samples/s/p 3:13:43 } +2024-07-25 21:56:49,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 231/ 1625], loss: 0.989, per_step_time: 1469ms, lr: 1.7309607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:49,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.44338 samples/s/p 3:13:21 } +2024-07-25 21:56:52,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 233/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.7303424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:52,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43717 samples/s/p 3:13:31 } +2024-07-25 21:56:55,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 6/ 10], step:[ 235/ 1625], loss: 1.290, per_step_time: 1470ms, lr: 1.7297245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:55,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43871 samples/s/p 3:13:25 } +2024-07-25 21:56:58,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 237/ 1625], loss: 1.151, per_step_time: 1470ms, lr: 1.729106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:58,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43983 samples/s/p 3:13:20 } +2024-07-25 21:57:01,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 239/ 1625], loss: 1.328, per_step_time: 1472ms, lr: 1.728488e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:01,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43130 samples/s/p 3:13:35 } +2024-07-25 21:57:04,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 241/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 1.7278699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:04,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43241 samples/s/p 3:13:30 } +2024-07-25 21:57:06,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 243/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 1.7272516e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:06,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43184 samples/s/p 3:13:28 } +2024-07-25 21:57:09,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 245/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 1.7266331e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:57:09,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43911 samples/s/p 3:13:10 } +2024-07-25 21:57:12,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 247/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 1.7260149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:12,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.44085 samples/s/p 3:13:03 } +2024-07-25 21:57:15,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 249/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 1.7253966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:15,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43788 samples/s/p 3:13:06 } +2024-07-25 21:57:18,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 251/ 1625], loss: 1.072, per_step_time: 1470ms, lr: 1.7247781e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:18,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.44200 samples/s/p 3:12:55 } +2024-07-25 21:57:21,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 253/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 1.7241597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:21,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43170 samples/s/p 3:13:14 } +2024-07-25 21:57:24,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 255/ 1625], loss: 1.000, per_step_time: 1470ms, lr: 1.7235412e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:24,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% 
|█████████████████████████ | 5.44060 samples/s/p 3:12:52 } +2024-07-25 21:57:27,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 257/ 1625], loss: 1.069, per_step_time: 1474ms, lr: 1.722923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:27,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.42445 samples/s/p 3:13:23 } +2024-07-25 21:57:30,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 259/ 1625], loss: 1.322, per_step_time: 1470ms, lr: 1.7223043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:30,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43991 samples/s/p 3:12:47 } +2024-07-25 21:57:33,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 261/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 1.7216857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:33,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43176 samples/s/p 3:13:02 } +2024-07-25 21:57:36,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 263/ 1625], loss: 1.325, per_step_time: 1471ms, lr: 1.7210672e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:36,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43783 samples/s/p 3:12:46 } +2024-07-25 21:57:39,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 265/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 1.7204486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:39,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43807 samples/s/p 3:12:42 } +2024-07-25 21:57:42,385 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 267/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.7198297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:42,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43351 samples/s/p 3:12:49 } +2024-07-25 21:57:45,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 269/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 1.7192113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:45,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43661 samples/s/p 3:12:40 } +2024-07-25 21:57:48,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 271/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 1.7185926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:48,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43434 samples/s/p 3:12:42 } +2024-07-25 21:57:51,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 273/ 1625], loss: 1.273, per_step_time: 1471ms, lr: 1.7179738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:51,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43812 samples/s/p 3:12:31 } +2024-07-25 21:57:54,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 275/ 1625], loss: 1.379, per_step_time: 1471ms, lr: 1.717355e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:54,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43765 samples/s/p 3:12:29 } +2024-07-25 21:57:54,186 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 21:58:30,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 277/ 1625], loss: 1.121, per_step_time: 3167ms, lr: 1.7167362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:30,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 2.52574 samples/s/p 6:54:17 } +2024-07-25 21:58:32,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 279/ 1625], loss: 1.205, per_step_time: 1473ms, lr: 1.7161175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:32,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.42974 samples/s/p 3:12:40 } +2024-07-25 21:58:35,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 281/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 1.7154985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:36,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43717 samples/s/p 3:12:21 } +2024-07-25 21:58:39,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 283/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 1.7148795e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:39,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43792 samples/s/p 3:12:16 } +2024-07-25 21:58:42,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 285/ 1625], loss: 0.981, per_step_time: 1470ms, lr: 1.7142607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:42,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.44062 samples/s/p 3:12:08 } +2024-07-25 21:58:45,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], 
step:[ 287/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.7136417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:45,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43227 samples/s/p 3:12:22 } +2024-07-25 21:58:47,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 289/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.7130225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:47,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43840 samples/s/p 3:12:06 } +2024-07-25 21:58:50,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 291/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 1.7124037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:50,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43349 samples/s/p 3:12:14 } +2024-07-25 21:58:53,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 293/ 1625], loss: 1.123, per_step_time: 1470ms, lr: 1.7117847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:53,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.44054 samples/s/p 3:11:56 } +2024-07-25 21:58:56,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 295/ 1625], loss: 0.973, per_step_time: 1470ms, lr: 1.7111655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:56,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43866 samples/s/p 3:11:57 } +2024-07-25 21:58:59,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 297/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 1.7105465e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:58:59,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43765 samples/s/p 3:11:56 } +2024-07-25 21:59:02,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 299/ 1625], loss: 0.974, per_step_time: 1472ms, lr: 1.7099273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:02,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43478 samples/s/p 3:11:59 } +2024-07-25 21:59:05,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 301/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 1.7093083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:05,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.44093 samples/s/p 3:11:43 } +2024-07-25 21:59:08,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 303/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 1.708689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:08,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43537 samples/s/p 3:11:52 } +2024-07-25 21:59:11,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 305/ 1625], loss: 1.362, per_step_time: 1469ms, lr: 1.7080698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:11,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.44533 samples/s/p 3:11:28 } +2024-07-25 21:59:14,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 307/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 1.7074506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:14,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% 
|█████████████████████████ | 5.43648 samples/s/p 3:11:44 } +2024-07-25 21:59:17,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 309/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.7068312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:17,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43515 samples/s/p 3:11:44 } +2024-07-25 21:59:20,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 311/ 1625], loss: 1.137, per_step_time: 1470ms, lr: 1.7062119e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:20,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43889 samples/s/p 3:11:33 } +2024-07-25 21:59:23,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 313/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 1.7055927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:23,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43687 samples/s/p 3:11:34 } +2024-07-25 21:59:26,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 315/ 1625], loss: 1.022, per_step_time: 1472ms, lr: 1.7049733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:26,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43234 samples/s/p 3:11:41 } +2024-07-25 21:59:29,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 317/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.704354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:29,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.43241 samples/s/p 3:11:38 } +2024-07-25 21:59:32,239 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 319/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 1.7037344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:32,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.43812 samples/s/p 3:11:23 } +2024-07-25 21:59:35,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 321/ 1625], loss: 1.310, per_step_time: 1474ms, lr: 1.703115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:35,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.42539 samples/s/p 3:11:47 } +2024-07-25 21:59:38,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 323/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 1.7024955e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:38,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.43359 samples/s/p 3:11:27 } +2024-07-25 21:59:41,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 325/ 1625], loss: 1.131, per_step_time: 1470ms, lr: 1.701876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:41,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.43856 samples/s/p 3:11:13 } +2024-07-25 21:59:44,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 327/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.7012564e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:44,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.43597 samples/s/p 3:11:16 } +2024-07-25 21:59:46,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 329/ 1625], loss: 1.033, 
per_step_time: 1470ms, lr: 1.7006369e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:46,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.44048 samples/s/p 3:11:03 } +2024-07-25 21:59:49,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 331/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 1.7000175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:49,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.43358 samples/s/p 3:11:15 } +2024-07-25 21:59:52,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 333/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.6993976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:52,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.43666 samples/s/p 3:11:05 } +2024-07-25 21:59:55,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 335/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 1.698778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:55,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43774 samples/s/p 3:11:00 } +2024-07-25 21:59:58,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 337/ 1625], loss: 1.244, per_step_time: 1470ms, lr: 1.6981583e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:58,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43981 samples/s/p 3:10:53 } +2024-07-25 22:00:01,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 339/ 1625], loss: 1.302, per_step_time: 1471ms, lr: 1.6975388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:01,743 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43689 samples/s/p 3:10:56 } +2024-07-25 22:00:04,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 341/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 1.6969188e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:04,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43769 samples/s/p 3:10:51 } +2024-07-25 22:00:07,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 343/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 1.6962991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:07,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43682 samples/s/p 3:10:50 } +2024-07-25 22:00:10,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 345/ 1625], loss: 1.281, per_step_time: 1470ms, lr: 1.6956794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:10,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43942 samples/s/p 3:10:42 } +2024-07-25 22:00:13,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 347/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.6950595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:13,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43184 samples/s/p 3:10:55 } +2024-07-25 22:00:16,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 349/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.6944396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:16,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43818 
samples/s/p 3:10:39 } +2024-07-25 22:00:19,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 351/ 1625], loss: 1.214, per_step_time: 1470ms, lr: 1.69382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:19,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43858 samples/s/p 3:10:35 } +2024-07-25 22:00:22,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 353/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 1.6932001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:22,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43320 samples/s/p 3:10:43 } +2024-07-25 22:00:25,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 355/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 1.69258e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:25,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43754 samples/s/p 3:10:31 } +2024-07-25 22:00:28,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 357/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 1.6919603e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:28,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43533 samples/s/p 3:10:33 } +2024-07-25 22:00:31,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 359/ 1625], loss: 1.077, per_step_time: 1471ms, lr: 1.6913402e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:31,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43688 samples/s/p 3:10:27 } +2024-07-25 22:00:34,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 6/ 10], step:[ 361/ 1625], loss: 1.336, per_step_time: 1471ms, lr: 1.6907201e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:34,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43546 samples/s/p 3:10:27 } +2024-07-25 22:00:37,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 363/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 1.6901002e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:37,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43983 samples/s/p 3:10:15 } +2024-07-25 22:00:40,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 365/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.68948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:40,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43555 samples/s/p 3:10:21 } +2024-07-25 22:00:43,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 367/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 1.68886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:43,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43286 samples/s/p 3:10:23 } +2024-07-25 22:00:45,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 369/ 1625], loss: 1.036, per_step_time: 1471ms, lr: 1.6882399e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:45,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43485 samples/s/p 3:10:16 } +2024-07-25 22:00:48,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 371/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.6876196e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:00:48,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43536 samples/s/p 3:10:12 } +2024-07-25 22:00:51,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 373/ 1625], loss: 1.123, per_step_time: 1474ms, lr: 1.6869997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:51,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.42488 samples/s/p 3:10:31 } +2024-07-25 22:00:54,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 375/ 1625], loss: 1.107, per_step_time: 1473ms, lr: 1.6863796e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:54,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.42825 samples/s/p 3:10:21 } +2024-07-25 22:00:57,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 377/ 1625], loss: 1.180, per_step_time: 1470ms, lr: 1.6857595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:57,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43874 samples/s/p 3:09:56 } +2024-07-25 22:01:00,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 379/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 1.685139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:00,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43113 samples/s/p 3:10:09 } +2024-07-25 22:01:03,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 381/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.6845188e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:03,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
52.3% |██████████████████████████ | 5.43560 samples/s/p 3:09:57 } +2024-07-25 22:01:06,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 383/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 1.6838985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:06,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43082 samples/s/p 3:10:04 } +2024-07-25 22:01:09,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 385/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 1.6832782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:09,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.42945 samples/s/p 3:10:04 } +2024-07-25 22:01:12,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 387/ 1625], loss: 1.080, per_step_time: 1473ms, lr: 1.682658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:12,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.42774 samples/s/p 3:10:05 } +2024-07-25 22:01:15,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 389/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 1.6820375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:15,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43524 samples/s/p 3:09:46 } +2024-07-25 22:01:18,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 391/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 1.6814174e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:18,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43274 samples/s/p 3:09:48 } +2024-07-25 22:01:21,424 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 393/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 1.6807968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:21,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43851 samples/s/p 3:09:33 } +2024-07-25 22:01:24,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 395/ 1625], loss: 1.084, per_step_time: 1479ms, lr: 1.6801763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:24,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.40652 samples/s/p 3:10:38 } +2024-07-25 22:01:27,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 397/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 1.679556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:27,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43670 samples/s/p 3:09:31 } +2024-07-25 22:01:30,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 399/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.6789356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:30,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43449 samples/s/p 3:09:33 } +2024-07-25 22:01:33,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 401/ 1625], loss: 1.224, per_step_time: 1475ms, lr: 1.678315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:33,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.42131 samples/s/p 3:09:57 } +2024-07-25 22:01:36,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 403/ 1625], loss: 
1.256, per_step_time: 1470ms, lr: 1.6776945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:36,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43988 samples/s/p 3:09:16 } +2024-07-25 22:01:39,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 405/ 1625], loss: 1.144, per_step_time: 1470ms, lr: 1.6770739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:39,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43896 samples/s/p 3:09:15 } +2024-07-25 22:01:42,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 407/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 1.6764534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:42,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43360 samples/s/p 3:09:23 } +2024-07-25 22:01:45,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 409/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.6758328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:45,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43488 samples/s/p 3:09:17 } +2024-07-25 22:01:48,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 411/ 1625], loss: 1.214, per_step_time: 1483ms, lr: 1.6752121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:48,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.39225 samples/s/p 3:10:44 } +2024-07-25 22:01:50,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 413/ 1625], loss: 0.987, per_step_time: 1471ms, lr: 1.6745917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:01:50,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43781 samples/s/p 3:09:05 } +2024-07-25 22:01:53,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 415/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 1.6739708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:53,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43433 samples/s/p 3:09:10 } +2024-07-25 22:01:56,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 417/ 1625], loss: 1.017, per_step_time: 1470ms, lr: 1.6733502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:56,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43971 samples/s/p 3:08:55 } +2024-07-25 22:01:59,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 419/ 1625], loss: 1.198, per_step_time: 1473ms, lr: 1.6727296e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:59,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.42989 samples/s/p 3:09:13 } +2024-07-25 22:02:02,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 421/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 1.672109e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:02,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43481 samples/s/p 3:09:00 } +2024-07-25 22:02:05,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 423/ 1625], loss: 1.291, per_step_time: 1474ms, lr: 1.671488e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:05,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% 
|██████████████████████████ | 5.42604 samples/s/p 3:09:15 } +2024-07-25 22:02:08,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 425/ 1625], loss: 0.963, per_step_time: 1471ms, lr: 1.6708673e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:08,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43720 samples/s/p 3:08:49 } +2024-07-25 22:02:11,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 427/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 1.6702465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:11,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43776 samples/s/p 3:08:45 } +2024-07-25 22:02:14,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 429/ 1625], loss: 1.089, per_step_time: 1473ms, lr: 1.6696256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:14,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.42969 samples/s/p 3:08:59 } +2024-07-25 22:02:17,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 431/ 1625], loss: 1.230, per_step_time: 1474ms, lr: 1.6690048e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:17,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.42732 samples/s/p 3:09:01 } +2024-07-25 22:02:20,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 433/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.6683838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:20,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43129 samples/s/p 3:08:49 } +2024-07-25 22:02:23,444 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 435/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 1.6677632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:23,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43518 samples/s/p 3:08:38 } +2024-07-25 22:02:26,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 437/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.6671422e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:26,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43290 samples/s/p 3:08:40 } +2024-07-25 22:02:29,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 439/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.6665212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:29,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43313 samples/s/p 3:08:37 } +2024-07-25 22:02:32,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 441/ 1625], loss: 1.141, per_step_time: 1469ms, lr: 1.6659005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:32,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.44233 samples/s/p 3:08:15 } +2024-07-25 22:02:35,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 443/ 1625], loss: 1.103, per_step_time: 1470ms, lr: 1.6652793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:35,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43917 samples/s/p 3:08:18 } +2024-07-25 22:02:38,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 445/ 1625], loss: 
1.198, per_step_time: 1471ms, lr: 1.6646582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:38,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43634 samples/s/p 3:08:21 } +2024-07-25 22:02:41,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 447/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 1.6640375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:41,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43113 samples/s/p 3:08:29 } +2024-07-25 22:02:44,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 449/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.6634163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:44,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43273 samples/s/p 3:08:23 } +2024-07-25 22:02:47,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 451/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 1.6627953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:47,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43651 samples/s/p 3:08:12 } +2024-07-25 22:02:50,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 453/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.6621743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:50,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43116 samples/s/p 3:08:20 } +2024-07-25 22:02:52,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 455/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 1.661553e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:02:52,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43552 samples/s/p 3:08:08 } +2024-07-25 22:02:55,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 457/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 1.6609321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:55,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43567 samples/s/p 3:08:05 } +2024-07-25 22:02:58,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 459/ 1625], loss: 1.000, per_step_time: 1472ms, lr: 1.6603108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:58,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43384 samples/s/p 3:08:06 } +2024-07-25 22:03:01,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 461/ 1625], loss: 1.101, per_step_time: 1469ms, lr: 1.6596896e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:01,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.44245 samples/s/p 3:07:45 } +2024-07-25 22:03:04,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 463/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.6590686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:04,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43534 samples/s/p 3:07:57 } +2024-07-25 22:03:07,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 465/ 1625], loss: 1.186, per_step_time: 1473ms, lr: 1.6584474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:07,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% 
|██████████████████████████ | 5.42910 samples/s/p 3:08:07 } +2024-07-25 22:03:10,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 467/ 1625], loss: 0.951, per_step_time: 1471ms, lr: 1.657826e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:10,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43619 samples/s/p 3:07:49 } +2024-07-25 22:03:13,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 469/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 1.6572048e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:13,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43934 samples/s/p 3:07:40 } +2024-07-25 22:03:16,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 471/ 1625], loss: 1.016, per_step_time: 1473ms, lr: 1.6565837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:16,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43049 samples/s/p 3:07:55 } +2024-07-25 22:03:19,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 473/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 1.6559625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:19,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43190 samples/s/p 3:07:49 } +2024-07-25 22:03:22,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 475/ 1625], loss: 1.308, per_step_time: 1472ms, lr: 1.6553411e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:22,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43353 samples/s/p 3:07:43 } +2024-07-25 22:03:25,422 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 477/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.6547197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:25,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43654 samples/s/p 3:07:34 } +2024-07-25 22:03:28,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 479/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 1.6540986e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:28,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43616 samples/s/p 3:07:32 } +2024-07-25 22:03:31,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 481/ 1625], loss: 1.252, per_step_time: 1477ms, lr: 1.653477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:31,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.41631 samples/s/p 3:08:10 } +2024-07-25 22:03:34,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 483/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 1.6528556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:34,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43149 samples/s/p 3:07:35 } +2024-07-25 22:03:37,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 485/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 1.6522345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:37,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43571 samples/s/p 3:07:24 } +2024-07-25 22:03:40,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 487/ 1625], loss: 
1.072, per_step_time: 1484ms, lr: 1.651613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:40,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.38918 samples/s/p 3:08:58 } +2024-07-25 22:03:43,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 489/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 1.6509914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:43,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43197 samples/s/p 3:07:26 } +2024-07-25 22:03:46,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 491/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 1.6503702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:46,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43708 samples/s/p 3:07:12 } +2024-07-25 22:03:49,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 493/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 1.6497484e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:49,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43860 samples/s/p 3:07:06 } +2024-07-25 22:03:52,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 495/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 1.649127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:52,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43815 samples/s/p 3:07:04 } +2024-07-25 22:03:54,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 497/ 1625], loss: 1.268, per_step_time: 1471ms, lr: 1.6485055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:54,963 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43696 samples/s/p 3:07:03 } +2024-07-25 22:03:57,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 499/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 1.6478842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:57,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43664 samples/s/p 3:07:01 } +2024-07-25 22:04:00,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 501/ 1625], loss: 1.102, per_step_time: 1474ms, lr: 1.6472628e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:00,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.42413 samples/s/p 3:07:24 } +2024-07-25 22:04:03,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 503/ 1625], loss: 1.243, per_step_time: 1470ms, lr: 1.6466409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:03,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43937 samples/s/p 3:06:50 } +2024-07-25 22:04:06,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 505/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 1.6460193e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:06,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43199 samples/s/p 3:07:02 } +2024-07-25 22:04:09,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 507/ 1625], loss: 1.141, per_step_time: 1470ms, lr: 1.645398e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:09,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.44074 
samples/s/p 3:06:41 } +2024-07-25 22:04:12,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 509/ 1625], loss: 1.268, per_step_time: 1472ms, lr: 1.6447762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:12,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43230 samples/s/p 3:06:55 } +2024-07-25 22:04:15,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 511/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 1.6441545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:15,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43284 samples/s/p 3:06:51 } +2024-07-25 22:04:18,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 513/ 1625], loss: 1.055, per_step_time: 1471ms, lr: 1.6435331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:18,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43631 samples/s/p 3:06:41 } +2024-07-25 22:04:21,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 515/ 1625], loss: 1.060, per_step_time: 1471ms, lr: 1.6429112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:21,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43650 samples/s/p 3:06:38 } +2024-07-25 22:04:24,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 517/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 1.6422895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:24,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43331 samples/s/p 3:06:42 } +2024-07-25 22:04:27,428 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 6/ 10], step:[ 519/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 1.641668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:27,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43128 samples/s/p 3:06:43 } +2024-07-25 22:04:30,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 521/ 1625], loss: 1.244, per_step_time: 1471ms, lr: 1.6410462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:30,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43611 samples/s/p 3:06:30 } +2024-07-25 22:04:33,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 523/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 1.6404245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:33,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43356 samples/s/p 3:06:32 } +2024-07-25 22:04:36,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 525/ 1625], loss: 1.376, per_step_time: 1473ms, lr: 1.6398028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:36,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.42799 samples/s/p 3:06:41 } +2024-07-25 22:04:39,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 527/ 1625], loss: 1.008, per_step_time: 1473ms, lr: 1.639181e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:39,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43050 samples/s/p 3:06:33 } +2024-07-25 22:04:42,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 529/ 1625], loss: 1.129, per_step_time: 1470ms, lr: 1.6385593e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 22:04:42,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.44067 samples/s/p 3:06:09 } +2024-07-25 22:04:45,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 531/ 1625], loss: 1.436, per_step_time: 1473ms, lr: 1.6379374e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:45,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.43097 samples/s/p 3:06:26 } +2024-07-25 22:04:48,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 533/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 1.6373155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:48,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.43835 samples/s/p 3:06:08 } +2024-07-25 22:04:51,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 535/ 1625], loss: 1.201, per_step_time: 1470ms, lr: 1.6366937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:51,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.43885 samples/s/p 3:06:04 } +2024-07-25 22:04:53,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 537/ 1625], loss: 1.072, per_step_time: 1470ms, lr: 1.636072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:53,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.44116 samples/s/p 3:05:56 } +2024-07-25 22:04:56,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 539/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 1.6354501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:56,934 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 53.3% |██████████████████████████ | 5.43809 samples/s/p 3:05:59 } +2024-07-25 22:04:59,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 541/ 1625], loss: 1.300, per_step_time: 1472ms, lr: 1.6348282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:59,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.43374 samples/s/p 3:06:05 } +2024-07-25 22:05:02,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 543/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.6342063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:02,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.43222 samples/s/p 3:06:05 } +2024-07-25 22:05:05,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 545/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 1.6335844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:05,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.44062 samples/s/p 3:05:45 } +2024-07-25 22:05:08,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 547/ 1625], loss: 1.291, per_step_time: 1472ms, lr: 1.6329626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:08,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43230 samples/s/p 3:05:59 } +2024-07-25 22:05:11,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 549/ 1625], loss: 1.330, per_step_time: 1471ms, lr: 1.6323405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:11,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43532 samples/s/p 3:05:50 } +2024-07-25 22:05:14,638 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 551/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 1.6317186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:14,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43800 samples/s/p 3:05:42 } +2024-07-25 22:05:17,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 553/ 1625], loss: 1.262, per_step_time: 1474ms, lr: 1.6310967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:17,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.42398 samples/s/p 3:06:08 } +2024-07-25 22:05:20,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 555/ 1625], loss: 1.357, per_step_time: 1471ms, lr: 1.6304746e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:20,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43816 samples/s/p 3:05:36 } +2024-07-25 22:05:23,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 557/ 1625], loss: 1.058, per_step_time: 1475ms, lr: 1.6298527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:23,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.42168 samples/s/p 3:06:07 } +2024-07-25 22:05:26,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 559/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 1.6292306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:26,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43559 samples/s/p 3:05:35 } +2024-07-25 22:05:29,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 561/ 1625], loss: 
1.229, per_step_time: 1473ms, lr: 1.6286087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:29,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.42770 samples/s/p 3:05:48 } +2024-07-25 22:05:32,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 563/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 1.6279866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:32,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.43642 samples/s/p 3:05:27 } +2024-07-25 22:05:35,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 565/ 1625], loss: 0.905, per_step_time: 1471ms, lr: 1.6273645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:35,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.43584 samples/s/p 3:05:26 } +2024-07-25 22:05:38,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 567/ 1625], loss: 1.168, per_step_time: 1473ms, lr: 1.6267424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:38,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.43002 samples/s/p 3:05:35 } +2024-07-25 22:05:41,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 569/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 1.6261205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:41,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.43229 samples/s/p 3:05:27 } +2024-07-25 22:05:44,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 571/ 1625], loss: 1.005, per_step_time: 1470ms, lr: 1.6254982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:05:44,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.43932 samples/s/p 3:05:10 } +2024-07-25 22:05:47,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 573/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 1.6248761e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:47,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.44027 samples/s/p 3:05:05 } +2024-07-25 22:05:50,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 575/ 1625], loss: 1.241, per_step_time: 1474ms, lr: 1.6242542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:50,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.42728 samples/s/p 3:05:28 } +2024-07-25 22:05:53,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 577/ 1625], loss: 1.043, per_step_time: 1472ms, lr: 1.623632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:53,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43218 samples/s/p 3:05:15 } +2024-07-25 22:05:55,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 579/ 1625], loss: 1.273, per_step_time: 1472ms, lr: 1.6230098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:55,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43294 samples/s/p 3:05:11 } +2024-07-25 22:05:58,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 581/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 1.6223876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:58,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% 
|██████████████████████████ | 5.42790 samples/s/p 3:05:18 } +2024-07-25 22:06:01,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 583/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 1.6217655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:01,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43548 samples/s/p 3:05:00 } +2024-07-25 22:06:04,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 585/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 1.6211432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:04,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43335 samples/s/p 3:05:01 } +2024-07-25 22:06:07,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 587/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.6205211e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:07,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43716 samples/s/p 3:04:51 } +2024-07-25 22:06:10,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 589/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 1.6198988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:10,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43874 samples/s/p 3:04:44 } +2024-07-25 22:06:13,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 591/ 1625], loss: 0.934, per_step_time: 1470ms, lr: 1.6192767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:13,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.44076 samples/s/p 3:04:37 } +2024-07-25 22:06:16,624 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 593/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 1.6186543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:16,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43808 samples/s/p 3:04:40 } +2024-07-25 22:06:19,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 595/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 1.618032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:19,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43162 samples/s/p 3:04:50 } +2024-07-25 22:06:22,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 597/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 1.6174099e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:22,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43887 samples/s/p 3:04:32 } +2024-07-25 22:06:25,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 599/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 1.6167876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:25,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.44003 samples/s/p 3:04:27 } +2024-07-25 22:06:28,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 601/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 1.6161654e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:28,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43547 samples/s/p 3:04:33 } +2024-07-25 22:06:31,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 603/ 1625], loss: 
1.143, per_step_time: 1472ms, lr: 1.6155429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:31,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43475 samples/s/p 3:04:32 } +2024-07-25 22:06:34,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 605/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 1.6149206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:34,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43789 samples/s/p 3:04:23 } +2024-07-25 22:06:37,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 607/ 1625], loss: 1.029, per_step_time: 1472ms, lr: 1.6142983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:37,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43366 samples/s/p 3:04:28 } +2024-07-25 22:06:40,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 609/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 1.6136759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:40,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43399 samples/s/p 3:04:25 } +2024-07-25 22:06:43,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 611/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.6130536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:43,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.43961 samples/s/p 3:04:10 } +2024-07-25 22:06:46,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 613/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 1.6124313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:06:46,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.43121 samples/s/p 3:04:24 } +2024-07-25 22:06:49,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 615/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 1.6118087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:49,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.44068 samples/s/p 3:04:02 } +2024-07-25 22:06:52,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 617/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.6111862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:52,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.44073 samples/s/p 3:03:59 } +2024-07-25 22:06:54,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 619/ 1625], loss: 1.076, per_step_time: 1475ms, lr: 1.6105641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:54,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.42278 samples/s/p 3:04:33 } +2024-07-25 22:06:57,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 621/ 1625], loss: 1.093, per_step_time: 1473ms, lr: 1.6099417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:57,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.43004 samples/s/p 3:04:15 } +2024-07-25 22:07:00,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 623/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 1.609319e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:00,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% 
|██████████████████████████ | 5.43458 samples/s/p 3:04:03 } +2024-07-25 22:07:03,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 625/ 1625], loss: 1.006, per_step_time: 1472ms, lr: 1.6086968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:03,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.43410 samples/s/p 3:04:01 } +2024-07-25 22:07:06,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 627/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 1.6080743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:06,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43501 samples/s/p 3:03:56 } +2024-07-25 22:07:09,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 629/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.6074518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:09,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43325 samples/s/p 3:03:57 } +2024-07-25 22:07:12,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 631/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 1.6068294e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:12,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43334 samples/s/p 3:03:54 } +2024-07-25 22:07:15,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 633/ 1625], loss: 1.459, per_step_time: 1472ms, lr: 1.606207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:15,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43376 samples/s/p 3:03:50 } +2024-07-25 22:07:18,596 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 635/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 1.6055847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:18,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43213 samples/s/p 3:03:50 } +2024-07-25 22:07:21,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 637/ 1625], loss: 1.307, per_step_time: 1475ms, lr: 1.6049618e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:21,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.42361 samples/s/p 3:04:05 } +2024-07-25 22:07:24,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 639/ 1625], loss: 0.981, per_step_time: 1473ms, lr: 1.6043394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:24,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.42932 samples/s/p 3:03:50 } +2024-07-25 22:07:27,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 641/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 1.603717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:27,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43524 samples/s/p 3:03:35 } +2024-07-25 22:07:30,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 643/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.6030945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:30,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.43512 samples/s/p 3:03:32 } +2024-07-25 22:07:33,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 645/ 1625], loss: 
1.152, per_step_time: 1472ms, lr: 1.6024716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:33,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.43114 samples/s/p 3:03:37 } +2024-07-25 22:07:36,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 647/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.6018494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:36,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.43436 samples/s/p 3:03:28 } +2024-07-25 22:07:39,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 649/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.6012267e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:39,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.43158 samples/s/p 3:03:31 } +2024-07-25 22:07:42,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 651/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 1.600604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:42,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.43361 samples/s/p 3:03:24 } +2024-07-25 22:07:45,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 653/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 1.5999816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:45,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.43155 samples/s/p 3:03:25 } +2024-07-25 22:07:48,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 655/ 1625], loss: 1.053, per_step_time: 1469ms, lr: 1.599359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:07:48,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.44218 samples/s/p 3:03:00 } +2024-07-25 22:07:51,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 657/ 1625], loss: 1.057, per_step_time: 1470ms, lr: 1.5987367e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:51,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.43961 samples/s/p 3:03:03 } +2024-07-25 22:07:54,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 659/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.5981137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:54,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43188 samples/s/p 3:03:15 } +2024-07-25 22:07:56,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 661/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 1.597491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:56,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.44069 samples/s/p 3:02:55 } +2024-07-25 22:07:59,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 663/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 1.5968686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:59,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43931 samples/s/p 3:02:54 } +2024-07-25 22:08:02,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 665/ 1625], loss: 1.366, per_step_time: 1472ms, lr: 1.596246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:02,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% 
|███████████████████████████ | 5.43388 samples/s/p 3:03:02 } +2024-07-25 22:08:05,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 667/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 1.5956231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:05,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43522 samples/s/p 3:02:57 } +2024-07-25 22:08:08,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 669/ 1625], loss: 0.984, per_step_time: 1471ms, lr: 1.5950009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:08,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43619 samples/s/p 3:02:52 } +2024-07-25 22:08:11,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 671/ 1625], loss: 1.056, per_step_time: 1471ms, lr: 1.5943782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:11,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43807 samples/s/p 3:02:45 } +2024-07-25 22:08:14,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 673/ 1625], loss: 1.216, per_step_time: 1474ms, lr: 1.5937554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:14,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.42708 samples/s/p 3:03:04 } +2024-07-25 22:08:17,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 675/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.5931328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:17,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43806 samples/s/p 3:02:39 } +2024-07-25 22:08:20,571 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 677/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 1.59251e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:20,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43374 samples/s/p 3:02:45 } +2024-07-25 22:08:23,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 679/ 1625], loss: 1.321, per_step_time: 1471ms, lr: 1.5918875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:23,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43507 samples/s/p 3:02:39 } +2024-07-25 22:08:26,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 681/ 1625], loss: 1.239, per_step_time: 1470ms, lr: 1.5912645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:26,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.44011 samples/s/p 3:02:26 } +2024-07-25 22:08:29,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 683/ 1625], loss: 1.316, per_step_time: 1471ms, lr: 1.5906418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:29,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43531 samples/s/p 3:02:33 } +2024-07-25 22:08:32,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 685/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 1.5900194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:32,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43075 samples/s/p 3:02:39 } +2024-07-25 22:08:35,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 687/ 1625], loss: 
1.299, per_step_time: 1471ms, lr: 1.5893967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:35,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43761 samples/s/p 3:02:23 } +2024-07-25 22:08:38,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 689/ 1625], loss: 1.229, per_step_time: 1470ms, lr: 1.5887737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:38,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43917 samples/s/p 3:02:16 } +2024-07-25 22:08:41,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 691/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 1.5881511e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:41,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43146 samples/s/p 3:02:29 } +2024-07-25 22:08:44,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 693/ 1625], loss: 0.993, per_step_time: 1471ms, lr: 1.5875283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:44,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43705 samples/s/p 3:02:15 } +2024-07-25 22:08:47,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 695/ 1625], loss: 1.366, per_step_time: 1473ms, lr: 1.5869056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:47,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.42987 samples/s/p 3:02:26 } +2024-07-25 22:08:50,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 697/ 1625], loss: 1.421, per_step_time: 1472ms, lr: 1.586283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:08:50,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43146 samples/s/p 3:02:20 } +2024-07-25 22:08:53,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 699/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 1.5856602e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:53,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43031 samples/s/p 3:02:20 } +2024-07-25 22:08:55,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 701/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 1.5850375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:55,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43514 samples/s/p 3:02:07 } +2024-07-25 22:08:58,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 703/ 1625], loss: 1.276, per_step_time: 1472ms, lr: 1.5844147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:58,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43430 samples/s/p 3:02:06 } +2024-07-25 22:09:01,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 705/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 1.5837917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:01,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43638 samples/s/p 3:01:59 } +2024-07-25 22:09:04,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 707/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 1.583169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:04,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% 
|███████████████████████████ | 5.43008 samples/s/p 3:02:08 } +2024-07-25 22:09:07,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 709/ 1625], loss: 1.204, per_step_time: 1474ms, lr: 1.5825464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:07,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.42519 samples/s/p 3:02:15 } +2024-07-25 22:09:10,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 711/ 1625], loss: 1.307, per_step_time: 1472ms, lr: 1.5819236e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:10,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43248 samples/s/p 3:01:58 } +2024-07-25 22:09:13,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 713/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 1.5813008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:13,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43124 samples/s/p 3:01:57 } +2024-07-25 22:09:16,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 715/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 1.5806778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:16,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43686 samples/s/p 3:01:43 } +2024-07-25 22:09:19,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 717/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.580055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:19,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43517 samples/s/p 3:01:43 } +2024-07-25 22:09:22,556 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 719/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.5794321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:22,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43370 samples/s/p 3:01:43 } +2024-07-25 22:09:25,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 721/ 1625], loss: 1.109, per_step_time: 1470ms, lr: 1.5788095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:25,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43918 samples/s/p 3:01:29 } +2024-07-25 22:09:28,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 723/ 1625], loss: 1.309, per_step_time: 1473ms, lr: 1.5781865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:28,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.42882 samples/s/p 3:01:47 } +2024-07-25 22:09:31,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 725/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.5775639e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:31,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43569 samples/s/p 3:01:30 } +2024-07-25 22:09:34,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 727/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 1.5769408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:34,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43625 samples/s/p 3:01:26 } +2024-07-25 22:09:37,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 729/ 1625], 
loss: 1.188, per_step_time: 1471ms, lr: 1.576318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:37,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43627 samples/s/p 3:01:23 } +2024-07-25 22:09:40,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 731/ 1625], loss: 1.017, per_step_time: 1470ms, lr: 1.5756952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:40,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43960 samples/s/p 3:01:14 } +2024-07-25 22:09:43,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 733/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 1.5750724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:43,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43399 samples/s/p 3:01:22 } +2024-07-25 22:09:46,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 735/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 1.5744496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:46,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43359 samples/s/p 3:01:20 } +2024-07-25 22:09:49,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 737/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 1.5738266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:49,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43248 samples/s/p 3:01:19 } +2024-07-25 22:09:52,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 739/ 1625], loss: 1.012, per_step_time: 1470ms, lr: 1.5732037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:09:52,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43970 samples/s/p 3:01:02 } +2024-07-25 22:09:55,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 741/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 1.5725807e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:55,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.44039 samples/s/p 3:00:58 } +2024-07-25 22:09:57,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 743/ 1625], loss: 1.132, per_step_time: 1473ms, lr: 1.5719581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:57,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.43043 samples/s/p 3:01:15 } +2024-07-25 22:10:00,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 745/ 1625], loss: 1.328, per_step_time: 1472ms, lr: 1.571335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:00,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.43290 samples/s/p 3:01:07 } +2024-07-25 22:10:03,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 747/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 1.5707124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:03,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.42907 samples/s/p 3:01:11 } +2024-07-25 22:10:06,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 749/ 1625], loss: 1.139, per_step_time: 1470ms, lr: 1.5700893e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:06,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% 
|███████████████████████████ | 5.43890 samples/s/p 3:00:49 } +2024-07-25 22:10:09,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 751/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 1.5694664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:09,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.43510 samples/s/p 3:00:53 } +2024-07-25 22:10:12,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 753/ 1625], loss: 1.100, per_step_time: 1473ms, lr: 1.5688438e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:12,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.42751 samples/s/p 3:01:06 } +2024-07-25 22:10:15,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 755/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 1.5682208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:15,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.43391 samples/s/p 3:00:50 } +2024-07-25 22:10:18,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 757/ 1625], loss: 1.340, per_step_time: 1472ms, lr: 1.5675978e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:18,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43138 samples/s/p 3:00:52 } +2024-07-25 22:10:21,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 759/ 1625], loss: 1.211, per_step_time: 1474ms, lr: 1.5669748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:21,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.42475 samples/s/p 3:01:02 } +2024-07-25 22:10:24,537 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 761/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 1.566352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:24,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43604 samples/s/p 3:00:37 } +2024-07-25 22:10:27,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 763/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 1.5657291e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:27,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43717 samples/s/p 3:00:32 } +2024-07-25 22:10:30,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 765/ 1625], loss: 1.094, per_step_time: 1473ms, lr: 1.5651061e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:30,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43066 samples/s/p 3:00:42 } +2024-07-25 22:10:33,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 767/ 1625], loss: 1.163, per_step_time: 1473ms, lr: 1.5644831e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:33,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.42798 samples/s/p 3:00:44 } +2024-07-25 22:10:36,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 769/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.5638603e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:36,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43324 samples/s/p 3:00:31 } +2024-07-25 22:10:39,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 771/ 1625], 
loss: 1.200, per_step_time: 1471ms, lr: 1.5632373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:39,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43612 samples/s/p 3:00:22 } +2024-07-25 22:10:42,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 773/ 1625], loss: 1.164, per_step_time: 1472ms, lr: 1.5626145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:42,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43461 samples/s/p 3:00:22 } +2024-07-25 22:10:45,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 775/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.5619917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:45,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43615 samples/s/p 3:00:16 } +2024-07-25 22:10:48,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 777/ 1625], loss: 1.204, per_step_time: 1470ms, lr: 1.5613687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:48,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.44125 samples/s/p 3:00:03 } +2024-07-25 22:10:51,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 779/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 1.5607457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:51,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43661 samples/s/p 3:00:09 } +2024-07-25 22:10:54,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 781/ 1625], loss: 0.989, per_step_time: 1470ms, lr: 1.5601228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:10:54,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43953 samples/s/p 3:00:00 } +2024-07-25 22:10:56,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 783/ 1625], loss: 1.234, per_step_time: 1473ms, lr: 1.5594998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:56,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.42774 samples/s/p 3:00:21 } +2024-07-25 22:10:59,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 785/ 1625], loss: 1.325, per_step_time: 1471ms, lr: 1.5588768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:59,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43549 samples/s/p 3:00:03 } +2024-07-25 22:11:02,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 787/ 1625], loss: 1.202, per_step_time: 1473ms, lr: 1.5582538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:02,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43094 samples/s/p 3:00:09 } +2024-07-25 22:11:05,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 789/ 1625], loss: 1.096, per_step_time: 1470ms, lr: 1.5576308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:05,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.44082 samples/s/p 2:59:46 } +2024-07-25 22:11:08,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 791/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 1.5570082e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:08,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% 
|███████████████████████████ | 5.43834 samples/s/p 2:59:48 } +2024-07-25 22:11:11,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 793/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 1.5563852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:11,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.44061 samples/s/p 2:59:41 } +2024-07-25 22:11:14,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 795/ 1625], loss: 1.086, per_step_time: 1469ms, lr: 1.5557622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:14,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.44559 samples/s/p 2:59:28 } +2024-07-25 22:11:17,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 797/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 1.5551394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:17,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.43705 samples/s/p 2:59:42 } +2024-07-25 22:11:20,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 799/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 1.5545163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:20,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.43426 samples/s/p 2:59:44 } +2024-07-25 22:11:23,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 801/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.5538935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:23,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.43685 samples/s/p 2:59:36 } +2024-07-25 22:11:26,495 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 803/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 1.5532705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:26,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.43139 samples/s/p 2:59:44 } +2024-07-25 22:11:29,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 805/ 1625], loss: 1.086, per_step_time: 1473ms, lr: 1.5526475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:29,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.42936 samples/s/p 2:59:45 } +2024-07-25 22:11:32,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 807/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 1.5520245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:32,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43628 samples/s/p 2:59:29 } +2024-07-25 22:11:35,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 809/ 1625], loss: 0.976, per_step_time: 1472ms, lr: 1.5514017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:35,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43372 samples/s/p 2:59:31 } +2024-07-25 22:11:38,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 811/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 1.5507787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:38,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43146 samples/s/p 2:59:32 } +2024-07-25 22:11:41,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 813/ 1625], 
loss: 1.128, per_step_time: 1471ms, lr: 1.5501559e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:41,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43525 samples/s/p 2:59:22 } +2024-07-25 22:11:44,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 815/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 1.5495329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:44,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.44185 samples/s/p 2:59:06 } +2024-07-25 22:11:47,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 817/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 1.5489097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:47,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43314 samples/s/p 2:59:20 } +2024-07-25 22:11:50,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 819/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 1.5482869e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:50,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.44010 samples/s/p 2:59:03 } +2024-07-25 22:11:53,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 821/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 1.5476639e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:53,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.42961 samples/s/p 2:59:21 } +2024-07-25 22:11:56,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 823/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 1.5470408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:11:56,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.43626 samples/s/p 2:59:05 } +2024-07-25 22:11:58,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 825/ 1625], loss: 1.386, per_step_time: 1471ms, lr: 1.546418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:58,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.43817 samples/s/p 2:58:58 } +2024-07-25 22:12:01,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 827/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 1.5457952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:01,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.43479 samples/s/p 2:59:02 } +2024-07-25 22:12:04,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 829/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 1.545172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:04,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.44148 samples/s/p 2:58:46 } +2024-07-25 22:12:07,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 831/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 1.544549e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:07,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.44024 samples/s/p 2:58:46 } +2024-07-25 22:12:10,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 833/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.5439264e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:10,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% 
|███████████████████████████ | 5.43751 samples/s/p 2:58:48 } +2024-07-25 22:12:13,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 835/ 1625], loss: 1.101, per_step_time: 1473ms, lr: 1.5433032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:13,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.42962 samples/s/p 2:59:01 } +2024-07-25 22:12:16,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 837/ 1625], loss: 1.278, per_step_time: 1473ms, lr: 1.5426804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:16,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43016 samples/s/p 2:58:57 } +2024-07-25 22:12:19,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 839/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 1.5420575e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:19,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43612 samples/s/p 2:58:42 } +2024-07-25 22:12:22,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 841/ 1625], loss: 1.056, per_step_time: 1472ms, lr: 1.5414344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:22,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43322 samples/s/p 2:58:45 } +2024-07-25 22:12:25,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 843/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 1.5408115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:25,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43560 samples/s/p 2:58:37 } +2024-07-25 22:12:28,464 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 845/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 1.5401885e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:28,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.42954 samples/s/p 2:58:46 } +2024-07-25 22:12:31,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 847/ 1625], loss: 1.219, per_step_time: 1473ms, lr: 1.5395655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:31,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43000 samples/s/p 2:58:42 } +2024-07-25 22:12:34,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 849/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 1.5389427e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:34,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43415 samples/s/p 2:58:31 } +2024-07-25 22:12:37,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 851/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 1.5383197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:37,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43726 samples/s/p 2:58:22 } +2024-07-25 22:12:40,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 853/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 1.5376969e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:40,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43481 samples/s/p 2:58:24 } +2024-07-25 22:12:43,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 855/ 1625], 
loss: 1.178, per_step_time: 1468ms, lr: 1.5370739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:43,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.44651 samples/s/p 2:57:58 } +2024-07-25 22:12:46,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 857/ 1625], loss: 1.029, per_step_time: 1470ms, lr: 1.5364512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:46,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43967 samples/s/p 2:58:08 } +2024-07-25 22:12:49,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 859/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 1.535828e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:49,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43674 samples/s/p 2:58:11 } +2024-07-25 22:12:52,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 861/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 1.535205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:52,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43065 samples/s/p 2:58:20 } +2024-07-25 22:12:55,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 863/ 1625], loss: 1.023, per_step_time: 1471ms, lr: 1.5345824e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:55,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43591 samples/s/p 2:58:07 } +2024-07-25 22:12:57,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 865/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 1.5339594e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:12:57,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43125 samples/s/p 2:58:13 } +2024-07-25 22:13:00,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 867/ 1625], loss: 1.138, per_step_time: 1473ms, lr: 1.5333366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:00,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.42857 samples/s/p 2:58:16 } +2024-07-25 22:13:03,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 869/ 1625], loss: 1.033, per_step_time: 1470ms, lr: 1.5327136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:03,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43888 samples/s/p 2:57:52 } +2024-07-25 22:13:06,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 871/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 1.5320908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:06,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.43704 samples/s/p 2:57:53 } +2024-07-25 22:13:09,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 873/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 1.5314678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:09,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.43604 samples/s/p 2:57:52 } +2024-07-25 22:13:12,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 875/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 1.5308447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:12,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% 
|███████████████████████████ | 5.43317 samples/s/p 2:57:55 } +2024-07-25 22:13:15,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 877/ 1625], loss: 1.084, per_step_time: 1469ms, lr: 1.5302221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:15,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.44229 samples/s/p 2:57:34 } +2024-07-25 22:13:18,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 879/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 1.529599e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:18,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.44100 samples/s/p 2:57:33 } +2024-07-25 22:13:21,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 881/ 1625], loss: 1.128, per_step_time: 1470ms, lr: 1.5289763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:21,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.43982 samples/s/p 2:57:33 } +2024-07-25 22:13:24,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 883/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 1.5283535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:24,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.43899 samples/s/p 2:57:31 } +2024-07-25 22:13:27,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 885/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 1.5277303e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:27,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.43237 samples/s/p 2:57:42 } +2024-07-25 22:13:30,418 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 887/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 1.5271076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:30,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43445 samples/s/p 2:57:34 } +2024-07-25 22:13:33,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 889/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 1.5264846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:33,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43461 samples/s/p 2:57:31 } +2024-07-25 22:13:36,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 891/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 1.5258617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:36,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43688 samples/s/p 2:57:24 } +2024-07-25 22:13:39,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 893/ 1625], loss: 1.068, per_step_time: 1473ms, lr: 1.525239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:39,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.42778 samples/s/p 2:57:39 } +2024-07-25 22:13:42,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 895/ 1625], loss: 1.454, per_step_time: 1473ms, lr: 1.5246163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:42,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.42981 samples/s/p 2:57:32 } +2024-07-25 22:13:45,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 897/ 1625], 
loss: 1.099, per_step_time: 1469ms, lr: 1.52399325e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:45,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.44264 samples/s/p 2:57:04 } +2024-07-25 22:13:48,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 899/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 1.5233704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:48,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43114 samples/s/p 2:57:23 } +2024-07-25 22:13:51,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 901/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 1.5227477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:51,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43366 samples/s/p 2:57:15 } +2024-07-25 22:13:54,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 903/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 1.5221247e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:54,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43994 samples/s/p 2:57:00 } +2024-07-25 22:13:56,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 905/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 1.5215018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:56,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43409 samples/s/p 2:57:09 } +2024-07-25 22:13:59,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 907/ 1625], loss: 1.248, per_step_time: 1473ms, lr: 1.5208791e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 22:13:59,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.42881 samples/s/p 2:57:16 } +2024-07-25 22:14:02,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 909/ 1625], loss: 1.398, per_step_time: 1471ms, lr: 1.5202561e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:02,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43740 samples/s/p 2:56:56 } +2024-07-25 22:14:05,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 911/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 1.5196335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:05,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43631 samples/s/p 2:56:56 } +2024-07-25 22:14:08,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 913/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 1.5190108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:08,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43563 samples/s/p 2:56:54 } +2024-07-25 22:14:11,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 915/ 1625], loss: 1.169, per_step_time: 1472ms, lr: 1.518388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:11,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43327 samples/s/p 2:56:56 } +2024-07-25 22:14:14,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 917/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.517765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:14,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% 
|███████████████████████████ | 5.43634 samples/s/p 2:56:47 } +2024-07-25 22:14:17,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 919/ 1625], loss: 1.329, per_step_time: 1471ms, lr: 1.5171423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:17,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43683 samples/s/p 2:56:43 } +2024-07-25 22:14:20,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 921/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.5165197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:20,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43421 samples/s/p 2:56:45 } +2024-07-25 22:14:23,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 923/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 1.5158967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:23,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43248 samples/s/p 2:56:45 } +2024-07-25 22:14:26,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 925/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.5152741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:26,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43629 samples/s/p 2:56:35 } +2024-07-25 22:14:29,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 927/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 1.5146513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:29,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43303 samples/s/p 2:56:38 } +2024-07-25 22:14:32,390 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 929/ 1625], loss: 1.015, per_step_time: 1470ms, lr: 1.5140283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:32,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43911 samples/s/p 2:56:24 } +2024-07-25 22:14:35,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 931/ 1625], loss: 1.250, per_step_time: 1473ms, lr: 1.5134057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:35,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43005 samples/s/p 2:56:38 } +2024-07-25 22:14:38,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 933/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 1.512783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:38,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43340 samples/s/p 2:56:29 } +2024-07-25 22:14:41,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 935/ 1625], loss: 0.977, per_step_time: 1469ms, lr: 1.51216e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:41,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.44304 samples/s/p 2:56:07 } +2024-07-25 22:14:44,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 937/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 1.51153745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:44,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.42764 samples/s/p 2:56:34 } +2024-07-25 22:14:47,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 939/ 1625], loss: 
1.120, per_step_time: 1471ms, lr: 1.5109149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:47,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43827 samples/s/p 2:56:11 } +2024-07-25 22:14:50,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 941/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.510292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:50,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43760 samples/s/p 2:56:09 } +2024-07-25 22:14:53,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 943/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 1.5096692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:53,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43134 samples/s/p 2:56:18 } +2024-07-25 22:14:56,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 945/ 1625], loss: 1.348, per_step_time: 1472ms, lr: 1.5090467e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:56,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43111 samples/s/p 2:56:16 } +2024-07-25 22:14:58,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 947/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 1.5084238e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:58,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43400 samples/s/p 2:56:07 } +2024-07-25 22:15:01,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 949/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 1.5078011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:15:01,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43789 samples/s/p 2:55:57 } +2024-07-25 22:15:04,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 951/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 1.5071786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:04,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43619 samples/s/p 2:55:57 } +2024-07-25 22:15:07,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 953/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 1.5065557e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:07,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43592 samples/s/p 2:55:54 } +2024-07-25 22:15:10,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 955/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.5059332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:10,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43374 samples/s/p 2:55:56 } +2024-07-25 22:15:13,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 957/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 1.5053105e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:13,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43484 samples/s/p 2:55:51 } +2024-07-25 22:15:16,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 959/ 1625], loss: 0.950, per_step_time: 1471ms, lr: 1.5046878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:16,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% 
|███████████████████████████ | 5.43752 samples/s/p 2:55:43 } +2024-07-25 22:15:19,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 961/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.5040652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:19,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43389 samples/s/p 2:55:47 } +2024-07-25 22:15:22,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 963/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 1.5034426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:22,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.42791 samples/s/p 2:55:55 } +2024-07-25 22:15:25,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 965/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 1.5028201e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:25,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43746 samples/s/p 2:55:34 } +2024-07-25 22:15:28,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 967/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.5021974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:28,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.43518 samples/s/p 2:55:35 } +2024-07-25 22:15:31,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 969/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 1.5015748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:31,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.43584 samples/s/p 2:55:31 } +2024-07-25 22:15:34,362 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 971/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 1.5009523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:34,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.43779 samples/s/p 2:55:24 } +2024-07-25 22:15:37,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 973/ 1625], loss: 1.243, per_step_time: 1469ms, lr: 1.5003295e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:37,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.44237 samples/s/p 2:55:13 } +2024-07-25 22:15:40,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 975/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 1.499707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:40,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.43239 samples/s/p 2:55:29 } +2024-07-25 22:15:43,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 977/ 1625], loss: 0.963, per_step_time: 1471ms, lr: 1.4990845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:43,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.43525 samples/s/p 2:55:20 } +2024-07-25 22:15:46,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 979/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 1.4984617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:46,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.43405 samples/s/p 2:55:20 } +2024-07-25 22:15:49,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 981/ 1625], 
loss: 1.077, per_step_time: 1471ms, lr: 1.4978394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:49,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.43608 samples/s/p 2:55:13 } +2024-07-25 22:15:52,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 983/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 1.4972169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:52,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.43004 samples/s/p 2:55:22 } +2024-07-25 22:15:55,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 985/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 1.4965942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:55,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43646 samples/s/p 2:55:06 } +2024-07-25 22:15:57,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 987/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 1.4959717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:57,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43509 samples/s/p 2:55:06 } +2024-07-25 22:16:00,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 989/ 1625], loss: 1.030, per_step_time: 1472ms, lr: 1.49534935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:00,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43278 samples/s/p 2:55:08 } +2024-07-25 22:16:03,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 991/ 1625], loss: 1.453, per_step_time: 1470ms, lr: 1.4947266e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 22:16:03,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.44074 samples/s/p 2:54:49 } +2024-07-25 22:16:06,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 993/ 1625], loss: 0.994, per_step_time: 1472ms, lr: 1.4941042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:06,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43288 samples/s/p 2:55:01 } +2024-07-25 22:16:09,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 995/ 1625], loss: 1.162, per_step_time: 1474ms, lr: 1.4934818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:09,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.42392 samples/s/p 2:55:16 } +2024-07-25 22:16:12,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 997/ 1625], loss: 1.350, per_step_time: 1471ms, lr: 1.4928592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:12,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43690 samples/s/p 2:54:48 } +2024-07-25 22:16:15,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 999/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 1.4922369e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:15,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43066 samples/s/p 2:54:57 } +2024-07-25 22:16:18,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1001/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 1.4916144e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:18,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% 
|████████████████████████████ | 5.43382 samples/s/p 2:54:48 } +2024-07-25 22:16:21,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1003/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 1.4909918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:21,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43516 samples/s/p 2:54:42 } +2024-07-25 22:16:24,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1005/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.4903695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:24,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43974 samples/s/p 2:54:31 } +2024-07-25 22:16:27,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1007/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 1.48974705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:27,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43234 samples/s/p 2:54:42 } +2024-07-25 22:16:30,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1009/ 1625], loss: 1.273, per_step_time: 1472ms, lr: 1.4891244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:30,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43164 samples/s/p 2:54:40 } +2024-07-25 22:16:33,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1011/ 1625], loss: 1.242, per_step_time: 1473ms, lr: 1.4885022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:33,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.42821 samples/s/p 2:54:44 } +2024-07-25 22:16:36,343 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1013/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 1.4878799e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:36,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43179 samples/s/p 2:54:34 } +2024-07-25 22:16:39,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1015/ 1625], loss: 1.013, per_step_time: 1472ms, lr: 1.4872577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:39,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43243 samples/s/p 2:54:30 } +2024-07-25 22:16:42,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1017/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 1.4866351e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:42,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43488 samples/s/p 2:54:22 } +2024-07-25 22:16:45,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1019/ 1625], loss: 1.061, per_step_time: 1470ms, lr: 1.4860129e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:45,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43980 samples/s/p 2:54:10 } +2024-07-25 22:16:48,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1021/ 1625], loss: 0.952, per_step_time: 1471ms, lr: 1.4853906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:48,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43591 samples/s/p 2:54:14 } +2024-07-25 22:16:51,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1023/ 
1625], loss: 1.159, per_step_time: 1472ms, lr: 1.4847682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:51,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43118 samples/s/p 2:54:21 } +2024-07-25 22:16:54,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1025/ 1625], loss: 1.158, per_step_time: 1470ms, lr: 1.4841458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:54,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.44083 samples/s/p 2:53:59 } +2024-07-25 22:16:56,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1027/ 1625], loss: 1.285, per_step_time: 1472ms, lr: 1.4835237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:56,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43154 samples/s/p 2:54:14 } +2024-07-25 22:16:59,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1029/ 1625], loss: 1.255, per_step_time: 1473ms, lr: 1.4829013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:59,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43013 samples/s/p 2:54:14 } +2024-07-25 22:17:02,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1031/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.4822789e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:02,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43563 samples/s/p 2:54:00 } +2024-07-25 22:17:05,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1033/ 1625], loss: 1.072, per_step_time: 1470ms, lr: 1.4816568e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:17:05,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43875 samples/s/p 2:53:51 } +2024-07-25 22:17:08,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1035/ 1625], loss: 1.042, per_step_time: 1470ms, lr: 1.4810344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:08,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.44158 samples/s/p 2:53:43 } +2024-07-25 22:17:11,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1037/ 1625], loss: 0.982, per_step_time: 1470ms, lr: 1.4804124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:11,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43903 samples/s/p 2:53:45 } +2024-07-25 22:17:14,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1039/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 1.4797901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:14,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43487 samples/s/p 2:53:50 } +2024-07-25 22:17:17,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1041/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 1.4791677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:17,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43088 samples/s/p 2:53:55 } +2024-07-25 22:17:20,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1043/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 1.4785456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:20,604 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43311 samples/s/p 2:53:47 } +2024-07-25 22:17:23,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1045/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 1.4779234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:23,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43828 samples/s/p 2:53:35 } +2024-07-25 22:17:26,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1047/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.4773011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:26,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43231 samples/s/p 2:53:43 } +2024-07-25 22:17:29,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1049/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 1.4766791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:29,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.43995 samples/s/p 2:53:25 } +2024-07-25 22:17:32,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1051/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 1.4760571e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:32,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.44108 samples/s/p 2:53:20 } +2024-07-25 22:17:35,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1053/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 1.4754348e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:35,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% 
|████████████████████████████ | 5.43165 samples/s/p 2:53:35 } +2024-07-25 22:17:38,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1055/ 1625], loss: 1.296, per_step_time: 1469ms, lr: 1.4748127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:38,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.44381 samples/s/p 2:53:09 } +2024-07-25 22:17:41,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1057/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.4741907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:41,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.43589 samples/s/p 2:53:21 } +2024-07-25 22:17:44,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1059/ 1625], loss: 1.049, per_step_time: 1472ms, lr: 1.4735684e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:44,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.43316 samples/s/p 2:53:24 } +2024-07-25 22:17:47,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1061/ 1625], loss: 1.281, per_step_time: 1474ms, lr: 1.4729463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:47,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.42736 samples/s/p 2:53:32 } +2024-07-25 22:17:50,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1063/ 1625], loss: 1.011, per_step_time: 1472ms, lr: 1.4723245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:50,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.43348 samples/s/p 2:53:17 } +2024-07-25 22:17:53,058 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1065/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 1.4717026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:53,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.43879 samples/s/p 2:53:04 } +2024-07-25 22:17:56,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1067/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 1.4710804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:56,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.43028 samples/s/p 2:53:17 } +2024-07-25 22:17:58,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1069/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 1.4704584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:58,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.44031 samples/s/p 2:52:55 } +2024-07-25 22:18:01,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1071/ 1625], loss: 1.319, per_step_time: 1473ms, lr: 1.4698364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:01,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.42794 samples/s/p 2:53:16 } +2024-07-25 22:18:04,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1073/ 1625], loss: 1.048, per_step_time: 1474ms, lr: 1.4692143e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:04,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.42617 samples/s/p 2:53:17 } +2024-07-25 22:18:07,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1075/ 
1625], loss: 1.139, per_step_time: 1472ms, lr: 1.4685923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:07,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.43187 samples/s/p 2:53:03 } +2024-07-25 22:18:10,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1077/ 1625], loss: 1.056, per_step_time: 1471ms, lr: 1.4679705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:10,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.43562 samples/s/p 2:52:53 } +2024-07-25 22:18:13,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1079/ 1625], loss: 1.306, per_step_time: 1473ms, lr: 1.4673484e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:13,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.42861 samples/s/p 2:53:03 } +2024-07-25 22:18:16,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1081/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 1.4667266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:16,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.42903 samples/s/p 2:52:59 } +2024-07-25 22:18:19,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1083/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 1.4661047e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:19,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43486 samples/s/p 2:52:45 } +2024-07-25 22:18:22,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1085/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.46548255e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:18:22,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43120 samples/s/p 2:52:49 } +2024-07-25 22:18:25,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1087/ 1625], loss: 1.125, per_step_time: 1473ms, lr: 1.4648608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:25,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43099 samples/s/p 2:52:47 } +2024-07-25 22:18:28,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1089/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 1.464239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:28,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43814 samples/s/p 2:52:30 } +2024-07-25 22:18:31,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1091/ 1625], loss: 1.007, per_step_time: 1472ms, lr: 1.4636169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:31,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43236 samples/s/p 2:52:38 } +2024-07-25 22:18:34,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1093/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 1.4629953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:34,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.42798 samples/s/p 2:52:44 } +2024-07-25 22:18:37,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1095/ 1625], loss: 1.141, per_step_time: 1470ms, lr: 1.4623735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:37,343 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43885 samples/s/p 2:52:20 } +2024-07-25 22:18:40,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1097/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.4617516e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:40,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43468 samples/s/p 2:52:25 } +2024-07-25 22:18:43,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1099/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 1.4611298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:43,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43972 samples/s/p 2:52:12 } +2024-07-25 22:18:46,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1101/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 1.46050825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:46,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43884 samples/s/p 2:52:11 } +2024-07-25 22:18:49,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1103/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 1.4598862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:49,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43268 samples/s/p 2:52:20 } +2024-07-25 22:18:52,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1105/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.4592645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:52,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% 
|████████████████████████████ | 5.43165 samples/s/p 2:52:19 } +2024-07-25 22:18:55,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1107/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 1.458643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:55,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43880 samples/s/p 2:52:02 } +2024-07-25 22:18:57,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1109/ 1625], loss: 0.965, per_step_time: 1471ms, lr: 1.45802105e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:57,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43528 samples/s/p 2:52:06 } +2024-07-25 22:19:00,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1111/ 1625], loss: 1.025, per_step_time: 1470ms, lr: 1.4573995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:00,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.44006 samples/s/p 2:51:54 } +2024-07-25 22:19:03,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1113/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.4567779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:03,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43621 samples/s/p 2:51:58 } +2024-07-25 22:19:06,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1115/ 1625], loss: 0.994, per_step_time: 1469ms, lr: 1.456156e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:06,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.44345 samples/s/p 2:51:42 } +2024-07-25 22:19:09,790 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1117/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.4555345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:09,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43803 samples/s/p 2:51:49 } +2024-07-25 22:19:12,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1119/ 1625], loss: 1.343, per_step_time: 1471ms, lr: 1.45491285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:12,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43641 samples/s/p 2:51:49 } +2024-07-25 22:19:15,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1121/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 1.4542915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:15,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43602 samples/s/p 2:51:47 } +2024-07-25 22:19:18,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1123/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 1.4536697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:18,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43180 samples/s/p 2:51:52 } +2024-07-25 22:19:21,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1125/ 1625], loss: 1.374, per_step_time: 1472ms, lr: 1.4530483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:21,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43190 samples/s/p 2:51:49 } +2024-07-25 22:19:24,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1127/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 1.45242675e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:24,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43339 samples/s/p 2:51:43 } +2024-07-25 22:19:27,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1129/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.451805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:27,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43471 samples/s/p 2:51:38 } +2024-07-25 22:19:30,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1131/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 1.45118365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:30,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43725 samples/s/p 2:51:30 } +2024-07-25 22:19:33,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1133/ 1625], loss: 1.132, per_step_time: 1473ms, lr: 1.4505621e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:33,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.42793 samples/s/p 2:51:45 } +2024-07-25 22:19:36,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1135/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.4499405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:36,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43385 samples/s/p 2:51:31 } +2024-07-25 22:19:39,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1137/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 1.4493192e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:19:39,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43513 samples/s/p 2:51:25 } +2024-07-25 22:19:42,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1139/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 1.4486979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:42,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43490 samples/s/p 2:51:23 } +2024-07-25 22:19:45,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1141/ 1625], loss: 1.429, per_step_time: 1471ms, lr: 1.4480763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:45,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43550 samples/s/p 2:51:19 } +2024-07-25 22:19:48,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1143/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.4474548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:48,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43652 samples/s/p 2:51:14 } +2024-07-25 22:19:51,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1145/ 1625], loss: 0.981, per_step_time: 1470ms, lr: 1.4468337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:51,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.44026 samples/s/p 2:51:04 } +2024-07-25 22:19:54,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1147/ 1625], loss: 1.031, per_step_time: 1472ms, lr: 1.4462121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:54,057 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43332 samples/s/p 2:51:14 } +2024-07-25 22:19:57,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1149/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 1.4455908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:57,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43448 samples/s/p 2:51:09 } +2024-07-25 22:19:59,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1151/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 1.4449695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:59,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43497 samples/s/p 2:51:05 } +2024-07-25 22:20:02,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1153/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 1.4443482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:02,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43409 samples/s/p 2:51:04 } +2024-07-25 22:20:05,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1155/ 1625], loss: 1.054, per_step_time: 1474ms, lr: 1.443727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:05,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.42717 samples/s/p 2:51:14 } +2024-07-25 22:20:08,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1157/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 1.4431057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:08,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% 
|████████████████████████████ | 5.43880 samples/s/p 2:50:49 } +2024-07-25 22:20:11,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1159/ 1625], loss: 1.060, per_step_time: 1472ms, lr: 1.4424842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:11,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43329 samples/s/p 2:50:56 } +2024-07-25 22:20:14,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1161/ 1625], loss: 1.329, per_step_time: 1471ms, lr: 1.4418632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:14,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43671 samples/s/p 2:50:47 } +2024-07-25 22:20:17,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1163/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 1.441242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:17,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43648 samples/s/p 2:50:44 } +2024-07-25 22:20:20,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1165/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 1.4406206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:20,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43253 samples/s/p 2:50:49 } +2024-07-25 22:20:23,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1167/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 1.4399996e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:23,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43524 samples/s/p 2:50:41 } +2024-07-25 22:20:26,522 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1169/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 1.4393786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:26,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43384 samples/s/p 2:50:41 } +2024-07-25 22:20:29,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1171/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 1.4387574e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:29,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43869 samples/s/p 2:50:28 } +2024-07-25 22:20:32,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1173/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.4381362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:32,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43314 samples/s/p 2:50:36 } +2024-07-25 22:20:35,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1175/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 1.4375152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:35,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43207 samples/s/p 2:50:35 } +2024-07-25 22:20:38,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1177/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.4368942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:38,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43619 samples/s/p 2:50:24 } +2024-07-25 22:20:41,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1179/ 
1625], loss: 1.121, per_step_time: 1472ms, lr: 1.4362731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:41,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43312 samples/s/p 2:50:27 } +2024-07-25 22:20:44,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1181/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 1.435652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:44,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43574 samples/s/p 2:50:19 } +2024-07-25 22:20:47,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1183/ 1625], loss: 1.148, per_step_time: 1474ms, lr: 1.4350312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:47,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.42696 samples/s/p 2:50:33 } +2024-07-25 22:20:50,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1185/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 1.4344101e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:50,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43377 samples/s/p 2:50:17 } +2024-07-25 22:20:53,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1187/ 1625], loss: 1.237, per_step_time: 1475ms, lr: 1.4337891e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:53,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.42240 samples/s/p 2:50:36 } +2024-07-25 22:20:56,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1189/ 1625], loss: 1.042, per_step_time: 1471ms, lr: 1.4331683e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 22:20:56,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43686 samples/s/p 2:50:05 } +2024-07-25 22:20:58,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1191/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 1.4325473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:58,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43331 samples/s/p 2:50:09 } +2024-07-25 22:21:01,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1193/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.4319266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:01,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43739 samples/s/p 2:49:59 } +2024-07-25 22:21:04,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1195/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 1.4313056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:04,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43895 samples/s/p 2:49:53 } +2024-07-25 22:21:07,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1197/ 1625], loss: 1.136, per_step_time: 1474ms, lr: 1.43068455e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:07,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.42573 samples/s/p 2:50:15 } +2024-07-25 22:21:10,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1199/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.4300639e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:10,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 57.4% |████████████████████████████ | 5.43588 samples/s/p 2:49:53 } +2024-07-25 22:21:13,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1201/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 1.4294431e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:13,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43316 samples/s/p 2:49:55 } +2024-07-25 22:21:16,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1203/ 1625], loss: 0.930, per_step_time: 1471ms, lr: 1.4288221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:16,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43555 samples/s/p 2:49:47 } +2024-07-25 22:21:19,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1205/ 1625], loss: 1.274, per_step_time: 1471ms, lr: 1.4282015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:19,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43785 samples/s/p 2:49:40 } +2024-07-25 22:21:22,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1207/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 1.4275809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:22,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43355 samples/s/p 2:49:45 } +2024-07-25 22:21:25,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1209/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 1.42696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:25,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43233 samples/s/p 2:49:44 } +2024-07-25 22:21:28,507 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1211/ 1625], loss: 1.000, per_step_time: 1470ms, lr: 1.42633935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:28,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43954 samples/s/p 2:49:28 } +2024-07-25 22:21:31,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1213/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 1.4257189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:31,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43872 samples/s/p 2:49:27 } +2024-07-25 22:21:34,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1215/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 1.425098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:34,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43230 samples/s/p 2:49:36 } +2024-07-25 22:21:37,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1217/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 1.4244773e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:37,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43746 samples/s/p 2:49:23 } +2024-07-25 22:21:40,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1219/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.423857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:40,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43627 samples/s/p 2:49:22 } +2024-07-25 22:21:43,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1221/ 
1625], loss: 0.899, per_step_time: 1471ms, lr: 1.4232365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:43,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43777 samples/s/p 2:49:17 } +2024-07-25 22:21:46,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1223/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 1.4226158e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:46,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43241 samples/s/p 2:49:24 } +2024-07-25 22:21:49,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1225/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.4219952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:49,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43767 samples/s/p 2:49:11 } +2024-07-25 22:21:52,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1227/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.4213749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:52,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43218 samples/s/p 2:49:18 } +2024-07-25 22:21:55,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1229/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 1.4207542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:55,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.42961 samples/s/p 2:49:20 } +2024-07-25 22:21:58,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1231/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 1.4201337e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:21:58,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43787 samples/s/p 2:49:02 } +2024-07-25 22:22:00,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1233/ 1625], loss: 0.931, per_step_time: 1470ms, lr: 1.4195134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:00,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.44066 samples/s/p 2:48:54 } +2024-07-25 22:22:03,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1235/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 1.4188929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:03,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43370 samples/s/p 2:49:04 } +2024-07-25 22:22:06,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1237/ 1625], loss: 1.022, per_step_time: 1471ms, lr: 1.4182727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:06,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43834 samples/s/p 2:48:52 } +2024-07-25 22:22:09,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1239/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 1.4176523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:09,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43968 samples/s/p 2:48:47 } +2024-07-25 22:22:12,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1241/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 1.4170318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:12,764 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43713 samples/s/p 2:48:48 } +2024-07-25 22:22:15,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1243/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 1.4164116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:15,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43307 samples/s/p 2:48:53 } +2024-07-25 22:22:18,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1245/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 1.4157913e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:18,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43422 samples/s/p 2:48:48 } +2024-07-25 22:22:21,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1247/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 1.41517085e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:21,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43125 samples/s/p 2:48:51 } +2024-07-25 22:22:24,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1249/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 1.41455075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:24,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43779 samples/s/p 2:48:35 } +2024-07-25 22:22:27,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1251/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 1.4139307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:27,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% 
|████████████████████████████ | 5.43586 samples/s/p 2:48:36 } +2024-07-25 22:22:30,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1253/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 1.4133103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:30,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43217 samples/s/p 2:48:40 } +2024-07-25 22:22:33,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1255/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 1.4126901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:33,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43554 samples/s/p 2:48:31 } +2024-07-25 22:22:36,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1257/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 1.4120702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:36,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43283 samples/s/p 2:48:33 } +2024-07-25 22:22:39,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1259/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.4114499e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:39,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43408 samples/s/p 2:48:28 } +2024-07-25 22:22:42,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1261/ 1625], loss: 1.102, per_step_time: 1474ms, lr: 1.4108297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:42,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.42648 samples/s/p 2:48:39 } +2024-07-25 22:22:45,235 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1263/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.4102098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:45,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43375 samples/s/p 2:48:22 } +2024-07-25 22:22:48,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1265/ 1625], loss: 1.264, per_step_time: 1471ms, lr: 1.4095896e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:48,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43559 samples/s/p 2:48:16 } +2024-07-25 22:22:51,140 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1267/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 1.4089698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:51,140 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.42883 samples/s/p 2:48:26 } +2024-07-25 22:22:54,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1269/ 1625], loss: 1.280, per_step_time: 1470ms, lr: 1.4083497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:54,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.44138 samples/s/p 2:47:59 } +2024-07-25 22:22:57,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1271/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.40773e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:57,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43574 samples/s/p 2:48:07 } +2024-07-25 22:22:59,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1273/ 
1625], loss: 1.070, per_step_time: 1471ms, lr: 1.4071099e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:59,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43731 samples/s/p 2:48:01 } +2024-07-25 22:23:02,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1275/ 1625], loss: 1.249, per_step_time: 1470ms, lr: 1.40649e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:02,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43899 samples/s/p 2:47:55 } +2024-07-25 22:23:05,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1277/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 1.4058703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:05,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.43439 samples/s/p 2:48:00 } +2024-07-25 22:23:08,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1279/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 1.4052503e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:08,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.43959 samples/s/p 2:47:48 } +2024-07-25 22:23:11,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1281/ 1625], loss: 1.175, per_step_time: 1470ms, lr: 1.4046305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:11,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.43950 samples/s/p 2:47:45 } +2024-07-25 22:23:14,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1283/ 1625], loss: 1.002, per_step_time: 1469ms, lr: 1.4040107e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 22:23:14,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.44397 samples/s/p 2:47:34 } +2024-07-25 22:23:17,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1285/ 1625], loss: 1.079, per_step_time: 1470ms, lr: 1.4033908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:17,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.44126 samples/s/p 2:47:36 } +2024-07-25 22:23:20,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1287/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 1.4027712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:20,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.43778 samples/s/p 2:47:39 } +2024-07-25 22:23:23,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1289/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 1.4021515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:23,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.43132 samples/s/p 2:47:48 } +2024-07-25 22:23:26,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1291/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 1.4015315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:26,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.44212 samples/s/p 2:47:26 } +2024-07-25 22:23:29,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1293/ 1625], loss: 1.012, per_step_time: 1473ms, lr: 1.4009121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:29,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
58.0% |████████████████████████████ | 5.43038 samples/s/p 2:47:44 } +2024-07-25 22:23:32,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1295/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 1.4002926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:32,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.43641 samples/s/p 2:47:30 } +2024-07-25 22:23:35,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1297/ 1625], loss: 1.238, per_step_time: 1470ms, lr: 1.3996728e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:35,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.44041 samples/s/p 2:47:20 } +2024-07-25 22:23:38,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1299/ 1625], loss: 1.187, per_step_time: 1474ms, lr: 1.3990531e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:38,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.42451 samples/s/p 2:47:46 } +2024-07-25 22:23:41,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1301/ 1625], loss: 1.221, per_step_time: 1470ms, lr: 1.3984339e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:41,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.44034 samples/s/p 2:47:14 } +2024-07-25 22:23:44,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1303/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 1.39781405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:44,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.43945 samples/s/p 2:47:13 } +2024-07-25 
22:23:47,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1305/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.3971946e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:47,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.43256 samples/s/p 2:47:23 } +2024-07-25 22:23:50,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1307/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 1.3965752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:50,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.43631 samples/s/p 2:47:13 } +2024-07-25 22:23:53,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1309/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 1.3959557e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:53,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43499 samples/s/p 2:47:12 } +2024-07-25 22:23:56,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1311/ 1625], loss: 1.327, per_step_time: 1474ms, lr: 1.3953364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:56,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.42578 samples/s/p 2:47:26 } +2024-07-25 22:23:58,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1313/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 1.39471695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:58,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43712 samples/s/p 2:47:02 } +2024-07-25 22:24:01,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
6/ 10], step:[ 1315/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 1.3940975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:01,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.44052 samples/s/p 2:46:53 } +2024-07-25 22:24:04,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1317/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 1.3934783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:04,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43873 samples/s/p 2:46:54 } +2024-07-25 22:24:07,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1319/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 1.3928589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:07,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43751 samples/s/p 2:46:53 } +2024-07-25 22:24:10,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1321/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 1.3922399e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:10,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43531 samples/s/p 2:46:54 } +2024-07-25 22:24:13,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1323/ 1625], loss: 1.333, per_step_time: 1472ms, lr: 1.3916205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:13,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43177 samples/s/p 2:46:58 } +2024-07-25 22:24:16,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1325/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 1.3910014e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:16,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43471 samples/s/p 2:46:49 } +2024-07-25 22:24:19,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1327/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.3903823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:19,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43314 samples/s/p 2:46:49 } +2024-07-25 22:24:22,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1329/ 1625], loss: 1.335, per_step_time: 1470ms, lr: 1.3897629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:22,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.44138 samples/s/p 2:46:31 } +2024-07-25 22:24:25,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1331/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 1.3891439e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:25,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43567 samples/s/p 2:46:39 } +2024-07-25 22:24:28,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1333/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 1.3885248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:28,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43480 samples/s/p 2:46:37 } +2024-07-25 22:24:31,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1335/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 1.38790565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:31,446 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43916 samples/s/p 2:46:26 } +2024-07-25 22:24:34,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1337/ 1625], loss: 1.012, per_step_time: 1472ms, lr: 1.3872867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:34,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43309 samples/s/p 2:46:35 } +2024-07-25 22:24:37,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1339/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 1.3866679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:37,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43844 samples/s/p 2:46:22 } +2024-07-25 22:24:40,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1341/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 1.3860487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:40,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43319 samples/s/p 2:46:28 } +2024-07-25 22:24:43,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1343/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.3854297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:43,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43656 samples/s/p 2:46:19 } +2024-07-25 22:24:46,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1345/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 1.384811e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:46,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% 
|█████████████████████████████ | 5.43622 samples/s/p 2:46:17 } +2024-07-25 22:24:49,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1347/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 1.3841919e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:49,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43590 samples/s/p 2:46:15 } +2024-07-25 22:24:52,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1349/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 1.3835732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:52,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43192 samples/s/p 2:46:19 } +2024-07-25 22:24:55,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1351/ 1625], loss: 1.178, per_step_time: 1469ms, lr: 1.3829544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:55,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.44262 samples/s/p 2:45:56 } +2024-07-25 22:24:58,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1353/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 1.38233545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:58,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.42778 samples/s/p 2:46:21 } +2024-07-25 22:25:00,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1355/ 1625], loss: 0.868, per_step_time: 1471ms, lr: 1.3817168e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:00,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43783 samples/s/p 2:45:59 } +2024-07-25 22:25:03,906 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1357/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.3810981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:03,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43262 samples/s/p 2:46:06 } +2024-07-25 22:25:06,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1359/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 1.3804793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:06,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43760 samples/s/p 2:45:54 } +2024-07-25 22:25:09,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1361/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 1.3798607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:09,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43366 samples/s/p 2:45:58 } +2024-07-25 22:25:12,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1363/ 1625], loss: 1.025, per_step_time: 1470ms, lr: 1.3792423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:12,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43999 samples/s/p 2:45:44 } +2024-07-25 22:25:15,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1365/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 1.3786234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:15,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43791 samples/s/p 2:45:44 } +2024-07-25 22:25:18,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], 
step:[ 1367/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 1.3780049e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:18,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43631 samples/s/p 2:45:44 } +2024-07-25 22:25:21,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1369/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 1.3773865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:21,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43349 samples/s/p 2:45:47 } +2024-07-25 22:25:24,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1371/ 1625], loss: 1.344, per_step_time: 1472ms, lr: 1.376768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:24,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43421 samples/s/p 2:45:42 } +2024-07-25 22:25:27,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1373/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.3761493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:27,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43291 samples/s/p 2:45:42 } +2024-07-25 22:25:30,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1375/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 1.3755311e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:30,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43101 samples/s/p 2:45:42 } +2024-07-25 22:25:33,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1377/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 1.3749128e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:25:33,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43111 samples/s/p 2:45:39 } +2024-07-25 22:25:36,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1379/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 1.3742942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:36,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.42975 samples/s/p 2:45:39 } +2024-07-25 22:25:39,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1381/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 1.3736759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:39,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43615 samples/s/p 2:45:24 } +2024-07-25 22:25:42,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1383/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 1.3730578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:42,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43490 samples/s/p 2:45:24 } +2024-07-25 22:25:45,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1385/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 1.3724393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:45,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43462 samples/s/p 2:45:21 } +2024-07-25 22:25:48,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1387/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 1.371821e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:48,175 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43803 samples/s/p 2:45:12 } +2024-07-25 22:25:51,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1389/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.371203e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:51,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43832 samples/s/p 2:45:08 } +2024-07-25 22:25:54,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1391/ 1625], loss: 1.341, per_step_time: 1472ms, lr: 1.3705846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:54,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43412 samples/s/p 2:45:13 } +2024-07-25 22:25:57,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1393/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.3699666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:57,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43193 samples/s/p 2:45:14 } +2024-07-25 22:25:59,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1395/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.3693485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:59,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43246 samples/s/p 2:45:10 } +2024-07-25 22:26:02,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1397/ 1625], loss: 1.101, per_step_time: 1472ms, lr: 1.3687302e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:02,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% 
|█████████████████████████████ | 5.43393 samples/s/p 2:45:05 } +2024-07-25 22:26:05,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1399/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 1.3681123e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:05,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43507 samples/s/p 2:45:00 } +2024-07-25 22:26:08,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1401/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 1.3674943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:08,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43377 samples/s/p 2:44:59 } +2024-07-25 22:26:11,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1403/ 1625], loss: 1.364, per_step_time: 1473ms, lr: 1.366876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:11,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43059 samples/s/p 2:45:02 } +2024-07-25 22:26:14,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1405/ 1625], loss: 0.935, per_step_time: 1470ms, lr: 1.3662583e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:14,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43875 samples/s/p 2:44:44 } +2024-07-25 22:26:17,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1407/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 1.3656406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:17,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43549 samples/s/p 2:44:47 } +2024-07-25 22:26:20,639 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1409/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 1.3650226e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:20,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43439 samples/s/p 2:44:46 } +2024-07-25 22:26:23,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1411/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 1.3644046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:23,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43956 samples/s/p 2:44:34 } +2024-07-25 22:26:26,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1413/ 1625], loss: 1.189, per_step_time: 1474ms, lr: 1.363787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:26,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.42664 samples/s/p 2:44:54 } +2024-07-25 22:26:29,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1415/ 1625], loss: 1.102, per_step_time: 1475ms, lr: 1.363169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:29,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.42300 samples/s/p 2:44:58 } +2024-07-25 22:26:32,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1417/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.3625513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:32,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43730 samples/s/p 2:44:29 } +2024-07-25 22:26:35,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1419/ 1625], loss: 1.315, per_step_time: 1471ms, lr: 1.3619338e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:35,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43610 samples/s/p 2:44:28 } +2024-07-25 22:26:38,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1421/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 1.3613162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:38,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43699 samples/s/p 2:44:24 } +2024-07-25 22:26:41,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1423/ 1625], loss: 0.930, per_step_time: 1471ms, lr: 1.3606985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:41,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43693 samples/s/p 2:44:21 } +2024-07-25 22:26:44,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1425/ 1625], loss: 1.023, per_step_time: 1471ms, lr: 1.36008075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:44,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43813 samples/s/p 2:44:16 } +2024-07-25 22:26:47,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1427/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 1.3594635e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:47,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.44198 samples/s/p 2:44:06 } +2024-07-25 22:26:50,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1429/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.3588457e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:26:50,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43110 samples/s/p 2:44:23 } +2024-07-25 22:26:53,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1431/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 1.3582282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:53,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.42988 samples/s/p 2:44:22 } +2024-07-25 22:26:56,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1433/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.3576108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:56,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43594 samples/s/p 2:44:08 } +2024-07-25 22:26:59,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1435/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 1.3569933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:59,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43359 samples/s/p 2:44:09 } +2024-07-25 22:27:01,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1437/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 1.356376e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:01,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43551 samples/s/p 2:44:03 } +2024-07-25 22:27:04,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1439/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.35575865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:04,907 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43564 samples/s/p 2:44:00 } +2024-07-25 22:27:07,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1441/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 1.3551411e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:07,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43310 samples/s/p 2:44:01 } +2024-07-25 22:27:10,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1443/ 1625], loss: 1.201, per_step_time: 1474ms, lr: 1.3545241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:10,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.42524 samples/s/p 2:44:13 } +2024-07-25 22:27:13,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1445/ 1625], loss: 1.307, per_step_time: 1471ms, lr: 1.3539068e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:13,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43702 samples/s/p 2:43:48 } +2024-07-25 22:27:16,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1447/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.3532894e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:16,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43772 samples/s/p 2:43:44 } +2024-07-25 22:27:19,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1449/ 1625], loss: 1.323, per_step_time: 1474ms, lr: 1.3526724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:19,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% 
|█████████████████████████████ | 5.42411 samples/s/p 2:44:06 } +2024-07-25 22:27:22,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1451/ 1625], loss: 1.318, per_step_time: 1470ms, lr: 1.3520554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:22,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43852 samples/s/p 2:43:37 } +2024-07-25 22:27:25,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1453/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.3514381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:25,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43525 samples/s/p 2:43:40 } +2024-07-25 22:27:28,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1455/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.350821e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:28,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43354 samples/s/p 2:43:40 } +2024-07-25 22:27:31,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1457/ 1625], loss: 1.119, per_step_time: 1470ms, lr: 1.3502042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:31,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43915 samples/s/p 2:43:27 } +2024-07-25 22:27:34,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1459/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 1.349587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:34,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.42806 samples/s/p 2:43:44 } +2024-07-25 22:27:37,381 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1461/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 1.34897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:37,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.42895 samples/s/p 2:43:39 } +2024-07-25 22:27:40,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1463/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 1.3483533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:40,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43366 samples/s/p 2:43:28 } +2024-07-25 22:27:43,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1465/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 1.3477362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:43,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43753 samples/s/p 2:43:18 } +2024-07-25 22:27:46,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1467/ 1625], loss: 1.072, per_step_time: 1474ms, lr: 1.3471195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:46,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.42592 samples/s/p 2:43:36 } +2024-07-25 22:27:49,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1469/ 1625], loss: 1.321, per_step_time: 1472ms, lr: 1.3465027e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:49,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43111 samples/s/p 2:43:24 } +2024-07-25 22:27:52,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1471/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 1.3458862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:52,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.43566 samples/s/p 2:43:13 } +2024-07-25 22:27:55,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1473/ 1625], loss: 1.191, per_step_time: 1473ms, lr: 1.3452693e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:55,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.42858 samples/s/p 2:43:22 } +2024-07-25 22:27:58,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1475/ 1625], loss: 1.164, per_step_time: 1472ms, lr: 1.34465245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:58,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.43128 samples/s/p 2:43:15 } +2024-07-25 22:28:01,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1477/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 1.344036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:01,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.43044 samples/s/p 2:43:13 } +2024-07-25 22:28:03,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1479/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 1.3434192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:03,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.43562 samples/s/p 2:43:01 } +2024-07-25 22:28:06,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1481/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 1.3428028e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:28:06,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.43590 samples/s/p 2:42:57 } +2024-07-25 22:28:09,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1483/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 1.3421862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:09,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.43316 samples/s/p 2:42:59 } +2024-07-25 22:28:12,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1485/ 1625], loss: 1.308, per_step_time: 1474ms, lr: 1.3415694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:12,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.42733 samples/s/p 2:43:07 } +2024-07-25 22:28:15,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1487/ 1625], loss: 1.019, per_step_time: 1470ms, lr: 1.3409533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:15,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.44085 samples/s/p 2:42:40 } +2024-07-25 22:28:18,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1489/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.3403368e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:18,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43826 samples/s/p 2:42:41 } +2024-07-25 22:28:21,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1491/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 1.3397202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:21,661 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43241 samples/s/p 2:42:49 } +2024-07-25 22:28:24,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1493/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 1.3391041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:24,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43621 samples/s/p 2:42:39 } +2024-07-25 22:28:27,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1495/ 1625], loss: 1.274, per_step_time: 1470ms, lr: 1.3384878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:27,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.44080 samples/s/p 2:42:28 } +2024-07-25 22:28:30,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1497/ 1625], loss: 1.022, per_step_time: 1471ms, lr: 1.3378714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:30,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43564 samples/s/p 2:42:34 } +2024-07-25 22:28:33,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1499/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 1.33725525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:33,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.44038 samples/s/p 2:42:23 } +2024-07-25 22:28:36,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1501/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 1.3366392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:36,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% 
|█████████████████████████████ | 5.43765 samples/s/p 2:42:25 } +2024-07-25 22:28:39,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1503/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 1.3360228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:39,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43406 samples/s/p 2:42:28 } +2024-07-25 22:28:42,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1505/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.3354069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:42,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43719 samples/s/p 2:42:20 } +2024-07-25 22:28:45,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1507/ 1625], loss: 1.030, per_step_time: 1469ms, lr: 1.3347908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:45,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.44553 samples/s/p 2:42:02 } +2024-07-25 22:28:48,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1509/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 1.3341745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:48,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43483 samples/s/p 2:42:18 } +2024-07-25 22:28:51,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1511/ 1625], loss: 1.040, per_step_time: 1473ms, lr: 1.3335588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:51,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.42990 samples/s/p 2:42:24 } +2024-07-25 22:28:54,111 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1513/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.3329428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:54,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43139 samples/s/p 2:42:18 } +2024-07-25 22:28:57,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1515/ 1625], loss: 1.112, per_step_time: 1470ms, lr: 1.3323266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:57,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.44036 samples/s/p 2:41:59 } +2024-07-25 22:29:00,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1517/ 1625], loss: 1.049, per_step_time: 1470ms, lr: 1.331711e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:00,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43860 samples/s/p 2:42:00 } +2024-07-25 22:29:02,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1519/ 1625], loss: 0.962, per_step_time: 1471ms, lr: 1.3310952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:02,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43834 samples/s/p 2:41:57 } +2024-07-25 22:29:05,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1521/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 1.3304794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:05,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43466 samples/s/p 2:42:01 } +2024-07-25 22:29:08,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1523/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 1.3298636e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:08,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.44106 samples/s/p 2:41:46 } +2024-07-25 22:29:11,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1525/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.329248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:11,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43161 samples/s/p 2:42:00 } +2024-07-25 22:29:14,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1527/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.3286323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:14,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43216 samples/s/p 2:41:56 } +2024-07-25 22:29:17,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1529/ 1625], loss: 1.232, per_step_time: 1470ms, lr: 1.3280165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:17,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.44013 samples/s/p 2:41:39 } +2024-07-25 22:29:20,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1531/ 1625], loss: 1.082, per_step_time: 1473ms, lr: 1.3274011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:20,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43059 samples/s/p 2:41:53 } +2024-07-25 22:29:23,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1533/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 1.3267857e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:29:23,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43467 samples/s/p 2:41:43 } +2024-07-25 22:29:26,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1535/ 1625], loss: 1.312, per_step_time: 1473ms, lr: 1.32617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:26,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43080 samples/s/p 2:41:47 } +2024-07-25 22:29:29,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1537/ 1625], loss: 1.220, per_step_time: 1473ms, lr: 1.3255545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:29,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.42960 samples/s/p 2:41:46 } +2024-07-25 22:29:32,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1539/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.3249392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:32,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43316 samples/s/p 2:41:37 } +2024-07-25 22:29:35,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1541/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 1.3243237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:35,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43667 samples/s/p 2:41:28 } +2024-07-25 22:29:38,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1543/ 1625], loss: 1.092, per_step_time: 1470ms, lr: 1.3237083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:38,372 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.44060 samples/s/p 2:41:18 } +2024-07-25 22:29:41,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1545/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.32309315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:41,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43379 samples/s/p 2:41:27 } +2024-07-25 22:29:44,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1547/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 1.3224778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:44,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43199 samples/s/p 2:41:27 } +2024-07-25 22:29:47,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1549/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.3218627e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:47,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43258 samples/s/p 2:41:23 } +2024-07-25 22:29:50,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1551/ 1625], loss: 1.002, per_step_time: 1472ms, lr: 1.3212475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:50,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43453 samples/s/p 2:41:17 } +2024-07-25 22:29:53,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1553/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 1.3206322e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:53,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% 
|█████████████████████████████ | 5.43576 samples/s/p 2:41:12 } +2024-07-25 22:29:56,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1555/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 1.3200172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:56,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.43541 samples/s/p 2:41:09 } +2024-07-25 22:29:59,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1557/ 1625], loss: 1.169, per_step_time: 1472ms, lr: 1.3194022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:59,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.43206 samples/s/p 2:41:12 } +2024-07-25 22:30:01,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1559/ 1625], loss: 1.376, per_step_time: 1474ms, lr: 1.31878705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:01,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.42644 samples/s/p 2:41:20 } +2024-07-25 22:30:04,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1561/ 1625], loss: 1.270, per_step_time: 1473ms, lr: 1.3181722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:04,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.42932 samples/s/p 2:41:11 } +2024-07-25 22:30:07,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1563/ 1625], loss: 1.315, per_step_time: 1470ms, lr: 1.3175575e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:07,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.43869 samples/s/p 2:40:52 } +2024-07-25 22:30:10,847 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1565/ 1625], loss: 1.237, per_step_time: 1474ms, lr: 1.3169424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:10,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.42714 samples/s/p 2:41:09 } +2024-07-25 22:30:13,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1567/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 1.3163276e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:13,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.43078 samples/s/p 2:41:00 } +2024-07-25 22:30:16,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1569/ 1625], loss: 0.974, per_step_time: 1472ms, lr: 1.315713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:16,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43136 samples/s/p 2:40:56 } +2024-07-25 22:30:19,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1571/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 1.3150981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:19,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.44014 samples/s/p 2:40:37 } +2024-07-25 22:30:22,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1573/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 1.3144833e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:22,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43534 samples/s/p 2:40:43 } +2024-07-25 22:30:25,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1575/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.3138689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:25,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43619 samples/s/p 2:40:39 } +2024-07-25 22:30:28,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1577/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 1.3132543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:28,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43470 samples/s/p 2:40:38 } +2024-07-25 22:30:31,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1579/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.3126396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:31,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43590 samples/s/p 2:40:33 } +2024-07-25 22:30:34,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1581/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.31202505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:34,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43168 samples/s/p 2:40:38 } +2024-07-25 22:30:37,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1583/ 1625], loss: 1.098, per_step_time: 1473ms, lr: 1.3114108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:37,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.42853 samples/s/p 2:40:40 } +2024-07-25 22:30:40,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1585/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 1.3107961e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:30:40,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43522 samples/s/p 2:40:26 } +2024-07-25 22:30:43,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1587/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 1.3101817e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:43,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43434 samples/s/p 2:40:24 } +2024-07-25 22:30:46,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1589/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 1.3095676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:46,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43930 samples/s/p 2:40:13 } +2024-07-25 22:30:49,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1591/ 1625], loss: 1.035, per_step_time: 1472ms, lr: 1.30895305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:49,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43447 samples/s/p 2:40:18 } +2024-07-25 22:30:52,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1593/ 1625], loss: 1.059, per_step_time: 1475ms, lr: 1.3083389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:52,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.42262 samples/s/p 2:40:36 } +2024-07-25 22:30:55,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1595/ 1625], loss: 1.291, per_step_time: 1472ms, lr: 1.3077247e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:55,124 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43308 samples/s/p 2:40:15 } +2024-07-25 22:30:58,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1597/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 1.3071103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:58,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43440 samples/s/p 2:40:09 } +2024-07-25 22:31:01,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1599/ 1625], loss: 1.297, per_step_time: 1473ms, lr: 1.3064964e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:01,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43085 samples/s/p 2:40:13 } +2024-07-25 22:31:03,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1601/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 1.3058823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:03,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43305 samples/s/p 2:40:06 } +2024-07-25 22:31:06,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1603/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 1.30526805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:06,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.44005 samples/s/p 2:39:51 } +2024-07-25 22:31:09,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1605/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.3046542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:09,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% 
|█████████████████████████████ | 5.43294 samples/s/p 2:40:00 } +2024-07-25 22:31:12,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1607/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 1.3040404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:12,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43377 samples/s/p 2:39:56 } +2024-07-25 22:31:15,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1609/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 1.3034263e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:15,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43240 samples/s/p 2:39:55 } +2024-07-25 22:31:18,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1611/ 1625], loss: 1.346, per_step_time: 1472ms, lr: 1.3028125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:18,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43411 samples/s/p 2:39:49 } +2024-07-25 22:31:21,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1613/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 1.3021988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:21,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43360 samples/s/p 2:39:47 } +2024-07-25 22:31:24,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1615/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 1.301585e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:24,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43754 samples/s/p 2:39:37 } +2024-07-25 22:31:27,584 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1617/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 1.3009712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:27,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.44036 samples/s/p 2:39:29 } +2024-07-25 22:31:30,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1619/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 1.3003577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:30,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.42941 samples/s/p 2:39:46 } +2024-07-25 22:31:33,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1621/ 1625], loss: 1.197, per_step_time: 1473ms, lr: 1.2997442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:33,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.43044 samples/s/p 2:39:41 } +2024-07-25 22:31:36,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1623/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 1.2991304e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:36,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.43749 samples/s/p 2:39:26 } +2024-07-25 22:31:39,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1625/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 1.2985169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:39,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.43116 samples/s/p 2:39:34 } +2024-07-25 22:31:42,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
2/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 1.2979036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:42,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.43685 samples/s/p 2:39:21 } +2024-07-25 22:31:45,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 4/ 1625], loss: 1.063, per_step_time: 1470ms, lr: 1.29729e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:45,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.43943 samples/s/p 2:39:13 } +2024-07-25 22:31:48,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 6/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 1.2966765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:48,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.43586 samples/s/p 2:39:17 } +2024-07-25 22:31:51,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 8/ 1625], loss: 1.054, per_step_time: 1470ms, lr: 1.2960634e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:51,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.44022 samples/s/p 2:39:06 } +2024-07-25 22:31:54,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 10/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 1.2954499e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:54,140 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43912 samples/s/p 2:39:05 } +2024-07-25 22:31:57,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 12/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 1.2948367e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 22:31:57,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43959 samples/s/p 2:39:01 } +2024-07-25 22:32:00,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 14/ 1625], loss: 1.305, per_step_time: 1469ms, lr: 1.2942235e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:00,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.44315 samples/s/p 2:38:52 } +2024-07-25 22:32:02,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 16/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 1.2936102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:02,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43449 samples/s/p 2:39:04 } +2024-07-25 22:32:05,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 18/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 1.2929972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:05,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43865 samples/s/p 2:38:54 } +2024-07-25 22:32:08,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 20/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 1.29238415e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:08,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43606 samples/s/p 2:38:56 } +2024-07-25 22:32:11,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 22/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 1.2917709e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:11,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 60.1% |██████████████████████████████ | 5.43241 samples/s/p 2:38:59 } +2024-07-25 22:32:14,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 24/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 1.29115815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:14,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43349 samples/s/p 2:38:54 } +2024-07-25 22:32:17,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 26/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 1.2905453e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:17,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43441 samples/s/p 2:38:50 } +2024-07-25 22:32:20,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 28/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 1.2899323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:20,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43704 samples/s/p 2:38:42 } +2024-07-25 22:32:23,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 30/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.2893195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:23,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43446 samples/s/p 2:38:44 } +2024-07-25 22:32:26,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 32/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.2887069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:26,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43475 samples/s/p 2:38:40 } +2024-07-25 
22:32:29,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 34/ 1625], loss: 1.296, per_step_time: 1473ms, lr: 1.288094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:29,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43051 samples/s/p 2:38:45 } +2024-07-25 22:32:32,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 36/ 1625], loss: 0.999, per_step_time: 1472ms, lr: 1.28748125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:32,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43425 samples/s/p 2:38:35 } +2024-07-25 22:32:35,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 38/ 1625], loss: 1.306, per_step_time: 1473ms, lr: 1.2868688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:35,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.42941 samples/s/p 2:38:41 } +2024-07-25 22:32:38,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 40/ 1625], loss: 1.321, per_step_time: 1470ms, lr: 1.286256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:38,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43896 samples/s/p 2:38:21 } +2024-07-25 22:32:41,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 42/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 1.2856436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:41,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43339 samples/s/p 2:38:28 } +2024-07-25 22:32:44,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 
10], step:[ 44/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.2850312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:44,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43552 samples/s/p 2:38:21 } +2024-07-25 22:32:47,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 46/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.2844189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:47,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43771 samples/s/p 2:38:15 } +2024-07-25 22:32:50,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 48/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 1.2838063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:50,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43486 samples/s/p 2:38:17 } +2024-07-25 22:32:53,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 50/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 1.2831941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:53,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.42900 samples/s/p 2:38:24 } +2024-07-25 22:32:53,156 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 22:33:28,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 52/ 1625], loss: 1.058, per_step_time: 2853ms, lr: 1.2825818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:28,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 2.80377 samples/s/p 5:06:38 } +2024-07-25 22:33:31,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 54/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.2819694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:31,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43310 samples/s/p 2:38:11 } +2024-07-25 22:33:34,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 56/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 1.2813573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:34,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.42975 samples/s/p 2:38:14 } +2024-07-25 22:33:37,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 58/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 1.2807452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:37,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43178 samples/s/p 2:38:07 } +2024-07-25 22:33:40,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 60/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 1.280133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:40,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43783 samples/s/p 2:37:54 } +2024-07-25 22:33:43,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 62/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 1.2795211e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:43,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43137 samples/s/p 2:38:02 } +2024-07-25 22:33:46,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 64/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 1.2789093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:46,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43800 samples/s/p 2:37:48 } +2024-07-25 22:33:49,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 66/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 1.2782971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:49,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43418 samples/s/p 2:37:51 } +2024-07-25 22:33:52,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 68/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.2776852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:52,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43122 samples/s/p 2:37:54 } +2024-07-25 22:33:55,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 70/ 1625], loss: 1.314, per_step_time: 1471ms, lr: 1.2770735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:55,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43542 samples/s/p 2:37:43 } +2024-07-25 22:33:58,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 72/ 1625], loss: 1.026, per_step_time: 1469ms, lr: 1.2764615e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:58,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.44393 samples/s/p 2:37:26 } +2024-07-25 22:34:01,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 74/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 1.2758497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:01,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43717 samples/s/p 2:37:34 } +2024-07-25 22:34:04,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 76/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 1.2752383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:04,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43636 samples/s/p 2:37:33 } +2024-07-25 22:34:07,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 78/ 1625], loss: 1.090, per_step_time: 1473ms, lr: 1.27462645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:07,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.42785 samples/s/p 2:37:45 } +2024-07-25 22:34:10,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 80/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.274015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:10,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43719 samples/s/p 2:37:26 } +2024-07-25 22:34:13,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 82/ 1625], loss: 1.343, per_step_time: 1470ms, lr: 1.27340345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:13,207 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43866 samples/s/p 2:37:20 } +2024-07-25 22:34:16,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 84/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 1.2727917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:16,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43351 samples/s/p 2:37:26 } +2024-07-25 22:34:19,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 86/ 1625], loss: 1.037, per_step_time: 1470ms, lr: 1.27218045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:19,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.44132 samples/s/p 2:37:10 } +2024-07-25 22:34:22,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 88/ 1625], loss: 1.059, per_step_time: 1472ms, lr: 1.2715691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:22,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43456 samples/s/p 2:37:18 } +2024-07-25 22:34:25,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 90/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.27095755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:25,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43273 samples/s/p 2:37:19 } +2024-07-25 22:34:27,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 92/ 1625], loss: 0.967, per_step_time: 1471ms, lr: 1.2703464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:27,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% 
|██████████████████████████████ | 5.43684 samples/s/p 2:37:09 } +2024-07-25 22:34:30,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 94/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 1.2697354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:30,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43667 samples/s/p 2:37:06 } +2024-07-25 22:34:33,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 96/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.2691242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:33,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43264 samples/s/p 2:37:10 } +2024-07-25 22:34:36,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 98/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 1.2685128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:37,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43448 samples/s/p 2:37:04 } +2024-07-25 22:34:40,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 100/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 1.2679019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:40,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43840 samples/s/p 2:36:54 } +2024-07-25 22:34:43,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 102/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 1.2672909e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:43,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43279 samples/s/p 2:37:01 } +2024-07-25 22:34:46,165 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 104/ 1625], loss: 0.993, per_step_time: 1470ms, lr: 1.2666797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:46,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.44085 samples/s/p 2:36:44 } +2024-07-25 22:34:49,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 106/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 1.266069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:49,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43420 samples/s/p 2:36:52 } +2024-07-25 22:34:52,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 108/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 1.2654583e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:52,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43310 samples/s/p 2:36:51 } +2024-07-25 22:34:55,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 110/ 1625], loss: 1.074, per_step_time: 1470ms, lr: 1.2648473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:55,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43866 samples/s/p 2:36:39 } +2024-07-25 22:34:57,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 112/ 1625], loss: 1.006, per_step_time: 1472ms, lr: 1.2642366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:57,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43161 samples/s/p 2:36:48 } +2024-07-25 22:35:00,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
114/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 1.263626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:00,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43318 samples/s/p 2:36:42 } +2024-07-25 22:35:03,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 116/ 1625], loss: 1.261, per_step_time: 1470ms, lr: 1.2630152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:03,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43954 samples/s/p 2:36:29 } +2024-07-25 22:35:06,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 118/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 1.2624045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:06,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43367 samples/s/p 2:36:36 } +2024-07-25 22:35:09,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 120/ 1625], loss: 1.198, per_step_time: 1473ms, lr: 1.2617941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:09,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.42836 samples/s/p 2:36:42 } +2024-07-25 22:35:12,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 122/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 1.2611835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:12,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43508 samples/s/p 2:36:27 } +2024-07-25 22:35:15,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 124/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 1.2605732e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:35:15,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43250 samples/s/p 2:36:29 } +2024-07-25 22:35:18,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 126/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 1.2599628e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:18,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43712 samples/s/p 2:36:18 } +2024-07-25 22:35:21,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 128/ 1625], loss: 0.983, per_step_time: 1471ms, lr: 1.2593522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:21,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43537 samples/s/p 2:36:18 } +2024-07-25 22:35:24,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 130/ 1625], loss: 0.971, per_step_time: 1470ms, lr: 1.2587421e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:24,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.44030 samples/s/p 2:36:07 } +2024-07-25 22:35:27,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 132/ 1625], loss: 1.032, per_step_time: 1471ms, lr: 1.25813185e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:27,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43672 samples/s/p 2:36:10 } +2024-07-25 22:35:30,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 134/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 1.2575216e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:30,427 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43576 samples/s/p 2:36:09 } +2024-07-25 22:35:33,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 136/ 1625], loss: 0.975, per_step_time: 1472ms, lr: 1.2569116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:33,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43446 samples/s/p 2:36:08 } +2024-07-25 22:35:36,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 138/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.2563017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:36,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43110 samples/s/p 2:36:11 } +2024-07-25 22:35:39,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 140/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 1.2556915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:39,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43651 samples/s/p 2:35:58 } +2024-07-25 22:35:42,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 142/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 1.2550816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:42,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43915 samples/s/p 2:35:51 } +2024-07-25 22:35:45,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 144/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 1.2544717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:45,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% 
|██████████████████████████████ | 5.43408 samples/s/p 2:35:57 } +2024-07-25 22:35:48,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 146/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 1.2538619e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:48,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43496 samples/s/p 2:35:52 } +2024-07-25 22:35:51,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 148/ 1625], loss: 1.145, per_step_time: 1470ms, lr: 1.2532519e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:51,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43957 samples/s/p 2:35:41 } +2024-07-25 22:35:54,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 150/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 1.2526423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:54,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43150 samples/s/p 2:35:52 } +2024-07-25 22:35:56,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 152/ 1625], loss: 1.047, per_step_time: 1471ms, lr: 1.2520328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:56,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43558 samples/s/p 2:35:42 } +2024-07-25 22:35:59,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 154/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 1.2514231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:59,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43367 samples/s/p 2:35:43 } +2024-07-25 22:36:02,887 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 156/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 1.2508134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:02,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43536 samples/s/p 2:35:37 } +2024-07-25 22:36:05,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 158/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 1.2502041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:05,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43309 samples/s/p 2:35:38 } +2024-07-25 22:36:08,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 160/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.2495944e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:08,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43432 samples/s/p 2:35:33 } +2024-07-25 22:36:11,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 162/ 1625], loss: 1.198, per_step_time: 1470ms, lr: 1.248985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:11,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43976 samples/s/p 2:35:20 } +2024-07-25 22:36:14,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 164/ 1625], loss: 1.026, per_step_time: 1473ms, lr: 1.2483758e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:14,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.42793 samples/s/p 2:35:38 } +2024-07-25 22:36:17,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
166/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 1.2477663e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:17,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43279 samples/s/p 2:35:27 } +2024-07-25 22:36:20,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 168/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.24715725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:20,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43249 samples/s/p 2:35:24 } +2024-07-25 22:36:23,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 170/ 1625], loss: 1.299, per_step_time: 1474ms, lr: 1.2465481e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:23,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.42680 samples/s/p 2:35:31 } +2024-07-25 22:36:26,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 172/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 1.2459387e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:26,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43196 samples/s/p 2:35:19 } +2024-07-25 22:36:29,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 174/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 1.2453298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:29,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43482 samples/s/p 2:35:11 } +2024-07-25 22:36:32,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 176/ 1625], loss: 1.009, per_step_time: 1472ms, lr: 1.2447208e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:36:32,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43172 samples/s/p 2:35:14 } +2024-07-25 22:36:35,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 178/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 1.2441116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:35,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.42911 samples/s/p 2:35:15 } +2024-07-25 22:36:38,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 180/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 1.2435029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:38,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43740 samples/s/p 2:34:58 } +2024-07-25 22:36:41,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 182/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.2428942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:41,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43334 samples/s/p 2:35:02 } +2024-07-25 22:36:44,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 184/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 1.2422852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:44,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43574 samples/s/p 2:34:55 } +2024-07-25 22:36:47,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 186/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 1.24167655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:47,165 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43676 samples/s/p 2:34:50 } +2024-07-25 22:36:50,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 188/ 1625], loss: 1.239, per_step_time: 1470ms, lr: 1.241068e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:50,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43962 samples/s/p 2:34:42 } +2024-07-25 22:36:53,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 190/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 1.2404592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:53,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43246 samples/s/p 2:34:52 } +2024-07-25 22:36:56,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 192/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.23985055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:56,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43144 samples/s/p 2:34:51 } +2024-07-25 22:36:58,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 194/ 1625], loss: 1.022, per_step_time: 1470ms, lr: 1.2392423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:58,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.44096 samples/s/p 2:34:31 } +2024-07-25 22:37:01,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 196/ 1625], loss: 0.987, per_step_time: 1471ms, lr: 1.2386339e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:01,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% 
|██████████████████████████████ | 5.43666 samples/s/p 2:34:36 } +2024-07-25 22:37:04,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 198/ 1625], loss: 1.417, per_step_time: 1473ms, lr: 1.2380254e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:04,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43022 samples/s/p 2:34:44 } +2024-07-25 22:37:07,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 200/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 1.237417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:07,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43720 samples/s/p 2:34:29 } +2024-07-25 22:37:10,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 202/ 1625], loss: 1.109, per_step_time: 1470ms, lr: 1.2368088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:10,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43938 samples/s/p 2:34:22 } +2024-07-25 22:37:13,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 204/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 1.2362005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:13,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.43222 samples/s/p 2:34:32 } +2024-07-25 22:37:16,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 206/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 1.2355923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:16,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.43642 samples/s/p 2:34:21 } +2024-07-25 22:37:19,620 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 208/ 1625], loss: 1.164, per_step_time: 1470ms, lr: 1.2349844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:19,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.44038 samples/s/p 2:34:12 } +2024-07-25 22:37:22,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 210/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 1.2343762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:22,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.43412 samples/s/p 2:34:20 } +2024-07-25 22:37:25,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 212/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.2337684e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:25,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.43524 samples/s/p 2:34:15 } +2024-07-25 22:37:28,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 214/ 1625], loss: 1.160, per_step_time: 1474ms, lr: 1.2331604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:28,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.42596 samples/s/p 2:34:28 } +2024-07-25 22:37:31,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 216/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 1.2325523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:31,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.42942 samples/s/p 2:34:19 } +2024-07-25 22:37:34,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
218/ 1625], loss: 1.169, per_step_time: 1473ms, lr: 1.2319448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:34,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.42747 samples/s/p 2:34:19 } +2024-07-25 22:37:37,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 220/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 1.2313371e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:37,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43530 samples/s/p 2:34:03 } +2024-07-25 22:37:40,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 222/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 1.2307292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:40,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.42846 samples/s/p 2:34:11 } +2024-07-25 22:37:43,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 224/ 1625], loss: 0.964, per_step_time: 1483ms, lr: 1.2301216e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:43,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.39246 samples/s/p 2:35:10 } +2024-07-25 22:37:46,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 226/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 1.22951415e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:46,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43488 samples/s/p 2:33:55 } +2024-07-25 22:37:49,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 228/ 1625], loss: 1.149, per_step_time: 1469ms, lr: 1.2289065e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:37:49,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.44257 samples/s/p 2:33:39 } +2024-07-25 22:37:52,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 230/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 1.2282991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:52,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43655 samples/s/p 2:33:46 } +2024-07-25 22:37:55,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 232/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 1.2276918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:55,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43774 samples/s/p 2:33:41 } +2024-07-25 22:37:58,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 234/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 1.2270843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:58,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43239 samples/s/p 2:33:47 } +2024-07-25 22:38:00,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 236/ 1625], loss: 1.137, per_step_time: 1470ms, lr: 1.2264772e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:00,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.44166 samples/s/p 2:33:28 } +2024-07-25 22:38:03,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 238/ 1625], loss: 1.280, per_step_time: 1472ms, lr: 1.2258699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:03,915 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43289 samples/s/p 2:33:40 } +2024-07-25 22:38:06,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 240/ 1625], loss: 1.173, per_step_time: 1473ms, lr: 1.2252626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:06,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43095 samples/s/p 2:33:41 } +2024-07-25 22:38:09,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 242/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 1.2246556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:09,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43791 samples/s/p 2:33:26 } +2024-07-25 22:38:12,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 244/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 1.2240485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:12,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43610 samples/s/p 2:33:26 } +2024-07-25 22:38:15,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 246/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 1.2234417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:15,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43189 samples/s/p 2:33:30 } +2024-07-25 22:38:18,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 248/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.2228347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:18,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% 
|██████████████████████████████ | 5.43727 samples/s/p 2:33:18 } +2024-07-25 22:38:21,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 250/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 1.222228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:21,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43672 samples/s/p 2:33:16 } +2024-07-25 22:38:24,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 252/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 1.2216211e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:24,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43266 samples/s/p 2:33:20 } +2024-07-25 22:38:27,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 254/ 1625], loss: 1.171, per_step_time: 1485ms, lr: 1.2210142e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:27,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.38609 samples/s/p 2:34:37 } +2024-07-25 22:38:30,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 256/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 1.22040765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:30,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43849 samples/s/p 2:33:04 } +2024-07-25 22:38:33,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 258/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 1.2198011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:33,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43333 samples/s/p 2:33:10 } +2024-07-25 22:38:36,401 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 260/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 1.2191943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:36,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43812 samples/s/p 2:32:59 } +2024-07-25 22:38:39,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 262/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 1.218588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:39,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43168 samples/s/p 2:33:07 } +2024-07-25 22:38:42,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 264/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.21798175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:42,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43630 samples/s/p 2:32:56 } +2024-07-25 22:38:45,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 266/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 1.2173752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:45,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43091 samples/s/p 2:33:02 } +2024-07-25 22:38:48,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 268/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 1.2167689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:48,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43808 samples/s/p 2:32:47 } +2024-07-25 22:38:51,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], 
step:[ 270/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 1.2161628e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:51,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.44166 samples/s/p 2:32:38 } +2024-07-25 22:38:54,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 272/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.2155563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:54,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43632 samples/s/p 2:32:45 } +2024-07-25 22:38:57,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 274/ 1625], loss: 1.170, per_step_time: 1473ms, lr: 1.2149503e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:57,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43016 samples/s/p 2:32:52 } +2024-07-25 22:39:00,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 276/ 1625], loss: 1.289, per_step_time: 1471ms, lr: 1.2143444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:00,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43847 samples/s/p 2:32:35 } +2024-07-25 22:39:02,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 278/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.2137382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:02,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43645 samples/s/p 2:32:35 } +2024-07-25 22:39:05,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 280/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.2131324e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:39:05,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43671 samples/s/p 2:32:32 } +2024-07-25 22:39:08,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 282/ 1625], loss: 0.942, per_step_time: 1471ms, lr: 1.2125265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:08,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43584 samples/s/p 2:32:31 } +2024-07-25 22:39:11,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 284/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 1.2119205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:11,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43517 samples/s/p 2:32:29 } +2024-07-25 22:39:14,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 286/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 1.2113149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:14,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.42926 samples/s/p 2:32:36 } +2024-07-25 22:39:17,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 288/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 1.2107092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:17,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.43187 samples/s/p 2:32:28 } +2024-07-25 22:39:20,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 290/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 1.2101034e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:20,667 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.43232 samples/s/p 2:32:25 } +2024-07-25 22:39:23,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 292/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 1.209498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:23,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.43409 samples/s/p 2:32:19 } +2024-07-25 22:39:26,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 294/ 1625], loss: 1.100, per_step_time: 1473ms, lr: 1.2088927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:26,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.42745 samples/s/p 2:32:27 } +2024-07-25 22:39:29,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 296/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.2082872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:29,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.43536 samples/s/p 2:32:11 } +2024-07-25 22:39:32,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 298/ 1625], loss: 1.039, per_step_time: 1472ms, lr: 1.2076816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:32,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.43238 samples/s/p 2:32:13 } +2024-07-25 22:39:35,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 300/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 1.20707655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:35,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% 
|██████████████████████████████ | 5.43730 samples/s/p 2:32:02 } +2024-07-25 22:39:38,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 302/ 1625], loss: 1.079, per_step_time: 1471ms, lr: 1.2064713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:38,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.43541 samples/s/p 2:32:02 } +2024-07-25 22:39:41,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 304/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.2058658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:41,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.43731 samples/s/p 2:31:56 } +2024-07-25 22:39:44,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 306/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 1.2052609e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:44,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.43413 samples/s/p 2:31:58 } +2024-07-25 22:39:47,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 308/ 1625], loss: 1.281, per_step_time: 1473ms, lr: 1.204656e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:47,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.42962 samples/s/p 2:32:03 } +2024-07-25 22:39:50,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 310/ 1625], loss: 1.238, per_step_time: 1469ms, lr: 1.2040508e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:50,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.44279 samples/s/p 2:31:38 } +2024-07-25 22:39:53,129 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 312/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 1.2034459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:53,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.43532 samples/s/p 2:31:47 } +2024-07-25 22:39:56,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 314/ 1625], loss: 1.315, per_step_time: 1470ms, lr: 1.2028412e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:56,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.44019 samples/s/p 2:31:36 } +2024-07-25 22:39:59,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 316/ 1625], loss: 1.227, per_step_time: 1473ms, lr: 1.2022362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:59,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.42923 samples/s/p 2:31:52 } +2024-07-25 22:40:01,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 318/ 1625], loss: 0.986, per_step_time: 1471ms, lr: 1.2016315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:01,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.43692 samples/s/p 2:31:36 } +2024-07-25 22:40:04,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 320/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 1.20102695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:04,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.43821 samples/s/p 2:31:31 } +2024-07-25 22:40:07,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
322/ 1625], loss: 1.316, per_step_time: 1473ms, lr: 1.2004221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:07,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.43060 samples/s/p 2:31:41 } +2024-07-25 22:40:10,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 324/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 1.1998178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:10,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.43172 samples/s/p 2:31:36 } +2024-07-25 22:40:13,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 326/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 1.1992133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:13,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.43766 samples/s/p 2:31:23 } +2024-07-25 22:40:16,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 328/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 1.1986087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:16,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.43428 samples/s/p 2:31:26 } +2024-07-25 22:40:19,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 330/ 1625], loss: 1.036, per_step_time: 1472ms, lr: 1.1980044e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:19,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.43214 samples/s/p 2:31:26 } +2024-07-25 22:40:22,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 332/ 1625], loss: 1.238, per_step_time: 1473ms, lr: 1.1974002e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:40:22,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.42764 samples/s/p 2:31:31 } +2024-07-25 22:40:25,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 334/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.1967958e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:25,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43301 samples/s/p 2:31:19 } +2024-07-25 22:40:28,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 336/ 1625], loss: 1.379, per_step_time: 1472ms, lr: 1.1961917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:28,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43355 samples/s/p 2:31:15 } +2024-07-25 22:40:31,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 338/ 1625], loss: 0.951, per_step_time: 1471ms, lr: 1.1955879e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:31,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43636 samples/s/p 2:31:07 } +2024-07-25 22:40:34,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 340/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.1949837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:34,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43440 samples/s/p 2:31:08 } +2024-07-25 22:40:37,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 342/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 1.1943797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:37,400 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43518 samples/s/p 2:31:03 } +2024-07-25 22:40:40,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 344/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 1.1937759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:40,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43284 samples/s/p 2:31:04 } +2024-07-25 22:40:43,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 346/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 1.1931721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:43,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43120 samples/s/p 2:31:04 } +2024-07-25 22:40:46,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 348/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.1925681e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:46,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43623 samples/s/p 2:30:53 } +2024-07-25 22:40:49,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 350/ 1625], loss: 1.044, per_step_time: 1473ms, lr: 1.1919647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:49,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.42794 samples/s/p 2:31:04 } +2024-07-25 22:40:52,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 352/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 1.1913612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:52,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% 
|███████████████████████████████ | 5.43299 samples/s/p 2:30:52 } +2024-07-25 22:40:55,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 354/ 1625], loss: 1.036, per_step_time: 1472ms, lr: 1.1907574e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:55,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43356 samples/s/p 2:30:48 } +2024-07-25 22:40:58,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 356/ 1625], loss: 1.104, per_step_time: 1469ms, lr: 1.1901539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:58,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.44416 samples/s/p 2:30:28 } +2024-07-25 22:41:01,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 358/ 1625], loss: 1.109, per_step_time: 1473ms, lr: 1.1895506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:01,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43084 samples/s/p 2:30:47 } +2024-07-25 22:41:03,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 360/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 1.1889471e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:03,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43672 samples/s/p 2:30:34 } +2024-07-25 22:41:06,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 362/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 1.1883438e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:06,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43600 samples/s/p 2:30:33 } +2024-07-25 
22:41:09,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 364/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 1.1877407e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:09,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43144 samples/s/p 2:30:37 } +2024-07-25 22:41:12,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 366/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 1.1871373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:12,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43503 samples/s/p 2:30:28 } +2024-07-25 22:41:15,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 368/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 1.1865344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:15,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43452 samples/s/p 2:30:26 } +2024-07-25 22:41:18,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 370/ 1625], loss: 1.003, per_step_time: 1472ms, lr: 1.1859313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:18,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43346 samples/s/p 2:30:25 } +2024-07-25 22:41:21,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 372/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 1.1853283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:21,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43835 samples/s/p 2:30:14 } +2024-07-25 22:41:24,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 374/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 1.1847255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:24,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43214 samples/s/p 2:30:21 } +2024-07-25 22:41:27,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 376/ 1625], loss: 0.970, per_step_time: 1472ms, lr: 1.1841228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:27,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43202 samples/s/p 2:30:19 } +2024-07-25 22:41:30,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 378/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 1.1835199e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:30,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43097 samples/s/p 2:30:17 } +2024-07-25 22:41:33,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 380/ 1625], loss: 1.070, per_step_time: 1473ms, lr: 1.1829171e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:33,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.42931 samples/s/p 2:30:17 } +2024-07-25 22:41:36,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 382/ 1625], loss: 1.006, per_step_time: 1471ms, lr: 1.1823147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:36,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43733 samples/s/p 2:30:01 } +2024-07-25 22:41:39,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 384/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 
1.181712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:39,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43905 samples/s/p 2:29:55 } +2024-07-25 22:41:42,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 386/ 1625], loss: 1.296, per_step_time: 1471ms, lr: 1.1811094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:42,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43584 samples/s/p 2:29:58 } +2024-07-25 22:41:45,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 388/ 1625], loss: 1.060, per_step_time: 1468ms, lr: 1.1805072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:45,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.44621 samples/s/p 2:29:37 } +2024-07-25 22:41:48,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 390/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 1.1799047e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:48,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43405 samples/s/p 2:29:55 } +2024-07-25 22:41:51,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 392/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 1.1793026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:51,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43561 samples/s/p 2:29:49 } +2024-07-25 22:41:54,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 394/ 1625], loss: 1.350, per_step_time: 1471ms, lr: 1.1787003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:54,126 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43513 samples/s/p 2:29:47 } +2024-07-25 22:41:57,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 396/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 1.1780983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:57,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43394 samples/s/p 2:29:46 } +2024-07-25 22:42:00,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 398/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.1774961e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:00,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43174 samples/s/p 2:29:47 } +2024-07-25 22:42:02,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 400/ 1625], loss: 1.342, per_step_time: 1473ms, lr: 1.1768941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:02,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43109 samples/s/p 2:29:45 } +2024-07-25 22:42:05,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 402/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 1.17629215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:05,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43646 samples/s/p 2:29:33 } +2024-07-25 22:42:08,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 404/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.17569025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:08,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% 
|███████████████████████████████ | 5.43503 samples/s/p 2:29:32 } +2024-07-25 22:42:11,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 406/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 1.1750886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:11,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43278 samples/s/p 2:29:33 } +2024-07-25 22:42:14,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 408/ 1625], loss: 1.109, per_step_time: 1469ms, lr: 1.1744868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:14,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.44238 samples/s/p 2:29:14 } +2024-07-25 22:42:17,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 410/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 1.173885e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:17,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.44061 samples/s/p 2:29:14 } +2024-07-25 22:42:20,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 412/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 1.17328345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:20,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43297 samples/s/p 2:29:24 } +2024-07-25 22:42:23,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 414/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.1726819e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:23,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43353 samples/s/p 2:29:20 } +2024-07-25 
22:42:26,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 416/ 1625], loss: 1.134, per_step_time: 1482ms, lr: 1.1720804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:26,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.39613 samples/s/p 2:30:19 } +2024-07-25 22:42:29,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 418/ 1625], loss: 1.040, per_step_time: 1471ms, lr: 1.1714791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:29,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.43649 samples/s/p 2:29:09 } +2024-07-25 22:42:32,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 420/ 1625], loss: 1.119, per_step_time: 1474ms, lr: 1.1708779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:32,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.42723 samples/s/p 2:29:22 } +2024-07-25 22:42:35,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 422/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 1.1702766e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:35,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.43160 samples/s/p 2:29:12 } +2024-07-25 22:42:38,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 424/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 1.1696753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:38,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.43611 samples/s/p 2:29:01 } +2024-07-25 22:42:41,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 426/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.1690743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:41,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.43419 samples/s/p 2:29:01 } +2024-07-25 22:42:44,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 428/ 1625], loss: 1.312, per_step_time: 1477ms, lr: 1.1684731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:44,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.41608 samples/s/p 2:29:28 } +2024-07-25 22:42:47,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 430/ 1625], loss: 1.188, per_step_time: 1470ms, lr: 1.1678721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:47,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.43940 samples/s/p 2:28:47 } +2024-07-25 22:42:50,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 432/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 1.1672715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:50,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43445 samples/s/p 2:28:52 } +2024-07-25 22:42:53,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 434/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.1666704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:53,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43339 samples/s/p 2:28:51 } +2024-07-25 22:42:56,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 436/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 
1.1660698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:56,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43367 samples/s/p 2:28:48 } +2024-07-25 22:42:59,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 438/ 1625], loss: 1.297, per_step_time: 1472ms, lr: 1.1654692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:59,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43429 samples/s/p 2:28:44 } +2024-07-25 22:43:02,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 440/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 1.16486835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:02,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43762 samples/s/p 2:28:35 } +2024-07-25 22:43:04,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 442/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.164268e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:04,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43807 samples/s/p 2:28:31 } +2024-07-25 22:43:07,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 444/ 1625], loss: 0.998, per_step_time: 1471ms, lr: 1.1636675e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:07,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43482 samples/s/p 2:28:34 } +2024-07-25 22:43:10,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 446/ 1625], loss: 1.330, per_step_time: 1472ms, lr: 1.1630674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:10,881 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43413 samples/s/p 2:28:32 } +2024-07-25 22:43:13,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 448/ 1625], loss: 1.176, per_step_time: 1472ms, lr: 1.1624667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:13,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43206 samples/s/p 2:28:33 } +2024-07-25 22:43:16,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 450/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 1.1618667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:16,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43353 samples/s/p 2:28:27 } +2024-07-25 22:43:19,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 452/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 1.1612665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:19,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43466 samples/s/p 2:28:22 } +2024-07-25 22:43:22,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 454/ 1625], loss: 1.051, per_step_time: 1470ms, lr: 1.1606662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:22,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.44002 samples/s/p 2:28:11 } +2024-07-25 22:43:25,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 456/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 1.1600662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:25,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% 
|███████████████████████████████ | 5.44087 samples/s/p 2:28:06 } +2024-07-25 22:43:28,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 458/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 1.1594662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:28,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43235 samples/s/p 2:28:17 } +2024-07-25 22:43:31,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 460/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.1588663e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:31,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43733 samples/s/p 2:28:06 } +2024-07-25 22:43:34,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 462/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 1.1582666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:34,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43794 samples/s/p 2:28:02 } +2024-07-25 22:43:37,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 464/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 1.157667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:37,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.44049 samples/s/p 2:27:55 } +2024-07-25 22:43:40,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 466/ 1625], loss: 1.144, per_step_time: 1470ms, lr: 1.1570671e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:40,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.44160 samples/s/p 2:27:50 } +2024-07-25 
22:43:43,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 468/ 1625], loss: 1.305, per_step_time: 1474ms, lr: 1.1564674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:43,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.42536 samples/s/p 2:28:14 } +2024-07-25 22:43:46,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 470/ 1625], loss: 1.021, per_step_time: 1469ms, lr: 1.1558682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:46,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.44247 samples/s/p 2:27:43 } +2024-07-25 22:43:49,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 472/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.15526855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:49,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.43254 samples/s/p 2:27:56 } +2024-07-25 22:43:52,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 474/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.1546691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:52,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.43557 samples/s/p 2:27:48 } +2024-07-25 22:43:55,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 476/ 1625], loss: 1.129, per_step_time: 1473ms, lr: 1.1540699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:55,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.42939 samples/s/p 2:27:56 } +2024-07-25 22:43:58,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 478/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 1.1534705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:58,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.43750 samples/s/p 2:27:39 } +2024-07-25 22:44:01,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 480/ 1625], loss: 1.042, per_step_time: 1471ms, lr: 1.1528715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:01,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43502 samples/s/p 2:27:41 } +2024-07-25 22:44:03,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 482/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 1.1522724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:03,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43789 samples/s/p 2:27:33 } +2024-07-25 22:44:06,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 484/ 1625], loss: 1.166, per_step_time: 1470ms, lr: 1.1516731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:06,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43946 samples/s/p 2:27:27 } +2024-07-25 22:44:09,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 486/ 1625], loss: 1.041, per_step_time: 1472ms, lr: 1.1510744e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:09,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43402 samples/s/p 2:27:33 } +2024-07-25 22:44:12,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 488/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 
1.1504755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:12,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43917 samples/s/p 2:27:22 } +2024-07-25 22:44:15,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 490/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.1498765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:15,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43409 samples/s/p 2:27:27 } +2024-07-25 22:44:18,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 492/ 1625], loss: 1.266, per_step_time: 1473ms, lr: 1.149278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:18,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.42898 samples/s/p 2:27:33 } +2024-07-25 22:44:21,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 494/ 1625], loss: 1.193, per_step_time: 1473ms, lr: 1.1486794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:21,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43061 samples/s/p 2:27:27 } +2024-07-25 22:44:24,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 496/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 1.1480808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:24,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.43424 samples/s/p 2:27:18 } +2024-07-25 22:44:27,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 498/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 1.1474822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:27,601 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.42925 samples/s/p 2:27:23 } +2024-07-25 22:44:30,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 500/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 1.1468839e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:30,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.42939 samples/s/p 2:27:20 } +2024-07-25 22:44:33,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 502/ 1625], loss: 1.107, per_step_time: 1473ms, lr: 1.1462855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:33,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.42854 samples/s/p 2:27:19 } +2024-07-25 22:44:36,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 504/ 1625], loss: 1.083, per_step_time: 1485ms, lr: 1.1456871e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:36,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.38671 samples/s/p 2:28:24 } +2024-07-25 22:44:39,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 506/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 1.145089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:39,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.43971 samples/s/p 2:26:55 } +2024-07-25 22:44:42,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 508/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 1.144491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:42,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% 
|███████████████████████████████ | 5.42918 samples/s/p 2:27:09 } +2024-07-25 22:44:45,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 510/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 1.1438929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:45,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.43249 samples/s/p 2:27:01 } +2024-07-25 22:44:48,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 512/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 1.1432948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:48,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43679 samples/s/p 2:26:51 } +2024-07-25 22:44:51,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 514/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 1.1426971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:51,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43405 samples/s/p 2:26:52 } +2024-07-25 22:44:54,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 516/ 1625], loss: 1.334, per_step_time: 1470ms, lr: 1.142099e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:54,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.44125 samples/s/p 2:26:37 } +2024-07-25 22:44:57,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 518/ 1625], loss: 1.101, per_step_time: 1469ms, lr: 1.14150125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:57,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.44300 samples/s/p 2:26:32 } +2024-07-25 
22:45:00,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 520/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 1.1409037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:00,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43484 samples/s/p 2:26:42 } +2024-07-25 22:45:03,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 522/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 1.140306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:03,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43882 samples/s/p 2:26:33 } +2024-07-25 22:45:05,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 524/ 1625], loss: 1.221, per_step_time: 1470ms, lr: 1.1397086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:05,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43851 samples/s/p 2:26:30 } +2024-07-25 22:45:08,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 526/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 1.1391111e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:08,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43462 samples/s/p 2:26:33 } +2024-07-25 22:45:11,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 528/ 1625], loss: 1.398, per_step_time: 1471ms, lr: 1.1385136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:11,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43660 samples/s/p 2:26:27 } +2024-07-25 22:45:14,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 530/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 1.1379165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:14,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.44035 samples/s/p 2:26:18 } +2024-07-25 22:45:17,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 532/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 1.1373192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:17,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.44076 samples/s/p 2:26:15 } +2024-07-25 22:45:20,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 534/ 1625], loss: 1.329, per_step_time: 1472ms, lr: 1.136722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:20,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.43430 samples/s/p 2:26:22 } +2024-07-25 22:45:23,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 536/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.136125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:23,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.43323 samples/s/p 2:26:21 } +2024-07-25 22:45:26,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 538/ 1625], loss: 1.158, per_step_time: 1474ms, lr: 1.13552815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:26,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.42690 samples/s/p 2:26:28 } +2024-07-25 22:45:29,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 540/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 
1.134931e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:29,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.43154 samples/s/p 2:26:18 } +2024-07-25 22:45:32,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 542/ 1625], loss: 1.105, per_step_time: 1469ms, lr: 1.1343341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:32,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.44229 samples/s/p 2:25:58 } +2024-07-25 22:45:35,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 544/ 1625], loss: 1.318, per_step_time: 1472ms, lr: 1.1337375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:35,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.43182 samples/s/p 2:26:12 } +2024-07-25 22:45:38,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 546/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.1331409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:38,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43174 samples/s/p 2:26:09 } +2024-07-25 22:45:41,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 548/ 1625], loss: 1.302, per_step_time: 1471ms, lr: 1.1325442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:41,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43668 samples/s/p 2:25:58 } +2024-07-25 22:45:44,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 550/ 1625], loss: 1.204, per_step_time: 1473ms, lr: 1.13194765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:44,348 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43101 samples/s/p 2:26:04 } +2024-07-25 22:45:47,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 552/ 1625], loss: 1.062, per_step_time: 1470ms, lr: 1.1313513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:47,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43872 samples/s/p 2:25:49 } +2024-07-25 22:45:50,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 554/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 1.13075475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:50,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43503 samples/s/p 2:25:52 } +2024-07-25 22:45:53,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 556/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 1.1301585e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:53,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43665 samples/s/p 2:25:46 } +2024-07-25 22:45:56,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 558/ 1625], loss: 1.312, per_step_time: 1473ms, lr: 1.1295624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:56,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.42999 samples/s/p 2:25:54 } +2024-07-25 22:45:59,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 560/ 1625], loss: 1.206, per_step_time: 1472ms, lr: 1.1289661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:59,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% 
|███████████████████████████████ | 5.43403 samples/s/p 2:25:44 } +2024-07-25 22:46:02,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 562/ 1625], loss: 1.105, per_step_time: 1470ms, lr: 1.12837015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:02,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.44161 samples/s/p 2:25:29 } +2024-07-25 22:46:05,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 564/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 1.1277741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:05,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43266 samples/s/p 2:25:41 } +2024-07-25 22:46:07,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 566/ 1625], loss: 1.033, per_step_time: 1472ms, lr: 1.127178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:07,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43360 samples/s/p 2:25:36 } +2024-07-25 22:46:10,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 568/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 1.1265823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:10,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43801 samples/s/p 2:25:26 } +2024-07-25 22:46:13,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 570/ 1625], loss: 1.018, per_step_time: 1471ms, lr: 1.1259866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:13,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43698 samples/s/p 2:25:25 } +2024-07-25 
22:46:16,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 572/ 1625], loss: 1.291, per_step_time: 1472ms, lr: 1.1253907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:16,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43462 samples/s/p 2:25:26 } +2024-07-25 22:46:19,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 574/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 1.1247953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:19,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43746 samples/s/p 2:25:18 } +2024-07-25 22:46:22,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 576/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 1.1241998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:22,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43673 samples/s/p 2:25:17 } +2024-07-25 22:46:25,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 578/ 1625], loss: 1.229, per_step_time: 1474ms, lr: 1.1236043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:25,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.42707 samples/s/p 2:25:29 } +2024-07-25 22:46:28,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 580/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.1230089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:28,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43434 samples/s/p 2:25:14 } +2024-07-25 22:46:31,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 582/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 1.1224138e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:31,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.42843 samples/s/p 2:25:21 } +2024-07-25 22:46:34,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 584/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.1218183e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:34,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43382 samples/s/p 2:25:09 } +2024-07-25 22:46:37,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 586/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 1.12122325e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:37,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43200 samples/s/p 2:25:09 } +2024-07-25 22:46:40,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 588/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.12062835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:40,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43738 samples/s/p 2:24:58 } +2024-07-25 22:46:43,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 590/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 1.1200332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:43,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43045 samples/s/p 2:25:06 } +2024-07-25 22:46:46,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 592/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 
1.1194385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:46,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43496 samples/s/p 2:24:56 } +2024-07-25 22:46:49,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 594/ 1625], loss: 0.902, per_step_time: 1469ms, lr: 1.11884365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:49,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.44555 samples/s/p 2:24:36 } +2024-07-25 22:46:52,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 596/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 1.118249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:52,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.43467 samples/s/p 2:24:50 } +2024-07-25 22:46:55,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 598/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 1.1176542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:55,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.43904 samples/s/p 2:24:40 } +2024-07-25 22:46:58,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 600/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 1.1170596e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:58,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.43034 samples/s/p 2:24:51 } +2024-07-25 22:47:01,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 602/ 1625], loss: 1.317, per_step_time: 1474ms, lr: 1.1164652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:01,074 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.42593 samples/s/p 2:24:56 } +2024-07-25 22:47:04,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 604/ 1625], loss: 1.273, per_step_time: 1473ms, lr: 1.1158707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:04,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.42933 samples/s/p 2:24:47 } +2024-07-25 22:47:06,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 606/ 1625], loss: 1.083, per_step_time: 1470ms, lr: 1.1152764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:06,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.44108 samples/s/p 2:24:25 } +2024-07-25 22:47:09,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 608/ 1625], loss: 1.287, per_step_time: 1470ms, lr: 1.1146822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:09,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.44129 samples/s/p 2:24:22 } +2024-07-25 22:47:12,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 610/ 1625], loss: 1.255, per_step_time: 1473ms, lr: 1.1140879e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:12,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43060 samples/s/p 2:24:36 } +2024-07-25 22:47:15,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 612/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.1134939e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:15,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% 
|███████████████████████████████ | 5.43652 samples/s/p 2:24:24 } +2024-07-25 22:47:18,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 614/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 1.1128999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:18,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43625 samples/s/p 2:24:21 } +2024-07-25 22:47:21,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 616/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.1123058e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:21,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43260 samples/s/p 2:24:24 } +2024-07-25 22:47:24,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 618/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.111712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:24,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43319 samples/s/p 2:24:20 } +2024-07-25 22:47:27,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 620/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 1.1111185e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:27,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43292 samples/s/p 2:24:18 } +2024-07-25 22:47:30,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 622/ 1625], loss: 1.071, per_step_time: 1470ms, lr: 1.1105246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:30,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43896 samples/s/p 2:24:05 } +2024-07-25 
22:47:33,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 624/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 1.109931e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:33,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43584 samples/s/p 2:24:07 } +2024-07-25 22:47:36,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 626/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 1.1093375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:36,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43158 samples/s/p 2:24:11 } +2024-07-25 22:47:39,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 628/ 1625], loss: 1.138, per_step_time: 1473ms, lr: 1.108744e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:39,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43074 samples/s/p 2:24:10 } +2024-07-25 22:47:42,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 630/ 1625], loss: 0.976, per_step_time: 1469ms, lr: 1.1081505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:42,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.44363 samples/s/p 2:23:46 } +2024-07-25 22:47:45,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 632/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 1.10755755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:45,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43562 samples/s/p 2:23:56 } +2024-07-25 22:47:48,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 634/ 1625], loss: 1.039, per_step_time: 1472ms, lr: 1.1069641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:48,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43444 samples/s/p 2:23:55 } +2024-07-25 22:47:51,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 636/ 1625], loss: 1.036, per_step_time: 1471ms, lr: 1.1063711e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:51,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43609 samples/s/p 2:23:49 } +2024-07-25 22:47:54,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 638/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.105778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:54,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43946 samples/s/p 2:23:41 } +2024-07-25 22:47:57,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 640/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 1.10518495e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:57,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43512 samples/s/p 2:23:45 } +2024-07-25 22:48:00,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 642/ 1625], loss: 1.280, per_step_time: 1472ms, lr: 1.1045922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:00,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.43240 samples/s/p 2:23:46 } +2024-07-25 22:48:03,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 644/ 1625], loss: 1.153, per_step_time: 1482ms, lr: 
1.1039994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:03,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.39498 samples/s/p 2:24:43 } +2024-07-25 22:48:06,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 646/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 1.1034069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:06,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.43514 samples/s/p 2:23:36 } +2024-07-25 22:48:08,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 648/ 1625], loss: 1.085, per_step_time: 1469ms, lr: 1.1028141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:08,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.44445 samples/s/p 2:23:18 } +2024-07-25 22:48:11,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 650/ 1625], loss: 1.193, per_step_time: 1471ms, lr: 1.1022217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:11,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43697 samples/s/p 2:23:27 } +2024-07-25 22:48:14,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 652/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 1.1016292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:14,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43210 samples/s/p 2:23:32 } +2024-07-25 22:48:17,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 654/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 1.10103665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:17,812 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43072 samples/s/p 2:23:31 } +2024-07-25 22:48:20,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 656/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 1.1004445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:20,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43800 samples/s/p 2:23:17 } +2024-07-25 22:48:23,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 658/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.0998522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:23,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43261 samples/s/p 2:23:22 } +2024-07-25 22:48:26,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 660/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 1.09926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:26,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43348 samples/s/p 2:23:18 } +2024-07-25 22:48:29,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 662/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 1.098668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:29,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43668 samples/s/p 2:23:10 } +2024-07-25 22:48:32,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 664/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 1.0980762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:32,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% 
|████████████████████████████████ | 5.43464 samples/s/p 2:23:10 } +2024-07-25 22:48:35,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 666/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 1.0974843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:35,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43378 samples/s/p 2:23:09 } +2024-07-25 22:48:38,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 668/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.0968924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:38,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43671 samples/s/p 2:23:01 } +2024-07-25 22:48:41,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 670/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 1.0963008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:41,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.44105 samples/s/p 2:22:51 } +2024-07-25 22:48:44,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 672/ 1625], loss: 1.151, per_step_time: 1473ms, lr: 1.095709e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:44,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.42965 samples/s/p 2:23:06 } +2024-07-25 22:48:47,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 674/ 1625], loss: 1.031, per_step_time: 1472ms, lr: 1.0951174e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:47,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43447 samples/s/p 2:22:56 } +2024-07-25 
22:48:50,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 676/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 1.0945262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:50,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43463 samples/s/p 2:22:53 } +2024-07-25 22:48:53,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 678/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.0939346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:53,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43711 samples/s/p 2:22:46 } +2024-07-25 22:48:56,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 680/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 1.0933434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:56,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43318 samples/s/p 2:22:49 } +2024-07-25 22:48:59,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 682/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 1.0927522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:59,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43019 samples/s/p 2:22:51 } +2024-07-25 22:49:02,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 684/ 1625], loss: 1.053, per_step_time: 1472ms, lr: 1.0921609e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:02,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43472 samples/s/p 2:22:41 } +2024-07-25 22:49:05,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 7/ 10], step:[ 686/ 1625], loss: 1.262, per_step_time: 1473ms, lr: 1.0915701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:05,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43070 samples/s/p 2:22:44 } +2024-07-25 22:49:07,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 688/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.0909791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:07,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43278 samples/s/p 2:22:38 } +2024-07-25 22:49:10,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 690/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.0903882e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:10,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43637 samples/s/p 2:22:29 } +2024-07-25 22:49:13,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 692/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 1.0897974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:13,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43876 samples/s/p 2:22:23 } +2024-07-25 22:49:16,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 694/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.08920685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:16,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43564 samples/s/p 2:22:25 } +2024-07-25 22:49:19,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 696/ 1625], loss: 1.368, per_step_time: 1472ms, lr: 
1.088616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:19,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43394 samples/s/p 2:22:24 } +2024-07-25 22:49:22,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 698/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 1.0880255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:22,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43526 samples/s/p 2:22:19 } +2024-07-25 22:49:25,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 700/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 1.0874353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:25,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43510 samples/s/p 2:22:17 } +2024-07-25 22:49:28,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 702/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 1.086845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:28,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43239 samples/s/p 2:22:18 } +2024-07-25 22:49:31,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 704/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.0862545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:31,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43409 samples/s/p 2:22:12 } +2024-07-25 22:49:34,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 706/ 1625], loss: 1.132, per_step_time: 1473ms, lr: 1.0856644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:34,539 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43062 samples/s/p 2:22:15 } +2024-07-25 22:49:37,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 708/ 1625], loss: 1.209, per_step_time: 1473ms, lr: 1.0850745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:37,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.42869 samples/s/p 2:22:15 } +2024-07-25 22:49:40,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 710/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 1.0844842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:40,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.43779 samples/s/p 2:21:58 } +2024-07-25 22:49:43,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 712/ 1625], loss: 1.160, per_step_time: 1470ms, lr: 1.0838942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:43,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.43995 samples/s/p 2:21:51 } +2024-07-25 22:49:46,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 714/ 1625], loss: 1.252, per_step_time: 1473ms, lr: 1.0833046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:46,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.42781 samples/s/p 2:22:07 } +2024-07-25 22:49:49,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 716/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 1.0827147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:49,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% 
|████████████████████████████████ | 5.43499 samples/s/p 2:21:53 } +2024-07-25 22:49:52,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 718/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 1.0821252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:52,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.43742 samples/s/p 2:21:46 } +2024-07-25 22:49:55,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 720/ 1625], loss: 1.165, per_step_time: 1469ms, lr: 1.08153545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:55,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.44468 samples/s/p 2:21:32 } +2024-07-25 22:49:58,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 722/ 1625], loss: 1.249, per_step_time: 1470ms, lr: 1.0809458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:58,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.43859 samples/s/p 2:21:39 } +2024-07-25 22:50:01,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 724/ 1625], loss: 1.125, per_step_time: 1473ms, lr: 1.0803566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:01,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43100 samples/s/p 2:21:48 } +2024-07-25 22:50:04,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 726/ 1625], loss: 0.949, per_step_time: 1472ms, lr: 1.0797673e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:04,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43286 samples/s/p 2:21:42 } +2024-07-25 
22:50:06,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 728/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 1.0791779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:06,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43419 samples/s/p 2:21:37 } +2024-07-25 22:50:09,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 730/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.0785889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:09,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43832 samples/s/p 2:21:27 } +2024-07-25 22:50:12,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 732/ 1625], loss: 1.101, per_step_time: 1474ms, lr: 1.0779999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:12,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.42552 samples/s/p 2:21:44 } +2024-07-25 22:50:15,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 734/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.0774107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:15,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.44028 samples/s/p 2:21:18 } +2024-07-25 22:50:18,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 736/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 1.0768219e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:18,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43107 samples/s/p 2:21:30 } +2024-07-25 22:50:21,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 7/ 10], step:[ 738/ 1625], loss: 1.001, per_step_time: 1470ms, lr: 1.0762332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:21,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.44049 samples/s/p 2:21:12 } +2024-07-25 22:50:24,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 740/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.0756443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:24,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43707 samples/s/p 2:21:15 } +2024-07-25 22:50:27,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 742/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 1.0750557e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:27,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43082 samples/s/p 2:21:21 } +2024-07-25 22:50:30,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 744/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 1.0744673e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:30,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43672 samples/s/p 2:21:09 } +2024-07-25 22:50:33,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 746/ 1625], loss: 1.217, per_step_time: 1473ms, lr: 1.0738787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:33,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.42868 samples/s/p 2:21:19 } +2024-07-25 22:50:36,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 748/ 1625], loss: 1.258, per_step_time: 1471ms, lr: 
1.0732904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:36,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43527 samples/s/p 2:21:06 } +2024-07-25 22:50:39,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 750/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.0727022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:39,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43615 samples/s/p 2:21:01 } +2024-07-25 22:50:42,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 752/ 1625], loss: 1.028, per_step_time: 1472ms, lr: 1.0721141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:42,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43332 samples/s/p 2:21:03 } +2024-07-25 22:50:45,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 754/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 1.0715258e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:45,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43554 samples/s/p 2:20:56 } +2024-07-25 22:50:48,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 756/ 1625], loss: 0.860, per_step_time: 1470ms, lr: 1.0709378e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:48,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.43915 samples/s/p 2:20:48 } +2024-07-25 22:50:51,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 758/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 1.07035e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:51,270 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.42802 samples/s/p 2:21:02 } +2024-07-25 22:50:54,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 760/ 1625], loss: 1.199, per_step_time: 1469ms, lr: 1.069762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:54,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.44276 samples/s/p 2:20:36 } +2024-07-25 22:50:57,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 762/ 1625], loss: 1.022, per_step_time: 1473ms, lr: 1.0691743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:57,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.43036 samples/s/p 2:20:53 } +2024-07-25 22:51:00,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 764/ 1625], loss: 1.092, per_step_time: 1473ms, lr: 1.0685868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:00,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.43025 samples/s/p 2:20:50 } +2024-07-25 22:51:03,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 766/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 1.067999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:03,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.43231 samples/s/p 2:20:44 } +2024-07-25 22:51:06,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 768/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 1.0674116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:06,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% 
|████████████████████████████████ | 5.43077 samples/s/p 2:20:43 } +2024-07-25 22:51:08,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 770/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 1.0668243e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:08,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.43192 samples/s/p 2:20:39 } +2024-07-25 22:51:11,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 772/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 1.0662368e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:11,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43721 samples/s/p 2:20:27 } +2024-07-25 22:51:14,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 774/ 1625], loss: 1.005, per_step_time: 1472ms, lr: 1.0656497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:14,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43268 samples/s/p 2:20:31 } +2024-07-25 22:51:17,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 776/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 1.0650628e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:17,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43211 samples/s/p 2:20:29 } +2024-07-25 22:51:20,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 778/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.0644755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:20,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43730 samples/s/p 2:20:18 } +2024-07-25 
22:51:23,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 780/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 1.0638886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:23,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43062 samples/s/p 2:20:26 } +2024-07-25 22:51:26,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 782/ 1625], loss: 0.979, per_step_time: 1471ms, lr: 1.0633018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:26,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43524 samples/s/p 2:20:16 } +2024-07-25 22:51:29,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 784/ 1625], loss: 1.250, per_step_time: 1473ms, lr: 1.062715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:29,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43065 samples/s/p 2:20:20 } +2024-07-25 22:51:32,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 786/ 1625], loss: 1.246, per_step_time: 1473ms, lr: 1.0621283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:32,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43080 samples/s/p 2:20:17 } +2024-07-25 22:51:35,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 788/ 1625], loss: 1.092, per_step_time: 1473ms, lr: 1.0615418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:35,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.42934 samples/s/p 2:20:16 } +2024-07-25 22:51:38,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 790/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 1.0609552e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:38,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43500 samples/s/p 2:20:04 } +2024-07-25 22:51:41,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 792/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 1.0603689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:41,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43691 samples/s/p 2:19:58 } +2024-07-25 22:51:44,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 794/ 1625], loss: 1.330, per_step_time: 1472ms, lr: 1.0597825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:44,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43127 samples/s/p 2:20:04 } +2024-07-25 22:51:47,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 796/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.0591963e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:47,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43203 samples/s/p 2:20:00 } +2024-07-25 22:51:50,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 798/ 1625], loss: 1.408, per_step_time: 1472ms, lr: 1.0586102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:50,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43326 samples/s/p 2:19:55 } +2024-07-25 22:51:53,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 800/ 1625], loss: 0.949, per_step_time: 1471ms, lr: 
1.0580241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:53,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43694 samples/s/p 2:19:47 } +2024-07-25 22:51:56,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 802/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 1.0574383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:56,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43322 samples/s/p 2:19:49 } +2024-07-25 22:51:59,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 804/ 1625], loss: 1.417, per_step_time: 1471ms, lr: 1.0568523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:59,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43754 samples/s/p 2:19:40 } +2024-07-25 22:52:02,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 806/ 1625], loss: 1.361, per_step_time: 1472ms, lr: 1.0562667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:02,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43141 samples/s/p 2:19:46 } +2024-07-25 22:52:05,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 808/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.055681e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:05,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43404 samples/s/p 2:19:39 } +2024-07-25 22:52:08,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 810/ 1625], loss: 0.900, per_step_time: 1470ms, lr: 1.05509525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:08,012 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43973 samples/s/p 2:19:28 } +2024-07-25 22:52:10,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 812/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 1.0545098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:10,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43558 samples/s/p 2:19:31 } +2024-07-25 22:52:13,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 814/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 1.0539245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:13,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43245 samples/s/p 2:19:33 } +2024-07-25 22:52:16,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 816/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 1.0533389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:16,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43676 samples/s/p 2:19:23 } +2024-07-25 22:52:19,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 818/ 1625], loss: 1.343, per_step_time: 1472ms, lr: 1.05275385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:19,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43391 samples/s/p 2:19:25 } +2024-07-25 22:52:22,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 820/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 1.0521689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:22,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% 
|████████████████████████████████ | 5.43810 samples/s/p 2:19:15 } +2024-07-25 22:52:25,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 822/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.0515838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:25,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43485 samples/s/p 2:19:17 } +2024-07-25 22:52:28,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 824/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 1.0509987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:28,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43383 samples/s/p 2:19:16 } +2024-07-25 22:52:31,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 826/ 1625], loss: 1.294, per_step_time: 1474ms, lr: 1.0504141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:31,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.42489 samples/s/p 2:19:27 } +2024-07-25 22:52:34,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 828/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 1.0498291e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:34,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43271 samples/s/p 2:19:12 } +2024-07-25 22:52:37,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 830/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 1.0492444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:37,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43547 samples/s/p 2:19:05 } +2024-07-25 
22:52:40,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 832/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 1.0486599e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:40,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43494 samples/s/p 2:19:03 } +2024-07-25 22:52:43,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 834/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 1.0480753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:43,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43675 samples/s/p 2:18:57 } +2024-07-25 22:52:46,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 836/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.04749115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:46,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43934 samples/s/p 2:18:50 } +2024-07-25 22:52:49,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 838/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 1.0469068e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:49,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43530 samples/s/p 2:18:53 } +2024-07-25 22:52:52,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 840/ 1625], loss: 1.130, per_step_time: 1470ms, lr: 1.04632245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:52,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43856 samples/s/p 2:18:45 } +2024-07-25 22:52:55,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 7/ 10], step:[ 842/ 1625], loss: 1.301, per_step_time: 1470ms, lr: 1.0457384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:55,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43913 samples/s/p 2:18:41 } +2024-07-25 22:52:58,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 844/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 1.0451544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:58,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.44025 samples/s/p 2:18:37 } +2024-07-25 22:53:01,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 846/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 1.0445704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:01,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43733 samples/s/p 2:18:38 } +2024-07-25 22:53:04,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 848/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.0439867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:04,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43803 samples/s/p 2:18:34 } +2024-07-25 22:53:07,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 850/ 1625], loss: 1.063, per_step_time: 1469ms, lr: 1.043403e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:07,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.44393 samples/s/p 2:18:22 } +2024-07-25 22:53:09,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 852/ 1625], loss: 1.396, per_step_time: 1472ms, lr: 
1.0428194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:09,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43115 samples/s/p 2:18:39 } +2024-07-25 22:53:12,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 854/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.0422356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:12,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43475 samples/s/p 2:18:30 } +2024-07-25 22:53:15,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 856/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 1.0416523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:15,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43859 samples/s/p 2:18:22 } +2024-07-25 22:53:18,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 858/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 1.0410689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:18,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43395 samples/s/p 2:18:26 } +2024-07-25 22:53:21,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 860/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 1.0404857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:21,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43649 samples/s/p 2:18:19 } +2024-07-25 22:53:24,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 862/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 1.0399025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:24,720 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.44005 samples/s/p 2:18:11 } +2024-07-25 22:53:27,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 864/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.0393195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:27,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43708 samples/s/p 2:18:12 } +2024-07-25 22:53:30,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 866/ 1625], loss: 1.066, per_step_time: 1472ms, lr: 1.03873645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:30,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43131 samples/s/p 2:18:18 } +2024-07-25 22:53:33,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 868/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.0381535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:33,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43531 samples/s/p 2:18:09 } +2024-07-25 22:53:36,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 870/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.03757075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:36,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.43368 samples/s/p 2:18:09 } +2024-07-25 22:53:39,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 872/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 1.036988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:39,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% 
|████████████████████████████████ | 5.43778 samples/s/p 2:17:59 } +2024-07-25 22:53:42,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 874/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 1.0364055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:42,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.43780 samples/s/p 2:17:56 } +2024-07-25 22:53:45,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 876/ 1625], loss: 1.165, per_step_time: 1469ms, lr: 1.035823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:45,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.44300 samples/s/p 2:17:46 } +2024-07-25 22:53:48,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 878/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 1.03524035e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:48,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.43739 samples/s/p 2:17:51 } +2024-07-25 22:53:51,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 880/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 1.0346582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:51,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.44077 samples/s/p 2:17:43 } +2024-07-25 22:53:54,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 882/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 1.0340759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:54,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.44097 samples/s/p 2:17:40 } +2024-07-25 
22:53:57,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 884/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 1.0334936e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:57,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.43485 samples/s/p 2:17:46 } +2024-07-25 22:54:00,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 886/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 1.0329118e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:00,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43323 samples/s/p 2:17:46 } +2024-07-25 22:54:03,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 888/ 1625], loss: 1.220, per_step_time: 1473ms, lr: 1.03233e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:03,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43091 samples/s/p 2:17:46 } +2024-07-25 22:54:06,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 890/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 1.031748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:06,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43283 samples/s/p 2:17:40 } +2024-07-25 22:54:08,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 892/ 1625], loss: 0.970, per_step_time: 1472ms, lr: 1.0311662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:08,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43122 samples/s/p 2:17:40 } +2024-07-25 22:54:11,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 894/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 1.0305846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:11,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43164 samples/s/p 2:17:36 } +2024-07-25 22:54:14,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 896/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 1.0300029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:14,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.44139 samples/s/p 2:17:19 } +2024-07-25 22:54:17,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 898/ 1625], loss: 1.080, per_step_time: 1473ms, lr: 1.0294214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:17,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43019 samples/s/p 2:17:33 } +2024-07-25 22:54:20,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 900/ 1625], loss: 1.331, per_step_time: 1473ms, lr: 1.0288402e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:20,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.42755 samples/s/p 2:17:34 } +2024-07-25 22:54:23,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 902/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 1.0282591e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:23,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43740 samples/s/p 2:17:16 } +2024-07-25 22:54:26,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 904/ 1625], loss: 1.455, per_step_time: 1470ms, lr: 
1.0276777e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:26,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.44099 samples/s/p 2:17:07 } +2024-07-25 22:54:29,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 906/ 1625], loss: 1.311, per_step_time: 1471ms, lr: 1.0270966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:29,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43594 samples/s/p 2:17:12 } +2024-07-25 22:54:32,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 908/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 1.0265158e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:32,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43992 samples/s/p 2:17:03 } +2024-07-25 22:54:35,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 910/ 1625], loss: 1.239, per_step_time: 1473ms, lr: 1.0259348e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:35,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43005 samples/s/p 2:17:15 } +2024-07-25 22:54:38,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 912/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 1.025354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:38,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43548 samples/s/p 2:17:04 } +2024-07-25 22:54:41,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 914/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 1.0247734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:41,435 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43278 samples/s/p 2:17:05 } +2024-07-25 22:54:44,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 916/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 1.0241926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:44,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.44089 samples/s/p 2:16:50 } +2024-07-25 22:54:47,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 918/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 1.0236123e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:47,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.44144 samples/s/p 2:16:46 } +2024-07-25 22:54:50,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 920/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 1.0230318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:50,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43444 samples/s/p 2:16:54 } +2024-07-25 22:54:53,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 922/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 1.0224514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:53,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43989 samples/s/p 2:16:43 } +2024-07-25 22:54:56,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 924/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 1.0218713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:56,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% 
|████████████████████████████████ | 5.43068 samples/s/p 2:16:54 } +2024-07-25 22:54:59,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 926/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 1.0212912e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:59,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43483 samples/s/p 2:16:44 } +2024-07-25 22:55:02,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 928/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.020711e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:02,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43665 samples/s/p 2:16:39 } +2024-07-25 22:55:05,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 930/ 1625], loss: 1.301, per_step_time: 1471ms, lr: 1.0201312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:05,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43647 samples/s/p 2:16:36 } +2024-07-25 22:55:07,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 932/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 1.0195516e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:07,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43632 samples/s/p 2:16:33 } +2024-07-25 22:55:10,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 934/ 1625], loss: 1.258, per_step_time: 1474ms, lr: 1.0189717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:10,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.42401 samples/s/p 2:16:49 } +2024-07-25 
22:55:13,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 936/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 1.01839205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:13,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43094 samples/s/p 2:16:36 } +2024-07-25 22:55:16,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 938/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 1.0178127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:16,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43445 samples/s/p 2:16:27 } +2024-07-25 22:55:19,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 940/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 1.017233e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:19,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43297 samples/s/p 2:16:27 } +2024-07-25 22:55:22,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 942/ 1625], loss: 1.010, per_step_time: 1471ms, lr: 1.0166537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:22,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43527 samples/s/p 2:16:20 } +2024-07-25 22:55:25,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 944/ 1625], loss: 1.362, per_step_time: 1473ms, lr: 1.0160747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:25,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43023 samples/s/p 2:16:25 } +2024-07-25 22:55:28,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 7/ 10], step:[ 946/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 1.0154953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:28,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43925 samples/s/p 2:16:08 } +2024-07-25 22:55:31,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 948/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 1.0149164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:31,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43400 samples/s/p 2:16:13 } +2024-07-25 22:55:34,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 950/ 1625], loss: 1.198, per_step_time: 1470ms, lr: 1.0143374e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:34,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43882 samples/s/p 2:16:03 } +2024-07-25 22:55:37,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 952/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.0137587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:37,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43494 samples/s/p 2:16:06 } +2024-07-25 22:55:40,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 954/ 1625], loss: 1.328, per_step_time: 1470ms, lr: 1.0131798e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:40,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.44166 samples/s/p 2:15:53 } +2024-07-25 22:55:43,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 956/ 1625], loss: 1.227, per_step_time: 1473ms, lr: 
1.0126013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:43,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43068 samples/s/p 2:16:06 } +2024-07-25 22:55:46,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 958/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 1.0120229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:46,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43812 samples/s/p 2:15:52 } +2024-07-25 22:55:49,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 960/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 1.0114442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:49,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43553 samples/s/p 2:15:53 } +2024-07-25 22:55:52,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 962/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.0108661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:52,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43310 samples/s/p 2:15:54 } +2024-07-25 22:55:55,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 964/ 1625], loss: 1.234, per_step_time: 1469ms, lr: 1.0102878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:55,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.44398 samples/s/p 2:15:35 } +2024-07-25 22:55:58,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 966/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 1.0097095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:58,151 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43603 samples/s/p 2:15:44 } +2024-07-25 22:56:01,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 968/ 1625], loss: 1.263, per_step_time: 1470ms, lr: 1.0091317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:01,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.43996 samples/s/p 2:15:35 } +2024-07-25 22:56:04,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 970/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 1.0085536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:04,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.43385 samples/s/p 2:15:41 } +2024-07-25 22:56:07,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 972/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 1.0079756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:07,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.43409 samples/s/p 2:15:38 } +2024-07-25 22:56:09,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 974/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.0073981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:09,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.43748 samples/s/p 2:15:30 } +2024-07-25 22:56:12,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 976/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.00682055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:12,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% 
|█████████████████████████████████ | 5.43436 samples/s/p 2:15:31 } +2024-07-25 22:56:15,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 978/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 1.0062429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:15,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.43699 samples/s/p 2:15:25 } +2024-07-25 22:56:18,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 980/ 1625], loss: 0.984, per_step_time: 1472ms, lr: 1.0056654e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:18,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.43392 samples/s/p 2:15:26 } +2024-07-25 22:56:21,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 982/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 1.0050881e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:21,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.43140 samples/s/p 2:15:27 } +2024-07-25 22:56:24,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 984/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 1.0045107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:24,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43465 samples/s/p 2:15:19 } +2024-07-25 22:56:27,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 986/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 1.0039336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:27,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43642 samples/s/p 2:15:14 } 
+2024-07-25 22:56:30,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 988/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 1.0033567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:30,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43353 samples/s/p 2:15:15 } +2024-07-25 22:56:33,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 990/ 1625], loss: 1.237, per_step_time: 1473ms, lr: 1.0027797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:33,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.42878 samples/s/p 2:15:19 } +2024-07-25 22:56:36,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 992/ 1625], loss: 1.053, per_step_time: 1472ms, lr: 1.00220295e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:36,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43159 samples/s/p 2:15:12 } +2024-07-25 22:56:39,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 994/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 1.00162615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:39,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43088 samples/s/p 2:15:10 } +2024-07-25 22:56:42,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 996/ 1625], loss: 1.059, per_step_time: 1471ms, lr: 1.00104935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:42,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43745 samples/s/p 2:14:57 } +2024-07-25 22:56:45,369 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 998/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 1.0004731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:45,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43526 samples/s/p 2:14:58 } +2024-07-25 22:56:48,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1000/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 9.998966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:48,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43816 samples/s/p 2:14:50 } +2024-07-25 22:56:51,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1002/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 9.993204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:51,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.44058 samples/s/p 2:14:44 } +2024-07-25 22:56:54,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1004/ 1625], loss: 1.277, per_step_time: 1471ms, lr: 9.9874405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:54,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43716 samples/s/p 2:14:46 } +2024-07-25 22:56:57,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1006/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 9.981681e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:57,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43527 samples/s/p 2:14:46 } +2024-07-25 22:57:00,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
7/ 10], step:[ 1008/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 9.975919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:00,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43171 samples/s/p 2:14:48 } +2024-07-25 22:57:03,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1010/ 1625], loss: 1.025, per_step_time: 1472ms, lr: 9.970159e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:03,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43116 samples/s/p 2:14:46 } +2024-07-25 22:57:06,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1012/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 9.964402e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:06,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43899 samples/s/p 2:14:32 } +2024-07-25 22:57:08,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1014/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 9.958644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:08,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43489 samples/s/p 2:14:35 } +2024-07-25 22:57:11,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1016/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 9.952889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:11,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43787 samples/s/p 2:14:27 } +2024-07-25 22:57:14,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1018/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 
9.9471345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:14,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43635 samples/s/p 2:14:27 } +2024-07-25 22:57:17,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1020/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 9.941381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:17,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43566 samples/s/p 2:14:25 } +2024-07-25 22:57:20,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1022/ 1625], loss: 1.217, per_step_time: 1470ms, lr: 9.935626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:20,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.44055 samples/s/p 2:14:15 } +2024-07-25 22:57:23,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1024/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 9.929874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:23,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43260 samples/s/p 2:14:23 } +2024-07-25 22:57:26,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1026/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 9.924124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:26,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43432 samples/s/p 2:14:18 } +2024-07-25 22:57:29,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1028/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 9.918373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:57:29,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43315 samples/s/p 2:14:17 } +2024-07-25 22:57:32,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1030/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 9.9126255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:32,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43791 samples/s/p 2:14:07 } +2024-07-25 22:57:35,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1032/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 9.906877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:35,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43066 samples/s/p 2:14:15 } +2024-07-25 22:57:38,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1034/ 1625], loss: 1.413, per_step_time: 1471ms, lr: 9.901129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:38,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43623 samples/s/p 2:14:03 } +2024-07-25 22:57:41,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1036/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 9.895383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:41,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43798 samples/s/p 2:13:58 } +2024-07-25 22:57:44,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1038/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 9.88964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:44,379 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 66.4% |█████████████████████████████████ | 5.43405 samples/s/p 2:14:01 } +2024-07-25 22:57:47,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1040/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 9.883894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:47,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43397 samples/s/p 2:13:58 } +2024-07-25 22:57:50,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1042/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 9.878152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:50,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43673 samples/s/p 2:13:51 } +2024-07-25 22:57:53,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1044/ 1625], loss: 1.017, per_step_time: 1472ms, lr: 9.872412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:53,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43396 samples/s/p 2:13:52 } +2024-07-25 22:57:56,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1046/ 1625], loss: 1.119, per_step_time: 1473ms, lr: 9.866669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:56,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.42807 samples/s/p 2:13:58 } +2024-07-25 22:57:59,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1048/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 9.860931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:59,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43278 samples/s/p 
2:13:48 } +2024-07-25 22:58:02,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1050/ 1625], loss: 0.856, per_step_time: 1471ms, lr: 9.855194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:02,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43806 samples/s/p 2:13:37 } +2024-07-25 22:58:05,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1052/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 9.849455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:05,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43769 samples/s/p 2:13:35 } +2024-07-25 22:58:07,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1054/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 9.843717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:07,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43249 samples/s/p 2:13:39 } +2024-07-25 22:58:10,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1056/ 1625], loss: 1.144, per_step_time: 1469ms, lr: 9.837982e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:10,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.44371 samples/s/p 2:13:20 } +2024-07-25 22:58:13,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1058/ 1625], loss: 1.321, per_step_time: 1472ms, lr: 9.83225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:13,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43232 samples/s/p 2:13:34 } +2024-07-25 22:58:16,839 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1060/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 9.826515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:16,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43359 samples/s/p 2:13:29 } +2024-07-25 22:58:19,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1062/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 9.820782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:19,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43421 samples/s/p 2:13:25 } +2024-07-25 22:58:22,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1064/ 1625], loss: 1.202, per_step_time: 1472ms, lr: 9.815052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:22,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43171 samples/s/p 2:13:26 } +2024-07-25 22:58:25,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1066/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 9.8093205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:25,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.44056 samples/s/p 2:13:10 } +2024-07-25 22:58:28,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1068/ 1625], loss: 1.151, per_step_time: 1475ms, lr: 9.803592e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:28,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.42356 samples/s/p 2:13:32 } +2024-07-25 22:58:31,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
7/ 10], step:[ 1070/ 1625], loss: 1.212, per_step_time: 1472ms, lr: 9.797865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:31,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43138 samples/s/p 2:13:17 } +2024-07-25 22:58:34,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1072/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 9.792137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:34,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43782 samples/s/p 2:13:05 } +2024-07-25 22:58:37,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1074/ 1625], loss: 1.028, per_step_time: 1471ms, lr: 9.786411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:37,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43625 samples/s/p 2:13:04 } +2024-07-25 22:58:40,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1076/ 1625], loss: 1.238, per_step_time: 1476ms, lr: 9.780687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:40,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.41812 samples/s/p 2:13:28 } +2024-07-25 22:58:43,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1078/ 1625], loss: 0.977, per_step_time: 1471ms, lr: 9.774961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:43,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43666 samples/s/p 2:12:58 } +2024-07-25 22:58:46,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1080/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 
9.769238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:46,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43669 samples/s/p 2:12:55 } +2024-07-25 22:58:49,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1082/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 9.7635175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:49,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.43522 samples/s/p 2:12:54 } +2024-07-25 22:58:52,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1084/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 9.757795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:52,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.43715 samples/s/p 2:12:48 } +2024-07-25 22:58:55,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1086/ 1625], loss: 1.128, per_step_time: 1470ms, lr: 9.752076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:55,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.44027 samples/s/p 2:12:41 } +2024-07-25 22:58:58,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1088/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 9.74636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:58,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.43860 samples/s/p 2:12:40 } +2024-07-25 22:59:01,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1090/ 1625], loss: 1.035, per_step_time: 1470ms, lr: 9.74064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:59:01,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.44071 samples/s/p 2:12:34 } +2024-07-25 22:59:04,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1092/ 1625], loss: 0.914, per_step_time: 1470ms, lr: 9.734924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:04,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.44090 samples/s/p 2:12:31 } +2024-07-25 22:59:07,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1094/ 1625], loss: 1.004, per_step_time: 1471ms, lr: 9.72921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:07,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.43617 samples/s/p 2:12:35 } +2024-07-25 22:59:09,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1096/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 9.723492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:09,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.43447 samples/s/p 2:12:35 } +2024-07-25 22:59:12,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1098/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 9.71778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:12,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.43097 samples/s/p 2:12:37 } +2024-07-25 22:59:15,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1100/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 9.712069e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:15,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 66.8% |█████████████████████████████████ | 5.43420 samples/s/p 2:12:29 } +2024-07-25 22:59:18,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1102/ 1625], loss: 1.088, per_step_time: 1473ms, lr: 9.706359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:18,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.43018 samples/s/p 2:12:32 } +2024-07-25 22:59:21,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1104/ 1625], loss: 1.245, per_step_time: 1474ms, lr: 9.700648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:21,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.42573 samples/s/p 2:12:36 } +2024-07-25 22:59:24,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1106/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 9.694939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:24,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.42962 samples/s/p 2:12:27 } +2024-07-25 22:59:27,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1108/ 1625], loss: 1.100, per_step_time: 1475ms, lr: 9.689233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:27,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.42282 samples/s/p 2:12:34 } +2024-07-25 22:59:30,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1110/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 9.683524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:30,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.43321 samples/s/p 2:12:16 } 
+2024-07-25 22:59:33,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1112/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 9.677818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:33,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.43486 samples/s/p 2:12:11 } +2024-07-25 22:59:36,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1114/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 9.672114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:36,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43712 samples/s/p 2:12:04 } +2024-07-25 22:59:39,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1116/ 1625], loss: 1.218, per_step_time: 1470ms, lr: 9.66641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:39,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43866 samples/s/p 2:11:59 } +2024-07-25 22:59:42,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1118/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 9.660708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:42,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43498 samples/s/p 2:12:02 } +2024-07-25 22:59:45,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1120/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 9.655007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:45,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43843 samples/s/p 2:11:54 } +2024-07-25 22:59:48,331 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1122/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 9.649304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:48,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43534 samples/s/p 2:11:55 } +2024-07-25 22:59:51,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1124/ 1625], loss: 1.076, per_step_time: 1470ms, lr: 9.643607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:51,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43935 samples/s/p 2:11:46 } +2024-07-25 22:59:54,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1126/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 9.637908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:54,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.42837 samples/s/p 2:11:59 } +2024-07-25 22:59:57,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1128/ 1625], loss: 1.062, per_step_time: 1474ms, lr: 9.632209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:57,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.42634 samples/s/p 2:11:59 } +2024-07-25 23:00:00,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1130/ 1625], loss: 1.277, per_step_time: 1472ms, lr: 9.626515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:00,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43181 samples/s/p 2:11:48 } +2024-07-25 23:00:03,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
7/ 10], step:[ 1132/ 1625], loss: 1.204, per_step_time: 1470ms, lr: 9.620821e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:03,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.44049 samples/s/p 2:11:33 } +2024-07-25 23:00:06,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1134/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 9.615126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:06,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43211 samples/s/p 2:11:42 } +2024-07-25 23:00:08,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1136/ 1625], loss: 1.150, per_step_time: 1474ms, lr: 9.609432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:08,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.42721 samples/s/p 2:11:46 } +2024-07-25 23:00:11,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1138/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 9.603742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:11,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43769 samples/s/p 2:11:28 } +2024-07-25 23:00:14,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1140/ 1625], loss: 0.999, per_step_time: 1471ms, lr: 9.5980495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:14,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43758 samples/s/p 2:11:25 } +2024-07-25 23:00:17,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1142/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 
9.592361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:17,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43564 samples/s/p 2:11:25 } +2024-07-25 23:00:20,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1144/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 9.586673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:20,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43091 samples/s/p 2:11:29 } +2024-07-25 23:00:23,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1146/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 9.580984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:23,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.42988 samples/s/p 2:11:28 } +2024-07-25 23:00:26,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1148/ 1625], loss: 1.032, per_step_time: 1471ms, lr: 9.5752985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:26,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.43770 samples/s/p 2:11:13 } +2024-07-25 23:00:29,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1150/ 1625], loss: 1.355, per_step_time: 1470ms, lr: 9.569613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:29,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.43875 samples/s/p 2:11:09 } +2024-07-25 23:00:32,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1152/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 9.563931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:00:32,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.42984 samples/s/p 2:11:19 } +2024-07-25 23:00:35,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1154/ 1625], loss: 1.064, per_step_time: 1470ms, lr: 9.558246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:35,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.44192 samples/s/p 2:10:58 } +2024-07-25 23:00:38,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1156/ 1625], loss: 0.959, per_step_time: 1473ms, lr: 9.552564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:38,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.42948 samples/s/p 2:11:14 } +2024-07-25 23:00:41,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1158/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 9.546885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:41,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.43178 samples/s/p 2:11:07 } +2024-07-25 23:00:44,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1160/ 1625], loss: 1.109, per_step_time: 1473ms, lr: 9.541203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:44,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.42833 samples/s/p 2:11:09 } +2024-07-25 23:00:47,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1162/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 9.535527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:47,364 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 67.2% |█████████████████████████████████ | 5.43776 samples/s/p 2:10:53 } +2024-07-25 23:00:50,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1164/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 9.529848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:50,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43378 samples/s/p 2:10:56 } +2024-07-25 23:00:53,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1166/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 9.52417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:53,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43128 samples/s/p 2:10:56 } +2024-07-25 23:00:56,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1168/ 1625], loss: 1.204, per_step_time: 1473ms, lr: 9.518497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:56,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43015 samples/s/p 2:10:55 } +2024-07-25 23:00:59,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1170/ 1625], loss: 1.179, per_step_time: 1469ms, lr: 9.5128225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:59,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.44243 samples/s/p 2:10:34 } +2024-07-25 23:01:02,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1172/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 9.507149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:02,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43827 samples/s/p 
2:10:37 } +2024-07-25 23:01:05,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1174/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 9.5014775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:05,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43521 samples/s/p 2:10:39 } +2024-07-25 23:01:08,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1176/ 1625], loss: 0.935, per_step_time: 1469ms, lr: 9.495808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:08,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.44553 samples/s/p 2:10:21 } +2024-07-25 23:01:10,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1178/ 1625], loss: 1.361, per_step_time: 1472ms, lr: 9.490135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:10,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43376 samples/s/p 2:10:35 } +2024-07-25 23:01:13,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1180/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 9.484467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:13,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43476 samples/s/p 2:10:31 } +2024-07-25 23:01:16,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1182/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 9.478801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:16,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43529 samples/s/p 2:10:27 } +2024-07-25 23:01:19,821 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1184/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 9.473134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:19,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43011 samples/s/p 2:10:31 } +2024-07-25 23:01:22,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1186/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 9.46747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:22,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43550 samples/s/p 2:10:21 } +2024-07-25 23:01:25,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1188/ 1625], loss: 1.081, per_step_time: 1470ms, lr: 9.461806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:25,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43948 samples/s/p 2:10:12 } +2024-07-25 23:01:28,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1190/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 9.45614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:28,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43238 samples/s/p 2:10:19 } +2024-07-25 23:01:31,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1192/ 1625], loss: 1.165, per_step_time: 1475ms, lr: 9.450478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:31,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.42322 samples/s/p 2:10:30 } +2024-07-25 23:01:34,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 
10], step:[ 1194/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 9.4448205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:34,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.42811 samples/s/p 2:10:20 } +2024-07-25 23:01:37,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1196/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 9.439157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:37,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43745 samples/s/p 2:10:03 } +2024-07-25 23:01:40,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1198/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 9.433498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:40,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43549 samples/s/p 2:10:03 } +2024-07-25 23:01:43,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1200/ 1625], loss: 1.250, per_step_time: 1475ms, lr: 9.427843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:43,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.42215 samples/s/p 2:10:19 } +2024-07-25 23:01:46,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1202/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 9.422187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:46,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43648 samples/s/p 2:09:56 } +2024-07-25 23:01:49,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1204/ 1625], loss: 1.308, per_step_time: 1471ms, lr: 
9.416531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:49,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43655 samples/s/p 2:09:53 } +2024-07-25 23:01:52,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1206/ 1625], loss: 1.291, per_step_time: 1473ms, lr: 9.410877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:52,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.42842 samples/s/p 2:10:01 } +2024-07-25 23:01:55,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1208/ 1625], loss: 0.939, per_step_time: 1472ms, lr: 9.405225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:55,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43304 samples/s/p 2:09:52 } +2024-07-25 23:01:58,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1210/ 1625], loss: 0.981, per_step_time: 1471ms, lr: 9.399572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:58,200 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43585 samples/s/p 2:09:45 } +2024-07-25 23:02:01,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1212/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 9.393922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:01,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43439 samples/s/p 2:09:44 } +2024-07-25 23:02:04,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1214/ 1625], loss: 1.097, per_step_time: 1469ms, lr: 9.388271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:02:04,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.44262 samples/s/p 2:09:29 } +2024-07-25 23:02:07,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1216/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 9.382622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:07,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43446 samples/s/p 2:09:38 } +2024-07-25 23:02:09,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1218/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 9.376975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:09,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.44150 samples/s/p 2:09:25 } +2024-07-25 23:02:12,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1220/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 9.371329e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:12,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43814 samples/s/p 2:09:27 } +2024-07-25 23:02:15,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1222/ 1625], loss: 1.106, per_step_time: 1470ms, lr: 9.365684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:15,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43901 samples/s/p 2:09:23 } +2024-07-25 23:02:18,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1224/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 9.36004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:18,845 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 67.5% |█████████████████████████████████ | 5.43648 samples/s/p 2:09:23 } +2024-07-25 23:02:21,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1226/ 1625], loss: 0.925, per_step_time: 1471ms, lr: 9.354397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:21,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43663 samples/s/p 2:09:20 } +2024-07-25 23:02:24,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1228/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 9.348755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:24,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43945 samples/s/p 2:09:13 } +2024-07-25 23:02:27,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1230/ 1625], loss: 0.979, per_step_time: 1469ms, lr: 9.3431145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:27,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.44312 samples/s/p 2:09:05 } +2024-07-25 23:02:30,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1232/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 9.337477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:30,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43933 samples/s/p 2:09:08 } +2024-07-25 23:02:33,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1234/ 1625], loss: 1.056, per_step_time: 1473ms, lr: 9.331837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:33,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43051 samples/s/p 
2:09:17 } +2024-07-25 23:02:36,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1236/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 9.326199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:36,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43295 samples/s/p 2:09:11 } +2024-07-25 23:02:39,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1238/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 9.320565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:39,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43176 samples/s/p 2:09:09 } +2024-07-25 23:02:42,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1240/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 9.314927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:42,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43539 samples/s/p 2:09:01 } +2024-07-25 23:02:45,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1242/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 9.309294e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:45,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43175 samples/s/p 2:09:04 } +2024-07-25 23:02:48,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1244/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 9.303664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:48,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43635 samples/s/p 2:08:54 } +2024-07-25 23:02:51,301 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1246/ 1625], loss: 1.291, per_step_time: 1472ms, lr: 9.29803e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:51,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43246 samples/s/p 2:08:57 } +2024-07-25 23:02:54,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1248/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 9.292402e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:54,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43753 samples/s/p 2:08:47 } +2024-07-25 23:02:57,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1250/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 9.286772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:57,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43575 samples/s/p 2:08:46 } +2024-07-25 23:03:00,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1252/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 9.281144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:00,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43254 samples/s/p 2:08:48 } +2024-07-25 23:03:03,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1254/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 9.275517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:03,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43916 samples/s/p 2:08:35 } +2024-07-25 23:03:06,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
7/ 10], step:[ 1256/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 9.269891e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:06,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.44023 samples/s/p 2:08:31 } +2024-07-25 23:03:09,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1258/ 1625], loss: 1.270, per_step_time: 1473ms, lr: 9.264267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:09,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.42999 samples/s/p 2:08:43 } +2024-07-25 23:03:11,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1260/ 1625], loss: 1.134, per_step_time: 1470ms, lr: 9.258643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:11,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43850 samples/s/p 2:08:28 } +2024-07-25 23:03:14,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1262/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 9.25302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:14,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43148 samples/s/p 2:08:35 } +2024-07-25 23:03:17,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1264/ 1625], loss: 1.306, per_step_time: 1470ms, lr: 9.247399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:17,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43872 samples/s/p 2:08:21 } +2024-07-25 23:03:20,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1266/ 1625], loss: 1.116, per_step_time: 1470ms, lr: 
9.2417795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:20,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43984 samples/s/p 2:08:17 } +2024-07-25 23:03:23,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1268/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 9.236161e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:23,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43557 samples/s/p 2:08:20 } +2024-07-25 23:03:26,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1270/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 9.230546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:26,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43448 samples/s/p 2:08:18 } +2024-07-25 23:03:29,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1272/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 9.2249265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:29,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43768 samples/s/p 2:08:11 } +2024-07-25 23:03:32,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1274/ 1625], loss: 1.331, per_step_time: 1471ms, lr: 9.21931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:32,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43828 samples/s/p 2:08:07 } +2024-07-25 23:03:35,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1276/ 1625], loss: 1.114, per_step_time: 1473ms, lr: 9.2137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:03:35,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.42825 samples/s/p 2:08:18 } +2024-07-25 23:03:38,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1278/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 9.208084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:38,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43504 samples/s/p 2:08:06 } +2024-07-25 23:03:41,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1280/ 1625], loss: 1.120, per_step_time: 1470ms, lr: 9.202471e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:41,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43954 samples/s/p 2:07:57 } +2024-07-25 23:03:44,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1282/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 9.196864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:44,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43453 samples/s/p 2:08:01 } +2024-07-25 23:03:47,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1284/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 9.191251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:47,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43537 samples/s/p 2:07:57 } +2024-07-25 23:03:50,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1286/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 9.1856455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:50,311 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 67.9% |█████████████████████████████████ | 5.43413 samples/s/p 2:07:55 } +2024-07-25 23:03:53,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1288/ 1625], loss: 1.146, per_step_time: 1475ms, lr: 9.180038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:53,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.42197 samples/s/p 2:08:10 } +2024-07-25 23:03:56,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1290/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 9.174429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:56,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43135 samples/s/p 2:07:53 } +2024-07-25 23:03:59,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1292/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 9.168827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:59,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.43204 samples/s/p 2:07:50 } +2024-07-25 23:04:02,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1294/ 1625], loss: 1.087, per_step_time: 1473ms, lr: 9.163223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:02,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.42911 samples/s/p 2:07:51 } +2024-07-25 23:04:05,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1296/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 9.157618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:05,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.43552 samples/s/p 
2:07:39 } +2024-07-25 23:04:08,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1298/ 1625], loss: 1.007, per_step_time: 1470ms, lr: 9.152019e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:08,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.43888 samples/s/p 2:07:31 } +2024-07-25 23:04:10,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1300/ 1625], loss: 1.401, per_step_time: 1471ms, lr: 9.146418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:10,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43770 samples/s/p 2:07:30 } +2024-07-25 23:04:13,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1302/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 9.140819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:13,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43486 samples/s/p 2:07:31 } +2024-07-25 23:04:16,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1304/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 9.13522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:16,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43458 samples/s/p 2:07:28 } +2024-07-25 23:04:19,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1306/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 9.129623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:19,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43413 samples/s/p 2:07:26 } +2024-07-25 23:04:22,783 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1308/ 1625], loss: 0.967, per_step_time: 1472ms, lr: 9.124028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:22,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43167 samples/s/p 2:07:27 } +2024-07-25 23:04:25,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1310/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 9.118434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:25,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43949 samples/s/p 2:07:13 } +2024-07-25 23:04:28,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1312/ 1625], loss: 1.311, per_step_time: 1471ms, lr: 9.112841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:28,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43495 samples/s/p 2:07:16 } +2024-07-25 23:04:31,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1314/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 9.107252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:31,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43746 samples/s/p 2:07:10 } +2024-07-25 23:04:34,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1316/ 1625], loss: 1.073, per_step_time: 1472ms, lr: 9.101657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:34,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43275 samples/s/p 2:07:13 } +2024-07-25 23:04:37,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 1318/ 1625], loss: 1.202, per_step_time: 1470ms, lr: 9.0960675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:37,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43858 samples/s/p 2:07:02 } +2024-07-25 23:04:40,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1320/ 1625], loss: 1.109, per_step_time: 1475ms, lr: 9.090482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:40,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.42358 samples/s/p 2:07:20 } +2024-07-25 23:04:43,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1322/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 9.084893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:43,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43456 samples/s/p 2:07:02 } +2024-07-25 23:04:46,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1324/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 9.079306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:46,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43204 samples/s/p 2:07:02 } +2024-07-25 23:04:49,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1326/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 9.073725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:49,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43554 samples/s/p 2:06:55 } +2024-07-25 23:04:52,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1328/ 1625], loss: 1.125, per_step_time: 
1472ms, lr: 9.068137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:52,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43183 samples/s/p 2:06:57 } +2024-07-25 23:04:55,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1330/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 9.062558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:55,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43573 samples/s/p 2:06:48 } +2024-07-25 23:04:58,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1332/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 9.056976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:58,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.44034 samples/s/p 2:06:39 } +2024-07-25 23:05:01,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1334/ 1625], loss: 1.368, per_step_time: 1471ms, lr: 9.051393e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:01,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43544 samples/s/p 2:06:43 } +2024-07-25 23:05:04,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1336/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 9.045816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:04,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43756 samples/s/p 2:06:37 } +2024-07-25 23:05:07,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1338/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 9.040239e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:05:07,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43146 samples/s/p 2:06:43 } +2024-07-25 23:05:09,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1340/ 1625], loss: 0.975, per_step_time: 1471ms, lr: 9.034659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:10,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43540 samples/s/p 2:06:34 } +2024-07-25 23:05:12,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1342/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 9.029087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:12,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43628 samples/s/p 2:06:30 } +2024-07-25 23:05:15,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1344/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 9.023513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:15,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43352 samples/s/p 2:06:31 } +2024-07-25 23:05:18,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1346/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 9.017939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:18,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43864 samples/s/p 2:06:21 } +2024-07-25 23:05:21,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1348/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 9.012367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:21,801 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43582 samples/s/p 2:06:22 } +2024-07-25 23:05:24,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1350/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 9.006797e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:24,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43781 samples/s/p 2:06:16 } +2024-07-25 23:05:27,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1352/ 1625], loss: 1.252, per_step_time: 1470ms, lr: 9.001227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:27,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43946 samples/s/p 2:06:11 } +2024-07-25 23:05:30,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1354/ 1625], loss: 1.218, per_step_time: 1474ms, lr: 8.995658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:30,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.42730 samples/s/p 2:06:25 } +2024-07-25 23:05:33,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1356/ 1625], loss: 1.074, per_step_time: 1474ms, lr: 8.990091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:33,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.42591 samples/s/p 2:06:24 } +2024-07-25 23:05:36,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1358/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 8.984529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:36,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% 
|██████████████████████████████████ | 5.43134 samples/s/p 2:06:13 } +2024-07-25 23:05:39,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1360/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 8.978961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:39,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.44093 samples/s/p 2:05:57 } +2024-07-25 23:05:42,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1362/ 1625], loss: 1.137, per_step_time: 1470ms, lr: 8.973397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:42,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.43850 samples/s/p 2:05:57 } +2024-07-25 23:05:45,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1364/ 1625], loss: 0.968, per_step_time: 1473ms, lr: 8.967838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:45,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.42752 samples/s/p 2:06:10 } +2024-07-25 23:05:48,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1366/ 1625], loss: 1.122, per_step_time: 1473ms, lr: 8.962274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:48,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.43048 samples/s/p 2:06:03 } +2024-07-25 23:05:51,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1368/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 8.956715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:51,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.43498 samples/s/p 2:05:54 } 
+2024-07-25 23:05:54,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1370/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 8.951159e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:54,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.43832 samples/s/p 2:05:46 } +2024-07-25 23:05:57,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1372/ 1625], loss: 1.034, per_step_time: 1468ms, lr: 8.945599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:57,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.44711 samples/s/p 2:05:31 } +2024-07-25 23:06:00,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1374/ 1625], loss: 0.906, per_step_time: 1471ms, lr: 8.940045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:00,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43657 samples/s/p 2:05:42 } +2024-07-25 23:06:03,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1376/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 8.93449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:03,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43661 samples/s/p 2:05:39 } +2024-07-25 23:06:06,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1378/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 8.928933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:06,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43110 samples/s/p 2:05:44 } +2024-07-25 23:06:09,017 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1380/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 8.923384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:09,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43156 samples/s/p 2:05:41 } +2024-07-25 23:06:11,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1382/ 1625], loss: 1.143, per_step_time: 1474ms, lr: 8.917832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:11,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.42630 samples/s/p 2:05:45 } +2024-07-25 23:06:14,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1384/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 8.912279e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:14,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43172 samples/s/p 2:05:35 } +2024-07-25 23:06:17,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1386/ 1625], loss: 1.258, per_step_time: 1473ms, lr: 8.906733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:17,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.42991 samples/s/p 2:05:34 } +2024-07-25 23:06:20,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1388/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 8.9011855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:20,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43740 samples/s/p 2:05:21 } +2024-07-25 23:06:23,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 1390/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 8.8956385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:23,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.44000 samples/s/p 2:05:14 } +2024-07-25 23:06:26,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1392/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 8.890093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:26,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43725 samples/s/p 2:05:15 } +2024-07-25 23:06:29,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1394/ 1625], loss: 1.212, per_step_time: 1472ms, lr: 8.884548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:29,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43413 samples/s/p 2:05:16 } +2024-07-25 23:06:32,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1396/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 8.879007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:32,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43627 samples/s/p 2:05:11 } +2024-07-25 23:06:35,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1398/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 8.873465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:35,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.42849 samples/s/p 2:05:18 } +2024-07-25 23:06:38,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1400/ 1625], loss: 1.202, per_step_time: 
1470ms, lr: 8.8679235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:38,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.44137 samples/s/p 2:04:58 } +2024-07-25 23:06:41,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1402/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 8.862388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:41,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.42801 samples/s/p 2:05:13 } +2024-07-25 23:06:44,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1404/ 1625], loss: 1.314, per_step_time: 1472ms, lr: 8.856847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:44,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43154 samples/s/p 2:05:05 } +2024-07-25 23:06:47,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1406/ 1625], loss: 0.921, per_step_time: 1470ms, lr: 8.851311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:47,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.44000 samples/s/p 2:04:51 } +2024-07-25 23:06:50,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1408/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 8.845777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:50,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.43956 samples/s/p 2:04:48 } +2024-07-25 23:06:53,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1410/ 1625], loss: 1.035, per_step_time: 1474ms, lr: 8.840241e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:06:53,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.42693 samples/s/p 2:05:03 } +2024-07-25 23:06:56,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1412/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 8.834708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:56,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.43840 samples/s/p 2:04:44 } +2024-07-25 23:06:59,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1414/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 8.829178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:59,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.43036 samples/s/p 2:04:52 } +2024-07-25 23:07:02,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1416/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 8.823646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:02,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.43707 samples/s/p 2:04:40 } +2024-07-25 23:07:05,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1418/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 8.81812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:05,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.43748 samples/s/p 2:04:36 } +2024-07-25 23:07:08,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1420/ 1625], loss: 1.044, per_step_time: 1470ms, lr: 8.81259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:08,039 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.44094 samples/s/p 2:04:29 } +2024-07-25 23:07:10,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1422/ 1625], loss: 1.141, per_step_time: 1469ms, lr: 8.80706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:10,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.44268 samples/s/p 2:04:23 } +2024-07-25 23:07:13,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1424/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 8.801538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:13,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43180 samples/s/p 2:04:35 } +2024-07-25 23:07:16,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1426/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 8.796013e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:16,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.44216 samples/s/p 2:04:18 } +2024-07-25 23:07:19,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1428/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 8.79049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:19,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43962 samples/s/p 2:04:19 } +2024-07-25 23:07:22,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1430/ 1625], loss: 1.459, per_step_time: 1470ms, lr: 8.7849685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:22,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% 
|██████████████████████████████████ | 5.43950 samples/s/p 2:04:16 } +2024-07-25 23:07:25,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1432/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 8.779447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:25,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43761 samples/s/p 2:04:16 } +2024-07-25 23:07:28,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1434/ 1625], loss: 1.256, per_step_time: 1473ms, lr: 8.773927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:28,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43085 samples/s/p 2:04:22 } +2024-07-25 23:07:31,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1436/ 1625], loss: 1.156, per_step_time: 1473ms, lr: 8.76841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:31,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43051 samples/s/p 2:04:20 } +2024-07-25 23:07:34,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1438/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 8.762892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:34,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43388 samples/s/p 2:04:12 } +2024-07-25 23:07:37,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1440/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 8.757377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:37,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43382 samples/s/p 2:04:09 } 
+2024-07-25 23:07:40,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1442/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 8.751863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:40,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43201 samples/s/p 2:04:09 } +2024-07-25 23:07:43,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1444/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 8.746349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:43,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43320 samples/s/p 2:04:04 } +2024-07-25 23:07:46,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1446/ 1625], loss: 1.224, per_step_time: 1471ms, lr: 8.740837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:46,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43786 samples/s/p 2:03:55 } +2024-07-25 23:07:49,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1448/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 8.7353255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:49,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43059 samples/s/p 2:04:02 } +2024-07-25 23:07:52,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1450/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 8.729817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:52,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43809 samples/s/p 2:03:49 } +2024-07-25 23:07:52,300 - 
mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-25 23:08:28,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1452/ 1625], loss: 1.025, per_step_time: 2123ms, lr: 8.724312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:28,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 3.76751 samples/s/p 2:58:39 } +2024-07-25 23:08:31,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1454/ 1625], loss: 1.010, per_step_time: 1475ms, lr: 8.718801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:31,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.42306 samples/s/p 2:04:03 } +2024-07-25 23:08:34,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1456/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 8.713299e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:34,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.43294 samples/s/p 2:03:47 } +2024-07-25 23:08:37,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1458/ 1625], loss: 1.152, per_step_time: 1469ms, lr: 8.707794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:37,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.44243 samples/s/p 2:03:31 } +2024-07-25 23:08:40,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1460/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 8.702288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:40,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.44062 
samples/s/p 2:03:30 } +2024-07-25 23:08:43,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1462/ 1625], loss: 0.991, per_step_time: 1471ms, lr: 8.696789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:43,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.43835 samples/s/p 2:03:31 } +2024-07-25 23:08:46,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1464/ 1625], loss: 1.277, per_step_time: 1478ms, lr: 8.691288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:46,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.41173 samples/s/p 2:04:04 } +2024-07-25 23:08:49,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1466/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 8.685786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:49,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.43365 samples/s/p 2:03:31 } +2024-07-25 23:08:52,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1468/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 8.680291e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:52,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.43623 samples/s/p 2:03:25 } +2024-07-25 23:08:55,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1470/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 8.674794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:55,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.43606 samples/s/p 2:03:22 } +2024-07-25 23:08:58,300 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1472/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 8.669298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:58,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43524 samples/s/p 2:03:20 } +2024-07-25 23:09:01,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1474/ 1625], loss: 1.186, per_step_time: 1473ms, lr: 8.663804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:01,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.42887 samples/s/p 2:03:26 } +2024-07-25 23:09:04,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1476/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 8.658311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:04,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43338 samples/s/p 2:03:17 } +2024-07-25 23:09:07,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1478/ 1625], loss: 1.037, per_step_time: 1472ms, lr: 8.652818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:07,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43377 samples/s/p 2:03:13 } +2024-07-25 23:09:10,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1480/ 1625], loss: 1.177, per_step_time: 1474ms, lr: 8.647328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:10,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.42662 samples/s/p 2:03:20 } +2024-07-25 23:09:13,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 1482/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 8.641839e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:13,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.42805 samples/s/p 2:03:15 } +2024-07-25 23:09:16,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1484/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 8.63635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:16,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43224 samples/s/p 2:03:07 } +2024-07-25 23:09:18,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1486/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 8.630864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:18,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43861 samples/s/p 2:02:55 } +2024-07-25 23:09:21,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1488/ 1625], loss: 0.997, per_step_time: 1471ms, lr: 8.625377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:21,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43506 samples/s/p 2:02:57 } +2024-07-25 23:09:24,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1490/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 8.619893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:24,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43070 samples/s/p 2:03:00 } +2024-07-25 23:09:27,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1492/ 1625], loss: 1.212, per_step_time: 
1471ms, lr: 8.614409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:27,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43807 samples/s/p 2:02:47 } +2024-07-25 23:09:30,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1494/ 1625], loss: 0.945, per_step_time: 1474ms, lr: 8.6089285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:30,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.42527 samples/s/p 2:03:01 } +2024-07-25 23:09:33,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1496/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 8.603447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:33,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43630 samples/s/p 2:02:43 } +2024-07-25 23:09:36,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1498/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 8.597967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:36,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43458 samples/s/p 2:02:43 } +2024-07-25 23:09:39,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1500/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 8.592493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:39,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.44125 samples/s/p 2:02:31 } +2024-07-25 23:09:42,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1502/ 1625], loss: 1.362, per_step_time: 1471ms, lr: 8.587017e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:09:42,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43519 samples/s/p 2:02:36 } +2024-07-25 23:09:45,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1504/ 1625], loss: 1.001, per_step_time: 1471ms, lr: 8.581538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:45,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.43808 samples/s/p 2:02:29 } +2024-07-25 23:09:48,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1506/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 8.576068e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:48,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.43741 samples/s/p 2:02:27 } +2024-07-25 23:09:51,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1508/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 8.570594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:51,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.42943 samples/s/p 2:02:35 } +2024-07-25 23:09:54,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1510/ 1625], loss: 1.236, per_step_time: 1474ms, lr: 8.565119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:54,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.42565 samples/s/p 2:02:37 } +2024-07-25 23:09:57,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1512/ 1625], loss: 1.259, per_step_time: 1473ms, lr: 8.559652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:57,342 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.42853 samples/s/p 2:02:30 } +2024-07-25 23:10:00,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1514/ 1625], loss: 0.986, per_step_time: 1469ms, lr: 8.554183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:00,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.44460 samples/s/p 2:02:06 } +2024-07-25 23:10:03,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1516/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 8.548715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:03,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.43824 samples/s/p 2:02:11 } +2024-07-25 23:10:06,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1518/ 1625], loss: 1.097, per_step_time: 1470ms, lr: 8.543249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:06,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.43887 samples/s/p 2:02:07 } +2024-07-25 23:10:09,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1520/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 8.537784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:09,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.44078 samples/s/p 2:02:02 } +2024-07-25 23:10:12,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1522/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 8.532321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:12,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% 
|██████████████████████████████████ | 5.43108 samples/s/p 2:02:12 } +2024-07-25 23:10:15,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1524/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 8.5268575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:15,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43452 samples/s/p 2:02:05 } +2024-07-25 23:10:17,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1526/ 1625], loss: 1.011, per_step_time: 1471ms, lr: 8.521397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:17,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43685 samples/s/p 2:01:58 } +2024-07-25 23:10:20,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1528/ 1625], loss: 0.987, per_step_time: 1472ms, lr: 8.515936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:20,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43336 samples/s/p 2:02:00 } +2024-07-25 23:10:23,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1530/ 1625], loss: 1.117, per_step_time: 1470ms, lr: 8.5104775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:23,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.44084 samples/s/p 2:01:47 } +2024-07-25 23:10:26,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1532/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 8.505021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:26,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43422 samples/s/p 2:01:53 } 
+2024-07-25 23:10:29,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1534/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 8.499564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:29,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43789 samples/s/p 2:01:45 } +2024-07-25 23:10:32,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1536/ 1625], loss: 1.032, per_step_time: 1470ms, lr: 8.494109e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:32,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.43849 samples/s/p 2:01:42 } +2024-07-25 23:10:35,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1538/ 1625], loss: 1.328, per_step_time: 1473ms, lr: 8.488656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:35,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.42903 samples/s/p 2:01:51 } +2024-07-25 23:10:38,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1540/ 1625], loss: 1.013, per_step_time: 1470ms, lr: 8.483204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:38,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.43926 samples/s/p 2:01:35 } +2024-07-25 23:10:41,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1542/ 1625], loss: 1.068, per_step_time: 1473ms, lr: 8.477753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:41,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.43077 samples/s/p 2:01:43 } +2024-07-25 23:10:44,544 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1544/ 1625], loss: 0.986, per_step_time: 1471ms, lr: 8.472306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:44,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.43644 samples/s/p 2:01:33 } +2024-07-25 23:10:47,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1546/ 1625], loss: 1.187, per_step_time: 1474ms, lr: 8.4668545e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:47,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.42656 samples/s/p 2:01:43 } +2024-07-25 23:10:50,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1548/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 8.461408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:50,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.43199 samples/s/p 2:01:33 } +2024-07-25 23:10:53,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1550/ 1625], loss: 1.124, per_step_time: 1482ms, lr: 8.455965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:53,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.39638 samples/s/p 2:02:18 } +2024-07-25 23:10:56,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1552/ 1625], loss: 1.251, per_step_time: 1473ms, lr: 8.45052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:56,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.42996 samples/s/p 2:01:29 } +2024-07-25 23:10:59,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 1554/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 8.445074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:59,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43350 samples/s/p 2:01:22 } +2024-07-25 23:11:02,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1556/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 8.439636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:02,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43844 samples/s/p 2:01:12 } +2024-07-25 23:11:05,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1558/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 8.434195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:05,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43693 samples/s/p 2:01:11 } +2024-07-25 23:11:08,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1560/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 8.428756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:08,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43758 samples/s/p 2:01:07 } +2024-07-25 23:11:11,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1562/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 8.423317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:11,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43667 samples/s/p 2:01:06 } +2024-07-25 23:11:14,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1564/ 1625], loss: 1.206, per_step_time: 
1471ms, lr: 8.41788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:14,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43584 samples/s/p 2:01:04 } +2024-07-25 23:11:17,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1566/ 1625], loss: 1.008, per_step_time: 1472ms, lr: 8.412446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:17,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43397 samples/s/p 2:01:03 } +2024-07-25 23:11:19,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1568/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 8.407012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:19,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43568 samples/s/p 2:00:58 } +2024-07-25 23:11:22,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1570/ 1625], loss: 1.127, per_step_time: 1474ms, lr: 8.401578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:22,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.42695 samples/s/p 2:01:07 } +2024-07-25 23:11:25,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1572/ 1625], loss: 1.227, per_step_time: 1469ms, lr: 8.396148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:25,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.44348 samples/s/p 2:00:42 } +2024-07-25 23:11:28,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1574/ 1625], loss: 1.042, per_step_time: 1470ms, lr: 8.390716e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:11:28,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43909 samples/s/p 2:00:45 } +2024-07-25 23:11:31,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1576/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 8.385287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:31,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43812 samples/s/p 2:00:43 } +2024-07-25 23:11:34,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1578/ 1625], loss: 1.267, per_step_time: 1470ms, lr: 8.37986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:34,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43906 samples/s/p 2:00:39 } +2024-07-25 23:11:37,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1580/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 8.3744335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:37,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43694 samples/s/p 2:00:39 } +2024-07-25 23:11:40,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1582/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 8.369009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:40,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43709 samples/s/p 2:00:36 } +2024-07-25 23:11:43,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1584/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 8.363585e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:43,580 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43334 samples/s/p 2:00:38 } +2024-07-25 23:11:46,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1586/ 1625], loss: 1.240, per_step_time: 1476ms, lr: 8.358163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:46,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.41968 samples/s/p 2:00:53 } +2024-07-25 23:11:49,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1588/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 8.352746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:49,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43570 samples/s/p 2:00:29 } +2024-07-25 23:11:52,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1590/ 1625], loss: 1.150, per_step_time: 1472ms, lr: 8.347323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:52,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43350 samples/s/p 2:00:29 } +2024-07-25 23:11:55,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1592/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 8.3419045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:55,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43127 samples/s/p 2:00:29 } +2024-07-25 23:11:58,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1594/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 8.33649e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:58,347 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% 
|██████████████████████████████████ | 5.42999 samples/s/p 2:00:28 } +2024-07-25 23:12:01,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1596/ 1625], loss: 1.240, per_step_time: 1470ms, lr: 8.3310715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:01,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43967 samples/s/p 2:00:12 } +2024-07-25 23:12:04,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1598/ 1625], loss: 1.150, per_step_time: 1472ms, lr: 8.325661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:04,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43472 samples/s/p 2:00:15 } +2024-07-25 23:12:07,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1600/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 8.320248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:07,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43536 samples/s/p 2:00:12 } +2024-07-25 23:12:10,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1602/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 8.314836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:10,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43706 samples/s/p 2:00:06 } +2024-07-25 23:12:13,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1604/ 1625], loss: 1.067, per_step_time: 1470ms, lr: 8.3094255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:13,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43881 samples/s/p 2:00:01 } 
+2024-07-25 23:12:16,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1606/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 8.304017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:16,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43453 samples/s/p 2:00:04 } +2024-07-25 23:12:19,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1608/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 8.298609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:19,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43060 samples/s/p 2:00:06 } +2024-07-25 23:12:21,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1610/ 1625], loss: 0.941, per_step_time: 1471ms, lr: 8.293203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:21,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43658 samples/s/p 1:59:55 } +2024-07-25 23:12:24,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1612/ 1625], loss: 1.206, per_step_time: 1470ms, lr: 8.287798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:24,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43978 samples/s/p 1:59:48 } +2024-07-25 23:12:27,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1614/ 1625], loss: 1.266, per_step_time: 1476ms, lr: 8.282394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:27,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.41723 samples/s/p 2:00:15 } +2024-07-25 23:12:30,813 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1616/ 1625], loss: 1.116, per_step_time: 1473ms, lr: 8.276991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:30,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43091 samples/s/p 1:59:54 } +2024-07-25 23:12:33,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1618/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 8.271591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:33,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.43544 samples/s/p 1:59:45 } +2024-07-25 23:12:36,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1620/ 1625], loss: 1.401, per_step_time: 1471ms, lr: 8.266191e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:36,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.43759 samples/s/p 1:59:39 } +2024-07-25 23:12:39,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1622/ 1625], loss: 1.037, per_step_time: 1471ms, lr: 8.260793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:39,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.43797 samples/s/p 1:59:36 } +2024-07-25 23:12:42,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1624/ 1625], loss: 1.285, per_step_time: 1474ms, lr: 8.255394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:42,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.42391 samples/s/p 1:59:51 } +2024-07-25 23:12:45,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 1/ 1625], loss: 1.079, per_step_time: 1471ms, lr: 8.250003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:45,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.43760 samples/s/p 1:59:30 } +2024-07-25 23:12:48,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 3/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 8.244605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:48,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.43494 samples/s/p 1:59:31 } +2024-07-25 23:12:51,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 5/ 1625], loss: 1.005, per_step_time: 1472ms, lr: 8.239212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:51,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.43316 samples/s/p 1:59:30 } +2024-07-25 23:12:54,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 7/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 8.233824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:54,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.44008 samples/s/p 1:59:18 } +2024-07-25 23:12:57,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 9/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 8.2284305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:57,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43570 samples/s/p 1:59:21 } +2024-07-25 23:13:00,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 11/ 1625], loss: 1.278, per_step_time: 1470ms, lr: 
8.223042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:00,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43859 samples/s/p 1:59:14 } +2024-07-25 23:13:03,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 13/ 1625], loss: 1.318, per_step_time: 1471ms, lr: 8.217657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:03,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43774 samples/s/p 1:59:12 } +2024-07-25 23:13:06,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 15/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 8.212267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:06,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43552 samples/s/p 1:59:12 } +2024-07-25 23:13:09,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 17/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 8.2068855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:09,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43266 samples/s/p 1:59:13 } +2024-07-25 23:13:12,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 19/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 8.201501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:12,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43696 samples/s/p 1:59:05 } +2024-07-25 23:13:15,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 21/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 8.196116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:13:15,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.44044 samples/s/p 1:58:57 } +2024-07-25 23:13:18,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 23/ 1625], loss: 1.287, per_step_time: 1475ms, lr: 8.190739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:18,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.42277 samples/s/p 1:59:17 } +2024-07-25 23:13:20,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 25/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 8.185359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:20,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43435 samples/s/p 1:58:59 } +2024-07-25 23:13:23,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 27/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 8.179981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:23,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43835 samples/s/p 1:58:51 } +2024-07-25 23:13:26,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 29/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 8.174604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:26,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43742 samples/s/p 1:58:49 } +2024-07-25 23:13:29,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 31/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 8.169228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:29,829 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 70.2% |███████████████████████████████████ | 5.43173 samples/s/p 1:58:54 } +2024-07-25 23:13:32,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 33/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 8.163854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:32,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43659 samples/s/p 1:58:45 } +2024-07-25 23:13:35,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 35/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 8.158482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:35,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43409 samples/s/p 1:58:45 } +2024-07-25 23:13:38,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 37/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 8.153111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:38,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43655 samples/s/p 1:58:39 } +2024-07-25 23:13:41,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 39/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 8.14774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:41,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43549 samples/s/p 1:58:37 } +2024-07-25 23:13:44,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 41/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 8.1423705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:44,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43702 samples/s/p 
1:58:32 } +2024-07-25 23:13:47,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 43/ 1625], loss: 1.228, per_step_time: 1470ms, lr: 8.1370035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:47,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43877 samples/s/p 1:58:27 } +2024-07-25 23:13:50,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 45/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 8.13164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:50,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43683 samples/s/p 1:58:27 } +2024-07-25 23:13:53,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 47/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 8.126273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:53,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43481 samples/s/p 1:58:26 } +2024-07-25 23:13:56,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 49/ 1625], loss: 1.120, per_step_time: 1475ms, lr: 8.120909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:56,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.42258 samples/s/p 1:58:39 } +2024-07-25 23:13:59,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 51/ 1625], loss: 1.296, per_step_time: 1472ms, lr: 8.11555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:59,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43340 samples/s/p 1:58:22 } +2024-07-25 23:14:02,298 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 53/ 1625], loss: 1.118, per_step_time: 1475ms, lr: 8.110187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:02,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.42029 samples/s/p 1:58:36 } +2024-07-25 23:14:05,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 55/ 1625], loss: 1.382, per_step_time: 1471ms, lr: 8.104828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:05,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43619 samples/s/p 1:58:13 } +2024-07-25 23:14:08,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 57/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 8.099473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:08,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43312 samples/s/p 1:58:14 } +2024-07-25 23:14:11,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 59/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 8.094114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:11,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43782 samples/s/p 1:58:05 } +2024-07-25 23:14:14,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 61/ 1625], loss: 1.079, per_step_time: 1470ms, lr: 8.088761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:14,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43923 samples/s/p 1:58:00 } +2024-07-25 23:14:17,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
8/ 10], step:[ 63/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 8.083408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:17,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43896 samples/s/p 1:57:57 } +2024-07-25 23:14:19,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 65/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 8.078052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:19,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43385 samples/s/p 1:58:01 } +2024-07-25 23:14:22,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 67/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 8.072704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:22,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43908 samples/s/p 1:57:51 } +2024-07-25 23:14:25,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 69/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 8.067355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:25,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43202 samples/s/p 1:57:58 } +2024-07-25 23:14:28,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 71/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 8.062004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:28,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43986 samples/s/p 1:57:44 } +2024-07-25 23:14:31,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 73/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 
8.05666e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:31,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43215 samples/s/p 1:57:51 } +2024-07-25 23:14:34,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 75/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 8.051315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:34,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.43249 samples/s/p 1:57:48 } +2024-07-25 23:14:37,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 77/ 1625], loss: 0.892, per_step_time: 1470ms, lr: 8.0459695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:37,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.44034 samples/s/p 1:57:35 } +2024-07-25 23:14:40,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 79/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 8.040627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:40,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.42754 samples/s/p 1:57:49 } +2024-07-25 23:14:43,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 81/ 1625], loss: 1.188, per_step_time: 1475ms, lr: 8.035286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:43,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.42099 samples/s/p 1:57:54 } +2024-07-25 23:14:46,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 83/ 1625], loss: 0.976, per_step_time: 1473ms, lr: 8.029945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:14:46,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.42885 samples/s/p 1:57:41 } +2024-07-25 23:14:49,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 85/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 8.024606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:49,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.43280 samples/s/p 1:57:33 } +2024-07-25 23:14:52,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 87/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 8.019269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:52,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.43613 samples/s/p 1:57:26 } +2024-07-25 23:14:55,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 89/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 8.013937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:55,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.43505 samples/s/p 1:57:24 } +2024-07-25 23:14:58,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 91/ 1625], loss: 0.993, per_step_time: 1472ms, lr: 8.008599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:58,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43273 samples/s/p 1:57:24 } +2024-07-25 23:15:01,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 93/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 8.003266e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:01,325 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 70.6% |███████████████████████████████████ | 5.43517 samples/s/p 1:57:18 } +2024-07-25 23:15:04,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 95/ 1625], loss: 1.204, per_step_time: 1468ms, lr: 7.997937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:04,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.44737 samples/s/p 1:56:59 } +2024-07-25 23:15:07,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 97/ 1625], loss: 1.009, per_step_time: 1471ms, lr: 7.992605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:07,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43527 samples/s/p 1:57:12 } +2024-07-25 23:15:10,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 99/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 7.987275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:10,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43311 samples/s/p 1:57:12 } +2024-07-25 23:15:13,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 101/ 1625], loss: 0.903, per_step_time: 1473ms, lr: 7.981951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:13,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.42981 samples/s/p 1:57:13 } +2024-07-25 23:15:16,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 103/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 7.976621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:16,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43691 samples/s/p 
1:57:01 } +2024-07-25 23:15:19,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 105/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 7.9713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:19,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43420 samples/s/p 1:57:02 } +2024-07-25 23:15:21,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 107/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 7.965976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:21,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43771 samples/s/p 1:56:54 } +2024-07-25 23:15:24,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 109/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 7.960652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:24,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.42960 samples/s/p 1:57:02 } +2024-07-25 23:15:27,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 111/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 7.955334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:27,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.44033 samples/s/p 1:56:45 } +2024-07-25 23:15:30,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 113/ 1625], loss: 1.074, per_step_time: 1470ms, lr: 7.950014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:30,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43880 samples/s/p 1:56:44 } +2024-07-25 23:15:33,775 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 115/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 7.944696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:33,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43972 samples/s/p 1:56:40 } +2024-07-25 23:15:36,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 117/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 7.93938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:36,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43413 samples/s/p 1:56:44 } +2024-07-25 23:15:39,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 119/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 7.934065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:39,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43414 samples/s/p 1:56:41 } +2024-07-25 23:15:42,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 121/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 7.928752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:42,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.42795 samples/s/p 1:56:46 } +2024-07-25 23:15:45,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 123/ 1625], loss: 1.200, per_step_time: 1469ms, lr: 7.923439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:45,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.44307 samples/s/p 1:56:24 } +2024-07-25 23:15:48,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 125/ 1625], loss: 1.249, per_step_time: 1470ms, lr: 7.918128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:48,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.44060 samples/s/p 1:56:24 } +2024-07-25 23:15:51,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 127/ 1625], loss: 1.352, per_step_time: 1472ms, lr: 7.912819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:51,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43218 samples/s/p 1:56:32 } +2024-07-25 23:15:54,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 129/ 1625], loss: 1.101, per_step_time: 1473ms, lr: 7.907511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:54,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43083 samples/s/p 1:56:31 } +2024-07-25 23:15:57,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 131/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 7.902204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:57,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43081 samples/s/p 1:56:28 } +2024-07-25 23:16:00,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 133/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 7.8969015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:00,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43824 samples/s/p 1:56:15 } +2024-07-25 23:16:03,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 135/ 1625], loss: 1.298, per_step_time: 
1471ms, lr: 7.8915955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:03,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43765 samples/s/p 1:56:13 } +2024-07-25 23:16:06,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 137/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 7.886293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:06,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43801 samples/s/p 1:56:10 } +2024-07-25 23:16:09,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 139/ 1625], loss: 1.361, per_step_time: 1472ms, lr: 7.880994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:09,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43445 samples/s/p 1:56:11 } +2024-07-25 23:16:12,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 141/ 1625], loss: 0.940, per_step_time: 1471ms, lr: 7.875692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:12,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43511 samples/s/p 1:56:08 } +2024-07-25 23:16:15,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 143/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 7.870396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:15,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43968 samples/s/p 1:55:59 } +2024-07-25 23:16:18,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 145/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 7.8651e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:16:18,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.44049 samples/s/p 1:55:55 } +2024-07-25 23:16:20,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 147/ 1625], loss: 1.226, per_step_time: 1473ms, lr: 7.859801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:20,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.42818 samples/s/p 1:56:08 } +2024-07-25 23:16:23,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 149/ 1625], loss: 0.906, per_step_time: 1470ms, lr: 7.85451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:23,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43893 samples/s/p 1:55:51 } +2024-07-25 23:16:26,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 151/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 7.8492185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:26,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43685 samples/s/p 1:55:51 } +2024-07-25 23:16:29,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 153/ 1625], loss: 1.019, per_step_time: 1471ms, lr: 7.843923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:29,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43511 samples/s/p 1:55:50 } +2024-07-25 23:16:32,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 155/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 7.838637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:32,784 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43876 samples/s/p 1:55:42 } +2024-07-25 23:16:35,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 157/ 1625], loss: 1.018, per_step_time: 1472ms, lr: 7.833349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:35,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43362 samples/s/p 1:55:46 } +2024-07-25 23:16:38,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 159/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 7.828062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:38,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43809 samples/s/p 1:55:37 } +2024-07-25 23:16:41,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 161/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 7.822776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:41,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43728 samples/s/p 1:55:35 } +2024-07-25 23:16:44,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 163/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 7.817492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:44,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43368 samples/s/p 1:55:37 } +2024-07-25 23:16:47,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 165/ 1625], loss: 1.167, per_step_time: 1469ms, lr: 7.812209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:47,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% 
|███████████████████████████████████ | 5.44513 samples/s/p 1:55:19 } +2024-07-25 23:16:50,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 167/ 1625], loss: 1.229, per_step_time: 1470ms, lr: 7.806928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:50,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43919 samples/s/p 1:55:24 } +2024-07-25 23:16:53,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 169/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 7.801648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:53,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43071 samples/s/p 1:55:32 } +2024-07-25 23:16:56,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 171/ 1625], loss: 1.289, per_step_time: 1471ms, lr: 7.7963705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:56,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.43588 samples/s/p 1:55:22 } +2024-07-25 23:16:59,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 173/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 7.791093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:59,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.42946 samples/s/p 1:55:28 } +2024-07-25 23:17:02,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 175/ 1625], loss: 1.149, per_step_time: 1469ms, lr: 7.785818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:02,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.44239 samples/s/p 1:55:08 } 
+2024-07-25 23:17:05,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 177/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 7.780546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:05,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.44137 samples/s/p 1:55:07 } +2024-07-25 23:17:08,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 179/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 7.77527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:08,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.43886 samples/s/p 1:55:07 } +2024-07-25 23:17:11,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 181/ 1625], loss: 1.099, per_step_time: 1469ms, lr: 7.77e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:11,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.44231 samples/s/p 1:55:00 } +2024-07-25 23:17:14,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 183/ 1625], loss: 1.064, per_step_time: 1470ms, lr: 7.764732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:14,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.43925 samples/s/p 1:55:00 } +2024-07-25 23:17:17,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 185/ 1625], loss: 1.031, per_step_time: 1470ms, lr: 7.7594605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:17,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.44024 samples/s/p 1:54:56 } +2024-07-25 23:17:19,971 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 187/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 7.754196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:19,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.44118 samples/s/p 1:54:52 } +2024-07-25 23:17:22,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 189/ 1625], loss: 1.061, per_step_time: 1473ms, lr: 7.748931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:22,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.42988 samples/s/p 1:55:04 } +2024-07-25 23:17:25,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 191/ 1625], loss: 1.170, per_step_time: 1469ms, lr: 7.743663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:25,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.44433 samples/s/p 1:54:42 } +2024-07-25 23:17:28,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 193/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 7.738405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:28,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43139 samples/s/p 1:54:56 } +2024-07-25 23:17:31,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 195/ 1625], loss: 1.033, per_step_time: 1473ms, lr: 7.733143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:31,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43103 samples/s/p 1:54:53 } +2024-07-25 23:17:34,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 197/ 1625], loss: 1.219, per_step_time: 1473ms, lr: 7.72788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:34,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43108 samples/s/p 1:54:50 } +2024-07-25 23:17:37,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 199/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 7.722625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:37,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43734 samples/s/p 1:54:39 } +2024-07-25 23:17:40,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 201/ 1625], loss: 1.314, per_step_time: 1472ms, lr: 7.717367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:40,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43248 samples/s/p 1:54:43 } +2024-07-25 23:17:43,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 203/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 7.712112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:43,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43569 samples/s/p 1:54:36 } +2024-07-25 23:17:46,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 205/ 1625], loss: 0.943, per_step_time: 1471ms, lr: 7.706858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:46,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43574 samples/s/p 1:54:33 } +2024-07-25 23:17:49,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 207/ 1625], loss: 1.187, per_step_time: 1472ms, 
lr: 7.701605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:49,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43297 samples/s/p 1:54:33 } +2024-07-25 23:17:52,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 209/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 7.696354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:52,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.42929 samples/s/p 1:54:35 } +2024-07-25 23:17:55,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 211/ 1625], loss: 1.014, per_step_time: 1477ms, lr: 7.691104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:55,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.41304 samples/s/p 1:54:52 } +2024-07-25 23:17:58,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 213/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 7.685856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:58,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43340 samples/s/p 1:54:24 } +2024-07-25 23:18:01,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 215/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 7.680609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:01,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.44160 samples/s/p 1:54:10 } +2024-07-25 23:18:04,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 217/ 1625], loss: 1.063, per_step_time: 1472ms, lr: 7.675363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:18:04,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43448 samples/s/p 1:54:16 } +2024-07-25 23:18:07,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 219/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 7.67012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:07,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43437 samples/s/p 1:54:14 } +2024-07-25 23:18:10,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 221/ 1625], loss: 1.104, per_step_time: 1470ms, lr: 7.664877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:10,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.43899 samples/s/p 1:54:05 } +2024-07-25 23:18:13,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 223/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 7.659636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:13,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.42954 samples/s/p 1:54:14 } +2024-07-25 23:18:16,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 225/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 7.654396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:16,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.43946 samples/s/p 1:53:58 } +2024-07-25 23:18:19,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 227/ 1625], loss: 0.939, per_step_time: 1471ms, lr: 7.649158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:19,004 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 71.4% |███████████████████████████████████ | 5.43739 samples/s/p 1:53:58 } +2024-07-25 23:18:21,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 229/ 1625], loss: 0.986, per_step_time: 1482ms, lr: 7.643921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:21,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.39546 samples/s/p 1:54:48 } +2024-07-25 23:18:24,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 231/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 7.638689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:24,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.44057 samples/s/p 1:53:48 } +2024-07-25 23:18:27,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 233/ 1625], loss: 1.245, per_step_time: 1470ms, lr: 7.6334545e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:27,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.44119 samples/s/p 1:53:44 } +2024-07-25 23:18:30,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 235/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 7.628219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:30,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.43262 samples/s/p 1:53:52 } +2024-07-25 23:18:33,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 237/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 7.6229917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:33,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43596 
samples/s/p 1:53:45 } +2024-07-25 23:18:36,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 239/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 7.617762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:36,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43422 samples/s/p 1:53:44 } +2024-07-25 23:18:39,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 241/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 7.6125307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:39,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43188 samples/s/p 1:53:44 } +2024-07-25 23:18:42,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 243/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 7.607307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:42,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43286 samples/s/p 1:53:40 } +2024-07-25 23:18:45,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 245/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 7.602082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:45,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43259 samples/s/p 1:53:38 } +2024-07-25 23:18:48,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 247/ 1625], loss: 1.175, per_step_time: 1470ms, lr: 7.5968583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:48,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43927 samples/s/p 1:53:26 } +2024-07-25 23:18:51,478 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 249/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 7.5916355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:51,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.44074 samples/s/p 1:53:22 } +2024-07-25 23:18:54,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 251/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 7.586415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:54,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43750 samples/s/p 1:53:23 } +2024-07-25 23:18:57,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 253/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 7.581196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:57,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43639 samples/s/p 1:53:21 } +2024-07-25 23:19:00,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 255/ 1625], loss: 1.045, per_step_time: 1470ms, lr: 7.575978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:00,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.44080 samples/s/p 1:53:13 } +2024-07-25 23:19:03,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 257/ 1625], loss: 0.994, per_step_time: 1470ms, lr: 7.5707617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:03,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.44095 samples/s/p 1:53:09 } +2024-07-25 23:19:06,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 259/ 1625], loss: 1.027, per_step_time: 1473ms, lr: 7.5655466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:06,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43054 samples/s/p 1:53:20 } +2024-07-25 23:19:09,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 261/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 7.5603334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:09,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43498 samples/s/p 1:53:11 } +2024-07-25 23:19:12,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 263/ 1625], loss: 1.071, per_step_time: 1470ms, lr: 7.555121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:12,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43989 samples/s/p 1:53:02 } +2024-07-25 23:19:15,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 265/ 1625], loss: 1.027, per_step_time: 1470ms, lr: 7.54991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:15,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.44016 samples/s/p 1:52:59 } +2024-07-25 23:19:18,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 267/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 7.5447015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:18,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43483 samples/s/p 1:53:02 } +2024-07-25 23:19:20,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 269/ 1625], loss: 1.185, per_step_time: 
1472ms, lr: 7.5394933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:20,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43265 samples/s/p 1:53:02 } +2024-07-25 23:19:23,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 271/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 7.5342878e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:23,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43522 samples/s/p 1:52:56 } +2024-07-25 23:19:26,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 273/ 1625], loss: 1.193, per_step_time: 1471ms, lr: 7.529083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:26,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43548 samples/s/p 1:52:53 } +2024-07-25 23:19:29,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 275/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 7.5238827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:29,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43794 samples/s/p 1:52:47 } +2024-07-25 23:19:32,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 277/ 1625], loss: 1.230, per_step_time: 1470ms, lr: 7.518678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:32,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43896 samples/s/p 1:52:43 } +2024-07-25 23:19:35,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 279/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 7.513478e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:19:35,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43540 samples/s/p 1:52:44 } +2024-07-25 23:19:38,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 281/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 7.508282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:38,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43368 samples/s/p 1:52:43 } +2024-07-25 23:19:41,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 283/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 7.5030853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:41,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43765 samples/s/p 1:52:35 } +2024-07-25 23:19:44,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 285/ 1625], loss: 1.018, per_step_time: 1470ms, lr: 7.4978893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:44,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.43981 samples/s/p 1:52:30 } +2024-07-25 23:19:47,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 287/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 7.492694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:47,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.43854 samples/s/p 1:52:28 } +2024-07-25 23:19:50,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 289/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 7.4875015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:50,477 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.43331 samples/s/p 1:52:32 } +2024-07-25 23:19:53,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 291/ 1625], loss: 1.135, per_step_time: 1475ms, lr: 7.4823097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:53,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.42160 samples/s/p 1:52:44 } +2024-07-25 23:19:56,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 293/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 7.4771206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:56,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.43280 samples/s/p 1:52:27 } +2024-07-25 23:19:59,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 295/ 1625], loss: 1.119, per_step_time: 1470ms, lr: 7.471932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:59,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.44153 samples/s/p 1:52:13 } +2024-07-25 23:20:02,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 297/ 1625], loss: 1.064, per_step_time: 1473ms, lr: 7.4667446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:02,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.42814 samples/s/p 1:52:27 } +2024-07-25 23:20:05,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 299/ 1625], loss: 1.055, per_step_time: 1471ms, lr: 7.4615587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:05,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
71.8% |███████████████████████████████████ | 5.43810 samples/s/p 1:52:11 } +2024-07-25 23:20:08,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 301/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 7.456376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:08,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43539 samples/s/p 1:52:12 } +2024-07-25 23:20:11,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 303/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 7.4511927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:11,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43410 samples/s/p 1:52:10 } +2024-07-25 23:20:14,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 305/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 7.446012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:14,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43574 samples/s/p 1:52:05 } +2024-07-25 23:20:17,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 307/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 7.4408326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:17,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.42752 samples/s/p 1:52:13 } +2024-07-25 23:20:20,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 309/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 7.435654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:20,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.42831 samples/s/p 
1:52:09 } +2024-07-25 23:20:22,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 311/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 7.430478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:22,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43732 samples/s/p 1:51:55 } +2024-07-25 23:20:25,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 313/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 7.4253053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:25,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43817 samples/s/p 1:51:51 } +2024-07-25 23:20:28,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 315/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 7.4201294e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:28,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43919 samples/s/p 1:51:46 } +2024-07-25 23:20:31,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 317/ 1625], loss: 1.017, per_step_time: 1472ms, lr: 7.4149575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:31,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.43396 samples/s/p 1:51:50 } +2024-07-25 23:20:34,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 319/ 1625], loss: 0.999, per_step_time: 1469ms, lr: 7.4097893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:34,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.44292 samples/s/p 1:51:36 } +2024-07-25 23:20:37,700 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 321/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 7.4046175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:37,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.43035 samples/s/p 1:51:48 } +2024-07-25 23:20:40,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 323/ 1625], loss: 1.174, per_step_time: 1474ms, lr: 7.39945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:40,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.42549 samples/s/p 1:51:52 } +2024-07-25 23:20:43,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 325/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 7.394287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:43,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43451 samples/s/p 1:51:37 } +2024-07-25 23:20:46,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 327/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 7.389119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:46,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43636 samples/s/p 1:51:32 } +2024-07-25 23:20:49,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 329/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 7.3839587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:49,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43265 samples/s/p 1:51:34 } +2024-07-25 23:20:52,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 331/ 1625], loss: 0.983, per_step_time: 1472ms, lr: 7.3787974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:52,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43418 samples/s/p 1:51:29 } +2024-07-25 23:20:55,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 333/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 7.373637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:55,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43371 samples/s/p 1:51:27 } +2024-07-25 23:20:58,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 335/ 1625], loss: 1.035, per_step_time: 1472ms, lr: 7.368479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:58,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43409 samples/s/p 1:51:23 } +2024-07-25 23:21:01,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 337/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 7.363322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:01,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43973 samples/s/p 1:51:13 } +2024-07-25 23:21:04,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 339/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 7.3581655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:04,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43831 samples/s/p 1:51:12 } +2024-07-25 23:21:07,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 341/ 1625], loss: 1.095, per_step_time: 
1470ms, lr: 7.353012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:07,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43945 samples/s/p 1:51:08 } +2024-07-25 23:21:10,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 343/ 1625], loss: 1.290, per_step_time: 1473ms, lr: 7.347859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:10,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.42754 samples/s/p 1:51:20 } +2024-07-25 23:21:13,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 345/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 7.342708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:13,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43254 samples/s/p 1:51:10 } +2024-07-25 23:21:16,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 347/ 1625], loss: 1.077, per_step_time: 1469ms, lr: 7.337559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:16,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.44267 samples/s/p 1:50:55 } +2024-07-25 23:21:19,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 349/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 7.3324104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:19,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43369 samples/s/p 1:51:03 } +2024-07-25 23:21:21,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 351/ 1625], loss: 1.164, per_step_time: 1469ms, lr: 7.3272636e-06, overflow cond: False, loss_scale: 
1.0 +2024-07-25 23:21:21,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.44367 samples/s/p 1:50:48 } +2024-07-25 23:21:24,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 353/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 7.3221186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:24,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.43263 samples/s/p 1:50:59 } +2024-07-25 23:21:27,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 355/ 1625], loss: 1.153, per_step_time: 1470ms, lr: 7.3169754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:27,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.44176 samples/s/p 1:50:44 } +2024-07-25 23:21:30,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 357/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 7.311836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:30,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.43430 samples/s/p 1:50:51 } +2024-07-25 23:21:33,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 359/ 1625], loss: 1.053, per_step_time: 1476ms, lr: 7.3066926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:33,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.41978 samples/s/p 1:51:05 } +2024-07-25 23:21:36,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 361/ 1625], loss: 1.032, per_step_time: 1470ms, lr: 7.3015535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:36,718 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.44027 samples/s/p 1:50:37 } +2024-07-25 23:21:39,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 363/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 7.296419e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:39,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.43678 samples/s/p 1:50:39 } +2024-07-25 23:21:42,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 365/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 7.29128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:42,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.43643 samples/s/p 1:50:36 } +2024-07-25 23:21:45,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 367/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 7.2861453e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:45,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43848 samples/s/p 1:50:31 } +2024-07-25 23:21:48,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 369/ 1625], loss: 1.043, per_step_time: 1470ms, lr: 7.2810158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:48,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43981 samples/s/p 1:50:26 } +2024-07-25 23:21:51,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 371/ 1625], loss: 1.237, per_step_time: 1469ms, lr: 7.275881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:51,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
72.3% |████████████████████████████████████ | 5.44433 samples/s/p 1:50:18 } +2024-07-25 23:21:54,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 373/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 7.2707544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:54,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43472 samples/s/p 1:50:27 } +2024-07-25 23:21:57,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 375/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 7.2656258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:57,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43416 samples/s/p 1:50:24 } +2024-07-25 23:22:00,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 377/ 1625], loss: 1.169, per_step_time: 1469ms, lr: 7.2604957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:00,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.44231 samples/s/p 1:50:11 } +2024-07-25 23:22:03,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 379/ 1625], loss: 1.279, per_step_time: 1472ms, lr: 7.255374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:03,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43278 samples/s/p 1:50:20 } +2024-07-25 23:22:06,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 381/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 7.25025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:06,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43332 
samples/s/p 1:50:16 } +2024-07-25 23:22:09,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 383/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 7.245127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:09,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43652 samples/s/p 1:50:10 } +2024-07-25 23:22:12,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 385/ 1625], loss: 1.039, per_step_time: 1472ms, lr: 7.2400067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:12,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43269 samples/s/p 1:50:11 } +2024-07-25 23:22:15,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 387/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 7.2348876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:15,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43231 samples/s/p 1:50:09 } +2024-07-25 23:22:18,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 389/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 7.2297703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:18,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.44113 samples/s/p 1:49:55 } +2024-07-25 23:22:20,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 391/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 7.2246526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:20,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43780 samples/s/p 1:49:56 } +2024-07-25 23:22:23,922 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 393/ 1625], loss: 1.149, per_step_time: 1474ms, lr: 7.219539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:23,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.42716 samples/s/p 1:50:06 } +2024-07-25 23:22:26,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 395/ 1625], loss: 0.985, per_step_time: 1471ms, lr: 7.214425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:26,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43482 samples/s/p 1:49:54 } +2024-07-25 23:22:29,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 397/ 1625], loss: 1.323, per_step_time: 1471ms, lr: 7.209314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:29,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43705 samples/s/p 1:49:48 } +2024-07-25 23:22:32,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 399/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 7.2042035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:32,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43324 samples/s/p 1:49:50 } +2024-07-25 23:22:35,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 401/ 1625], loss: 1.206, per_step_time: 1474ms, lr: 7.199098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:35,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.42387 samples/s/p 1:49:58 } +2024-07-25 23:22:38,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 8/ 10], step:[ 403/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 7.1939876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:38,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43188 samples/s/p 1:49:46 } +2024-07-25 23:22:41,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 405/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 7.1888826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:41,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43832 samples/s/p 1:49:35 } +2024-07-25 23:22:44,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 407/ 1625], loss: 1.280, per_step_time: 1471ms, lr: 7.183781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:44,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43666 samples/s/p 1:49:34 } +2024-07-25 23:22:47,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 409/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 7.1786762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:47,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43146 samples/s/p 1:49:37 } +2024-07-25 23:22:50,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 411/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 7.1735753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:50,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43638 samples/s/p 1:49:29 } +2024-07-25 23:22:53,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 413/ 1625], loss: 1.243, 
per_step_time: 1470ms, lr: 7.168479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:53,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43912 samples/s/p 1:49:22 } +2024-07-25 23:22:56,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 415/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 7.163378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:56,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43675 samples/s/p 1:49:22 } +2024-07-25 23:22:59,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 417/ 1625], loss: 1.249, per_step_time: 1470ms, lr: 7.158285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:59,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43960 samples/s/p 1:49:16 } +2024-07-25 23:23:02,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 419/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 7.15319e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:02,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43347 samples/s/p 1:49:20 } +2024-07-25 23:23:05,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 421/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 7.148094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:05,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43474 samples/s/p 1:49:16 } +2024-07-25 23:23:08,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 423/ 1625], loss: 1.299, per_step_time: 1470ms, lr: 7.1430045e-06, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 23:23:08,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43931 samples/s/p 1:49:07 } +2024-07-25 23:23:11,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 425/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 7.137915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:11,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43998 samples/s/p 1:49:04 } +2024-07-25 23:23:14,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 427/ 1625], loss: 1.171, per_step_time: 1470ms, lr: 7.1328236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:14,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43852 samples/s/p 1:49:02 } +2024-07-25 23:23:17,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 429/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 7.127739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:17,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43800 samples/s/p 1:49:00 } +2024-07-25 23:23:19,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 431/ 1625], loss: 1.294, per_step_time: 1473ms, lr: 7.1226536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:19,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.42975 samples/s/p 1:49:07 } +2024-07-25 23:23:22,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 433/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 7.117569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:22,933 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.43665 samples/s/p 1:48:56 } +2024-07-25 23:23:25,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 435/ 1625], loss: 1.017, per_step_time: 1471ms, lr: 7.1124873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:25,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.43798 samples/s/p 1:48:51 } +2024-07-25 23:23:28,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 437/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 7.1074064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:28,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.43766 samples/s/p 1:48:49 } +2024-07-25 23:23:31,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 439/ 1625], loss: 1.191, per_step_time: 1470ms, lr: 7.102327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:31,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.44191 samples/s/p 1:48:41 } +2024-07-25 23:23:34,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 441/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 7.097249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:34,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.43542 samples/s/p 1:48:46 } +2024-07-25 23:23:37,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 443/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 7.092173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:37,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 72.7% |████████████████████████████████████ | 5.43577 samples/s/p 1:48:42 } +2024-07-25 23:23:40,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 445/ 1625], loss: 1.092, per_step_time: 1473ms, lr: 7.087101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:40,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.42951 samples/s/p 1:48:47 } +2024-07-25 23:23:43,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 447/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 7.082025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:43,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43575 samples/s/p 1:48:36 } +2024-07-25 23:23:46,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 449/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 7.076954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:46,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43804 samples/s/p 1:48:31 } +2024-07-25 23:23:49,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 451/ 1625], loss: 1.398, per_step_time: 1472ms, lr: 7.0718866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:49,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43312 samples/s/p 1:48:34 } +2024-07-25 23:23:52,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 453/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 7.066815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:52,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43463 
samples/s/p 1:48:29 } +2024-07-25 23:23:55,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 455/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 7.061751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:55,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43562 samples/s/p 1:48:25 } +2024-07-25 23:23:58,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 457/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 7.0566857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:58,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43718 samples/s/p 1:48:20 } +2024-07-25 23:24:01,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 459/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 7.0516194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:01,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43369 samples/s/p 1:48:21 } +2024-07-25 23:24:04,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 461/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 7.0465603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:04,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43375 samples/s/p 1:48:18 } +2024-07-25 23:24:07,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 463/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 7.0415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:07,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43966 samples/s/p 1:48:08 } +2024-07-25 23:24:10,136 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 465/ 1625], loss: 1.064, per_step_time: 1470ms, lr: 7.0364367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:10,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43936 samples/s/p 1:48:06 } +2024-07-25 23:24:13,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 467/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 7.0313827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:13,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43479 samples/s/p 1:48:08 } +2024-07-25 23:24:16,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 469/ 1625], loss: 1.008, per_step_time: 1473ms, lr: 7.026327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:16,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43027 samples/s/p 1:48:11 } +2024-07-25 23:24:18,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 471/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 7.0212723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:18,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43452 samples/s/p 1:48:03 } +2024-07-25 23:24:21,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 473/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 7.016219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:21,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43571 samples/s/p 1:47:58 } +2024-07-25 23:24:24,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 8/ 10], step:[ 475/ 1625], loss: 1.131, per_step_time: 1470ms, lr: 7.0111682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:24,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43874 samples/s/p 1:47:52 } +2024-07-25 23:24:27,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 477/ 1625], loss: 1.088, per_step_time: 1472ms, lr: 7.0061183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:27,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43138 samples/s/p 1:47:57 } +2024-07-25 23:24:30,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 479/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 7.00107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:30,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43279 samples/s/p 1:47:53 } +2024-07-25 23:24:33,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 481/ 1625], loss: 1.001, per_step_time: 1472ms, lr: 6.996024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:33,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43285 samples/s/p 1:47:50 } +2024-07-25 23:24:36,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 483/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 6.9909815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:36,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43102 samples/s/p 1:47:49 } +2024-07-25 23:24:39,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 485/ 1625], loss: 1.283, 
per_step_time: 1473ms, lr: 6.985936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:39,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.42744 samples/s/p 1:47:50 } +2024-07-25 23:24:42,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 487/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 6.980893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:42,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43456 samples/s/p 1:47:39 } +2024-07-25 23:24:45,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 489/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 6.975856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:45,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43539 samples/s/p 1:47:35 } +2024-07-25 23:24:48,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 491/ 1625], loss: 1.066, per_step_time: 1473ms, lr: 6.970814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:48,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.42816 samples/s/p 1:47:41 } +2024-07-25 23:24:51,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 493/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 6.965778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:51,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43455 samples/s/p 1:47:30 } +2024-07-25 23:24:54,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 495/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 6.9607454e-06, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 23:24:54,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43009 samples/s/p 1:47:32 } +2024-07-25 23:24:57,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 497/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 6.955708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:57,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43186 samples/s/p 1:47:27 } +2024-07-25 23:25:00,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 499/ 1625], loss: 1.284, per_step_time: 1470ms, lr: 6.950678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:00,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43955 samples/s/p 1:47:15 } +2024-07-25 23:25:03,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 501/ 1625], loss: 0.971, per_step_time: 1472ms, lr: 6.9456473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:03,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43242 samples/s/p 1:47:21 } +2024-07-25 23:25:06,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 503/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 6.9406155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:06,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43130 samples/s/p 1:47:19 } +2024-07-25 23:25:09,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 505/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 6.9355906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:09,175 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43941 samples/s/p 1:47:07 } +2024-07-25 23:25:12,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 507/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 6.9305643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:12,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43356 samples/s/p 1:47:11 } +2024-07-25 23:25:15,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 509/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 6.9255375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:15,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43966 samples/s/p 1:47:00 } +2024-07-25 23:25:18,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 511/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 6.920517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:18,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43585 samples/s/p 1:47:02 } +2024-07-25 23:25:20,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 513/ 1625], loss: 1.141, per_step_time: 1477ms, lr: 6.9154958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:20,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.41610 samples/s/p 1:47:23 } +2024-07-25 23:25:23,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 515/ 1625], loss: 1.279, per_step_time: 1472ms, lr: 6.910476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:23,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 73.2% |████████████████████████████████████ | 5.43210 samples/s/p 1:47:01 } +2024-07-25 23:25:26,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 517/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 6.905458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:26,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43138 samples/s/p 1:46:58 } +2024-07-25 23:25:29,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 519/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 6.900441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:29,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43731 samples/s/p 1:46:49 } +2024-07-25 23:25:32,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 521/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 6.8954255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:32,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43983 samples/s/p 1:46:43 } +2024-07-25 23:25:35,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 523/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 6.890413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:35,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43054 samples/s/p 1:46:51 } +2024-07-25 23:25:38,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 525/ 1625], loss: 1.388, per_step_time: 1472ms, lr: 6.885401e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:38,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43258 
samples/s/p 1:46:45 } +2024-07-25 23:25:41,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 527/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 6.880391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:41,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43156 samples/s/p 1:46:44 } +2024-07-25 23:25:44,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 529/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 6.8753825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:44,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43547 samples/s/p 1:46:36 } +2024-07-25 23:25:47,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 531/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 6.870375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:47,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43192 samples/s/p 1:46:37 } +2024-07-25 23:25:50,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 533/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 6.8653726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:50,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43446 samples/s/p 1:46:31 } +2024-07-25 23:25:53,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 535/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 6.860366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:53,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43610 samples/s/p 1:46:26 } +2024-07-25 23:25:56,406 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 537/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 6.8553636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:56,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43598 samples/s/p 1:46:24 } +2024-07-25 23:25:59,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 539/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 6.8503664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:59,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43308 samples/s/p 1:46:24 } +2024-07-25 23:26:02,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 541/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 6.8453637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:02,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43942 samples/s/p 1:46:14 } +2024-07-25 23:26:05,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 543/ 1625], loss: 1.019, per_step_time: 1470ms, lr: 6.840369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:05,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43923 samples/s/p 1:46:11 } +2024-07-25 23:26:08,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 545/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 6.835374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:08,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43596 samples/s/p 1:46:12 } +2024-07-25 23:26:11,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 8/ 10], step:[ 547/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 6.8303757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:11,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43216 samples/s/p 1:46:13 } +2024-07-25 23:26:14,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 549/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 6.825386e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:14,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43673 samples/s/p 1:46:05 } +2024-07-25 23:26:17,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 551/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 6.8203954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:17,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43582 samples/s/p 1:46:03 } +2024-07-25 23:26:20,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 553/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 6.815403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:20,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43230 samples/s/p 1:46:04 } +2024-07-25 23:26:22,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 555/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 6.810418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:22,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43662 samples/s/p 1:45:56 } +2024-07-25 23:26:25,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 557/ 1625], loss: 1.147, 
per_step_time: 1470ms, lr: 6.8054314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:25,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43979 samples/s/p 1:45:50 } +2024-07-25 23:26:28,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 559/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 6.800447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:28,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43237 samples/s/p 1:45:55 } +2024-07-25 23:26:31,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 561/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 6.795464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:31,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.42943 samples/s/p 1:45:56 } +2024-07-25 23:26:34,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 563/ 1625], loss: 1.001, per_step_time: 1472ms, lr: 6.790483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:34,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43441 samples/s/p 1:45:47 } +2024-07-25 23:26:37,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 565/ 1625], loss: 1.010, per_step_time: 1472ms, lr: 6.785503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:37,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43454 samples/s/p 1:45:44 } +2024-07-25 23:26:40,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 567/ 1625], loss: 1.275, per_step_time: 1473ms, lr: 6.780525e-06, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 23:26:40,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43078 samples/s/p 1:45:46 } +2024-07-25 23:26:43,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 569/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 6.7755473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:43,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43309 samples/s/p 1:45:40 } +2024-07-25 23:26:46,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 571/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 6.770573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:46,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43357 samples/s/p 1:45:36 } +2024-07-25 23:26:49,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 573/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 6.7655997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:49,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43493 samples/s/p 1:45:32 } +2024-07-25 23:26:52,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 575/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 6.7606275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:52,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43553 samples/s/p 1:45:28 } +2024-07-25 23:26:55,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 577/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 6.755657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:55,430 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43453 samples/s/p 1:45:26 } +2024-07-25 23:26:58,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 579/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 6.7506894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:58,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43502 samples/s/p 1:45:23 } +2024-07-25 23:27:01,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 581/ 1625], loss: 1.042, per_step_time: 1473ms, lr: 6.7457217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:01,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43015 samples/s/p 1:45:26 } +2024-07-25 23:27:04,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 583/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 6.74076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:04,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.42919 samples/s/p 1:45:24 } +2024-07-25 23:27:07,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 585/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 6.735793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:07,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43471 samples/s/p 1:45:14 } +2024-07-25 23:27:10,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 587/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 6.730834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:10,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
73.6% |████████████████████████████████████ | 5.43508 samples/s/p 1:45:11 } +2024-07-25 23:27:13,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 589/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 6.725873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:13,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43200 samples/s/p 1:45:12 } +2024-07-25 23:27:16,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 591/ 1625], loss: 1.129, per_step_time: 1482ms, lr: 6.720911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:16,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.39653 samples/s/p 1:45:50 } +2024-07-25 23:27:19,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 593/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 6.715957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:19,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43468 samples/s/p 1:45:03 } +2024-07-25 23:27:22,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 595/ 1625], loss: 0.980, per_step_time: 1471ms, lr: 6.7110013e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:22,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43604 samples/s/p 1:44:58 } +2024-07-25 23:27:24,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 597/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 6.7060473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:24,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43410 
samples/s/p 1:44:58 } +2024-07-25 23:27:27,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 599/ 1625], loss: 1.117, per_step_time: 1470ms, lr: 6.701095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:27,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.44031 samples/s/p 1:44:47 } +2024-07-25 23:27:30,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 601/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 6.6961447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:30,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43808 samples/s/p 1:44:47 } +2024-07-25 23:27:33,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 603/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 6.691195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:33,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43871 samples/s/p 1:44:43 } +2024-07-25 23:27:36,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 605/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 6.686248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:36,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43646 samples/s/p 1:44:43 } +2024-07-25 23:27:39,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 607/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 6.681302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:39,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43662 samples/s/p 1:44:40 } +2024-07-25 23:27:42,669 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 609/ 1625], loss: 1.108, per_step_time: 1474ms, lr: 6.6763573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:42,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.42560 samples/s/p 1:44:50 } +2024-07-25 23:27:45,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 611/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 6.6714156e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:45,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.44043 samples/s/p 1:44:30 } +2024-07-25 23:27:48,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 613/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 6.6664743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:48,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43690 samples/s/p 1:44:31 } +2024-07-25 23:27:51,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 615/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 6.661535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:51,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43726 samples/s/p 1:44:27 } +2024-07-25 23:27:54,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 617/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 6.6565976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:54,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43496 samples/s/p 1:44:27 } +2024-07-25 23:27:57,420 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 8/ 10], step:[ 619/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 6.651661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:57,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43196 samples/s/p 1:44:28 } +2024-07-25 23:28:00,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 621/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 6.646727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:00,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43354 samples/s/p 1:44:23 } +2024-07-25 23:28:03,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 623/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 6.6417933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:03,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43438 samples/s/p 1:44:19 } +2024-07-25 23:28:06,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 625/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 6.6368652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:06,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43791 samples/s/p 1:44:12 } +2024-07-25 23:28:09,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 627/ 1625], loss: 1.269, per_step_time: 1475ms, lr: 6.631933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:09,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.42367 samples/s/p 1:44:25 } +2024-07-25 23:28:12,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 629/ 1625], loss: 1.024, 
per_step_time: 1471ms, lr: 6.627005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:12,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43776 samples/s/p 1:44:06 } +2024-07-25 23:28:15,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 631/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 6.6220814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:15,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43655 samples/s/p 1:44:05 } +2024-07-25 23:28:18,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 633/ 1625], loss: 1.245, per_step_time: 1473ms, lr: 6.6171565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:18,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.42889 samples/s/p 1:44:11 } +2024-07-25 23:28:21,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 635/ 1625], loss: 1.020, per_step_time: 1472ms, lr: 6.612231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:21,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43375 samples/s/p 1:44:02 } +2024-07-25 23:28:23,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 637/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 6.6073126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:23,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43464 samples/s/p 1:43:58 } +2024-07-25 23:28:26,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 639/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 6.602392e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 23:28:26,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43601 samples/s/p 1:43:53 } +2024-07-25 23:28:29,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 641/ 1625], loss: 1.117, per_step_time: 1473ms, lr: 6.5974746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:29,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.42952 samples/s/p 1:43:58 } +2024-07-25 23:28:32,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 643/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 6.592558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:32,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.42925 samples/s/p 1:43:55 } +2024-07-25 23:28:35,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 645/ 1625], loss: 0.951, per_step_time: 1473ms, lr: 6.587644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:35,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.43076 samples/s/p 1:43:51 } +2024-07-25 23:28:38,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 647/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 6.5827303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:38,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.43499 samples/s/p 1:43:43 } +2024-07-25 23:28:41,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 649/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 6.5778186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:41,699 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.43505 samples/s/p 1:43:40 } +2024-07-25 23:28:44,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 651/ 1625], loss: 1.034, per_step_time: 1473ms, lr: 6.5729087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:44,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.43052 samples/s/p 1:43:42 } +2024-07-25 23:28:47,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 653/ 1625], loss: 1.045, per_step_time: 1471ms, lr: 6.5680006e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:47,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.43702 samples/s/p 1:43:32 } +2024-07-25 23:28:50,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 655/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 6.5630943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:50,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.43949 samples/s/p 1:43:26 } +2024-07-25 23:28:53,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 657/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 6.5581894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:53,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.43704 samples/s/p 1:43:26 } +2024-07-25 23:28:56,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 659/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 6.5532854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:56,451 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 74.1% |█████████████████████████████████████ | 5.43559 samples/s/p 1:43:25 } +2024-07-25 23:28:59,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 661/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 6.548384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:59,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43214 samples/s/p 1:43:26 } +2024-07-25 23:29:02,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 663/ 1625], loss: 1.387, per_step_time: 1473ms, lr: 6.543484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:02,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.42893 samples/s/p 1:43:26 } +2024-07-25 23:29:05,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 665/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 6.538586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:05,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43376 samples/s/p 1:43:18 } +2024-07-25 23:29:08,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 667/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 6.533689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:08,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43204 samples/s/p 1:43:17 } +2024-07-25 23:29:11,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 669/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 6.5287973e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:11,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 
5.43611 samples/s/p 1:43:09 } +2024-07-25 23:29:14,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 671/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 6.5239014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:14,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43443 samples/s/p 1:43:08 } +2024-07-25 23:29:17,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 673/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 6.5190097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:17,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43112 samples/s/p 1:43:09 } +2024-07-25 23:29:20,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 675/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 6.514122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:20,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43679 samples/s/p 1:43:00 } +2024-07-25 23:29:23,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 677/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 6.5092313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:23,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43678 samples/s/p 1:42:57 } +2024-07-25 23:29:25,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 679/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 6.5043446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:25,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43617 samples/s/p 1:42:54 } +2024-07-25 23:29:28,918 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 681/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 6.4994624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:28,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43257 samples/s/p 1:42:56 } +2024-07-25 23:29:31,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 683/ 1625], loss: 1.231, per_step_time: 1469ms, lr: 6.4945793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:31,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.44286 samples/s/p 1:42:41 } +2024-07-25 23:29:34,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 685/ 1625], loss: 1.049, per_step_time: 1472ms, lr: 6.489697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:34,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43128 samples/s/p 1:42:51 } +2024-07-25 23:29:37,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 687/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 6.4848173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:37,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43294 samples/s/p 1:42:46 } +2024-07-25 23:29:40,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 689/ 1625], loss: 1.051, per_step_time: 1470ms, lr: 6.4799387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:40,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.44091 samples/s/p 1:42:34 } +2024-07-25 23:29:43,665 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 691/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 6.4750616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:43,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.44015 samples/s/p 1:42:32 } +2024-07-25 23:29:46,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 693/ 1625], loss: 1.130, per_step_time: 1470ms, lr: 6.470187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:46,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.44157 samples/s/p 1:42:28 } +2024-07-25 23:29:49,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 695/ 1625], loss: 1.346, per_step_time: 1472ms, lr: 6.4653136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:49,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.43361 samples/s/p 1:42:34 } +2024-07-25 23:29:52,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 697/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 6.4604415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:52,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.42870 samples/s/p 1:42:36 } +2024-07-25 23:29:55,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 699/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 6.4555716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:55,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.43396 samples/s/p 1:42:28 } +2024-07-25 23:29:58,421 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 8/ 10], step:[ 701/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 6.450704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:58,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.43576 samples/s/p 1:42:23 } +2024-07-25 23:30:01,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 703/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 6.4458363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:01,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.42832 samples/s/p 1:42:28 } +2024-07-25 23:30:04,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 705/ 1625], loss: 1.295, per_step_time: 1473ms, lr: 6.4409714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:04,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.42807 samples/s/p 1:42:25 } +2024-07-25 23:30:07,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 707/ 1625], loss: 1.114, per_step_time: 1473ms, lr: 6.4361084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:07,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.42864 samples/s/p 1:42:22 } +2024-07-25 23:30:10,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 709/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 6.4312467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:10,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43681 samples/s/p 1:42:10 } +2024-07-25 23:30:13,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 711/ 1625], loss: 
1.177, per_step_time: 1470ms, lr: 6.426387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:13,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.44199 samples/s/p 1:42:01 } +2024-07-25 23:30:16,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 713/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 6.4215315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:16,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43539 samples/s/p 1:42:05 } +2024-07-25 23:30:19,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 715/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 6.4166716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:19,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43399 samples/s/p 1:42:04 } +2024-07-25 23:30:22,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 717/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 6.4118162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:22,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43612 samples/s/p 1:41:59 } +2024-07-25 23:30:24,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 719/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 6.406966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:24,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43376 samples/s/p 1:41:58 } +2024-07-25 23:30:27,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 721/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 6.4021115e-06, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:27,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.42900 samples/s/p 1:42:01 } +2024-07-25 23:30:30,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 723/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 6.397261e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:30,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43431 samples/s/p 1:41:52 } +2024-07-25 23:30:33,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 725/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 6.3924163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:33,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43517 samples/s/p 1:41:48 } +2024-07-25 23:30:36,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 727/ 1625], loss: 1.198, per_step_time: 1473ms, lr: 6.387567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:36,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43106 samples/s/p 1:41:50 } +2024-07-25 23:30:39,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 729/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 6.382725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:39,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43385 samples/s/p 1:41:43 } +2024-07-25 23:30:42,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 731/ 1625], loss: 1.114, per_step_time: 1473ms, lr: 6.3778816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:30:42,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43062 samples/s/p 1:41:44 } +2024-07-25 23:30:45,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 733/ 1625], loss: 1.059, per_step_time: 1469ms, lr: 6.373039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:45,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.44359 samples/s/p 1:41:27 } +2024-07-25 23:30:48,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 735/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 6.3682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:48,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43682 samples/s/p 1:41:31 } +2024-07-25 23:30:51,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 737/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 6.363362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:51,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43658 samples/s/p 1:41:29 } +2024-07-25 23:30:54,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 739/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 6.358525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:54,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43756 samples/s/p 1:41:25 } +2024-07-25 23:30:57,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 741/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 6.353691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:57,445 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43766 samples/s/p 1:41:22 } +2024-07-25 23:31:00,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 743/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 6.348857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:00,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43507 samples/s/p 1:41:21 } +2024-07-25 23:31:03,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 745/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 6.3440257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:03,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43671 samples/s/p 1:41:17 } +2024-07-25 23:31:06,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 747/ 1625], loss: 1.055, per_step_time: 1471ms, lr: 6.3391963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:06,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43843 samples/s/p 1:41:12 } +2024-07-25 23:31:09,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 749/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 6.334368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:09,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43775 samples/s/p 1:41:10 } +2024-07-25 23:31:12,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 751/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 6.3295415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:12,194 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 74.6% |█████████████████████████████████████ | 5.43704 samples/s/p 1:41:08 } +2024-07-25 23:31:15,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 753/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 6.324717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:15,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43525 samples/s/p 1:41:07 } +2024-07-25 23:31:18,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 755/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 6.3198936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:18,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43435 samples/s/p 1:41:05 } +2024-07-25 23:31:21,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 757/ 1625], loss: 1.036, per_step_time: 1470ms, lr: 6.3150756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:21,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43880 samples/s/p 1:40:57 } +2024-07-25 23:31:23,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 759/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 6.3102534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:23,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43576 samples/s/p 1:40:57 } +2024-07-25 23:31:26,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 761/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 6.3054354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:26,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 
5.43868 samples/s/p 1:40:51 } +2024-07-25 23:31:29,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 763/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 6.3006214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:29,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43337 samples/s/p 1:40:54 } +2024-07-25 23:31:32,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 765/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 6.295804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:32,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43436 samples/s/p 1:40:50 } +2024-07-25 23:31:35,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 767/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 6.2909953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:35,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43636 samples/s/p 1:40:45 } +2024-07-25 23:31:38,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 769/ 1625], loss: 1.059, per_step_time: 1475ms, lr: 6.2861827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:38,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.42272 samples/s/p 1:40:57 } +2024-07-25 23:31:41,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 771/ 1625], loss: 1.341, per_step_time: 1471ms, lr: 6.2813715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:41,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43561 samples/s/p 1:40:40 } +2024-07-25 23:31:44,655 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 773/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 6.276566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:44,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43570 samples/s/p 1:40:37 } +2024-07-25 23:31:47,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 775/ 1625], loss: 0.939, per_step_time: 1470ms, lr: 6.27176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:47,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.44046 samples/s/p 1:40:28 } +2024-07-25 23:31:50,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 777/ 1625], loss: 1.034, per_step_time: 1472ms, lr: 6.2669537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:50,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43381 samples/s/p 1:40:33 } +2024-07-25 23:31:53,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 779/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 6.262154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:53,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43146 samples/s/p 1:40:32 } +2024-07-25 23:31:56,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 781/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 6.2573527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:56,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43443 samples/s/p 1:40:26 } +2024-07-25 23:31:59,403 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 8/ 10], step:[ 783/ 1625], loss: 1.039, per_step_time: 1468ms, lr: 6.2525532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:59,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.44626 samples/s/p 1:40:10 } +2024-07-25 23:32:02,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 785/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 6.2477557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:02,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43617 samples/s/p 1:40:18 } +2024-07-25 23:32:05,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 787/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 6.24296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:05,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43421 samples/s/p 1:40:18 } +2024-07-25 23:32:08,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 789/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 6.238167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:08,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43626 samples/s/p 1:40:12 } +2024-07-25 23:32:11,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 791/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 6.2333734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:11,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43600 samples/s/p 1:40:10 } +2024-07-25 23:32:14,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 793/ 1625], loss: 1.232, 
per_step_time: 1472ms, lr: 6.228583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:14,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43279 samples/s/p 1:40:10 } +2024-07-25 23:32:17,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 795/ 1625], loss: 0.987, per_step_time: 1470ms, lr: 6.2237973e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:17,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43965 samples/s/p 1:40:00 } +2024-07-25 23:32:20,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 797/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 6.219008e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:20,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43002 samples/s/p 1:40:08 } +2024-07-25 23:32:23,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 799/ 1625], loss: 1.374, per_step_time: 1471ms, lr: 6.214222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:23,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43846 samples/s/p 1:39:55 } +2024-07-25 23:32:25,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 801/ 1625], loss: 1.252, per_step_time: 1470ms, lr: 6.2094405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:25,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43949 samples/s/p 1:39:51 } +2024-07-25 23:32:28,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 803/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 6.2046556e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 23:32:28,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.42875 samples/s/p 1:40:00 } +2024-07-25 23:32:31,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 805/ 1625], loss: 1.395, per_step_time: 1471ms, lr: 6.1998753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:31,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43654 samples/s/p 1:39:49 } +2024-07-25 23:32:34,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 807/ 1625], loss: 1.243, per_step_time: 1474ms, lr: 6.1950996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:34,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.42647 samples/s/p 1:39:57 } +2024-07-25 23:32:37,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 809/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 6.19032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:37,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43893 samples/s/p 1:39:40 } +2024-07-25 23:32:40,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 811/ 1625], loss: 0.945, per_step_time: 1472ms, lr: 6.1855476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:40,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43250 samples/s/p 1:39:44 } +2024-07-25 23:32:43,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 813/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 6.180774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:43,667 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43690 samples/s/p 1:39:36 } +2024-07-25 23:32:46,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 815/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 6.1759993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:46,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43283 samples/s/p 1:39:38 } +2024-07-25 23:32:49,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 817/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 6.1712317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:49,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43554 samples/s/p 1:39:32 } +2024-07-25 23:32:52,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 819/ 1625], loss: 1.368, per_step_time: 1471ms, lr: 6.1664637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:52,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43767 samples/s/p 1:39:27 } +2024-07-25 23:32:55,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 821/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 6.1616947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:55,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.43797 samples/s/p 1:39:23 } +2024-07-25 23:32:58,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 823/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 6.1569326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:58,417 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 75.1% |█████████████████████████████████████ | 5.43710 samples/s/p 1:39:21 } +2024-07-25 23:33:01,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 825/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 6.1521696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:01,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.43803 samples/s/p 1:39:18 } +2024-07-25 23:33:04,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 827/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 6.1474075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:04,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.43363 samples/s/p 1:39:19 } +2024-07-25 23:33:07,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 829/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 6.142649e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:07,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.43262 samples/s/p 1:39:18 } +2024-07-25 23:33:10,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 831/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 6.13789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:10,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.43626 samples/s/p 1:39:11 } +2024-07-25 23:33:13,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 833/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 6.1331343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:13,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 
5.43168 samples/s/p 1:39:13 } +2024-07-25 23:33:16,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 835/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 6.128379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:16,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.44093 samples/s/p 1:39:00 } +2024-07-25 23:33:19,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 837/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 6.1236265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:19,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43555 samples/s/p 1:39:03 } +2024-07-25 23:33:22,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 839/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 6.118878e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:22,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43559 samples/s/p 1:39:00 } +2024-07-25 23:33:24,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 841/ 1625], loss: 1.097, per_step_time: 1473ms, lr: 6.1141263e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:24,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43042 samples/s/p 1:39:02 } +2024-07-25 23:33:27,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 843/ 1625], loss: 0.900, per_step_time: 1471ms, lr: 6.109379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:27,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43486 samples/s/p 1:38:55 } +2024-07-25 23:33:30,876 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 845/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 6.1046358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:30,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43447 samples/s/p 1:38:52 } +2024-07-25 23:33:33,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 847/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 6.099888e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:33,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43149 samples/s/p 1:38:52 } +2024-07-25 23:33:36,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 849/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 6.095147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:36,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43231 samples/s/p 1:38:48 } +2024-07-25 23:33:39,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 851/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 6.090408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:39,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43650 samples/s/p 1:38:41 } +2024-07-25 23:33:42,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 853/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 6.085667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:42,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.44195 samples/s/p 1:38:32 } +2024-07-25 23:33:45,628 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 8/ 10], step:[ 855/ 1625], loss: 1.099, per_step_time: 1470ms, lr: 6.0809325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:45,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43898 samples/s/p 1:38:32 } +2024-07-25 23:33:48,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 857/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 6.076197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:48,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43561 samples/s/p 1:38:33 } +2024-07-25 23:33:51,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 859/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 6.071461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:51,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43836 samples/s/p 1:38:27 } +2024-07-25 23:33:54,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 861/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 6.0667317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:54,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43266 samples/s/p 1:38:30 } +2024-07-25 23:33:57,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 863/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 6.0620005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:57,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43541 samples/s/p 1:38:24 } +2024-07-25 23:34:00,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 865/ 1625], loss: 1.108, 
per_step_time: 1471ms, lr: 6.0572706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:00,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43609 samples/s/p 1:38:21 } +2024-07-25 23:34:03,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 867/ 1625], loss: 1.016, per_step_time: 1470ms, lr: 6.0525454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:03,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.44209 samples/s/p 1:38:11 } +2024-07-25 23:34:06,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 869/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 6.0478205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:06,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43720 samples/s/p 1:38:14 } +2024-07-25 23:34:09,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 871/ 1625], loss: 1.103, per_step_time: 1470ms, lr: 6.0430975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:09,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43924 samples/s/p 1:38:09 } +2024-07-25 23:34:12,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 873/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 6.038376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:12,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43591 samples/s/p 1:38:09 } +2024-07-25 23:34:15,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 875/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 6.033657e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 23:34:15,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43356 samples/s/p 1:38:09 } +2024-07-25 23:34:18,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 877/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 6.028938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:18,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43570 samples/s/p 1:38:04 } +2024-07-25 23:34:21,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 879/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 6.024223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:21,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43456 samples/s/p 1:38:02 } +2024-07-25 23:34:23,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 881/ 1625], loss: 0.951, per_step_time: 1471ms, lr: 6.019508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:23,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43584 samples/s/p 1:37:58 } +2024-07-25 23:34:26,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 883/ 1625], loss: 0.990, per_step_time: 1469ms, lr: 6.0147977e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:26,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.44235 samples/s/p 1:37:48 } +2024-07-25 23:34:29,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 885/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 6.0100842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:29,882 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.42832 samples/s/p 1:38:00 } +2024-07-25 23:34:32,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 887/ 1625], loss: 1.263, per_step_time: 1473ms, lr: 6.005375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:32,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.42798 samples/s/p 1:37:57 } +2024-07-25 23:34:35,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 889/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 6.0006705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:35,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43625 samples/s/p 1:37:45 } +2024-07-25 23:34:38,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 891/ 1625], loss: 1.047, per_step_time: 1473ms, lr: 5.995962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:38,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43024 samples/s/p 1:37:49 } +2024-07-25 23:34:41,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 893/ 1625], loss: 1.084, per_step_time: 1473ms, lr: 5.9912577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:41,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.42993 samples/s/p 1:37:46 } +2024-07-25 23:34:44,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 895/ 1625], loss: 1.151, per_step_time: 1473ms, lr: 5.986558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:44,647 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 75.5% |█████████████████████████████████████ | 5.43044 samples/s/p 1:37:43 } +2024-07-25 23:34:47,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 897/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 5.9818544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:47,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43535 samples/s/p 1:37:35 } +2024-07-25 23:34:50,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 899/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 5.9771587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:50,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43287 samples/s/p 1:37:34 } +2024-07-25 23:34:53,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 901/ 1625], loss: 1.077, per_step_time: 1473ms, lr: 5.9724625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:53,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43087 samples/s/p 1:37:33 } +2024-07-25 23:34:56,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 903/ 1625], loss: 1.016, per_step_time: 1471ms, lr: 5.9677636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:56,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43698 samples/s/p 1:37:24 } +2024-07-25 23:34:59,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 905/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 5.963073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:59,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 
5.43476 samples/s/p 1:37:23 } +2024-07-25 23:35:02,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 907/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 5.958381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:02,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43195 samples/s/p 1:37:23 } +2024-07-25 23:35:05,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 909/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 5.9536887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:05,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43566 samples/s/p 1:37:17 } +2024-07-25 23:35:08,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 911/ 1625], loss: 0.999, per_step_time: 1473ms, lr: 5.9490035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:08,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43026 samples/s/p 1:37:19 } +2024-07-25 23:35:11,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 913/ 1625], loss: 1.011, per_step_time: 1474ms, lr: 5.944317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:11,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.42634 samples/s/p 1:37:21 } +2024-07-25 23:35:14,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 915/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 5.9396325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:14,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43448 samples/s/p 1:37:09 } +2024-07-25 23:35:17,113 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 917/ 1625], loss: 1.195, per_step_time: 1469ms, lr: 5.93495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:17,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.44356 samples/s/p 1:36:56 } +2024-07-25 23:35:20,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 919/ 1625], loss: 1.008, per_step_time: 1470ms, lr: 5.930269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:20,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.44102 samples/s/p 1:36:56 } +2024-07-25 23:35:23,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 921/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 5.92559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:23,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43381 samples/s/p 1:37:01 } +2024-07-25 23:35:25,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 923/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 5.9209115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:25,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43246 samples/s/p 1:36:59 } +2024-07-25 23:35:28,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 925/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 5.9162358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:28,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43419 samples/s/p 1:36:55 } +2024-07-25 23:35:31,866 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 8/ 10], step:[ 927/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 5.911562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:31,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43754 samples/s/p 1:36:48 } +2024-07-25 23:35:34,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 929/ 1625], loss: 1.176, per_step_time: 1472ms, lr: 5.90689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:34,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43318 samples/s/p 1:36:50 } +2024-07-25 23:35:37,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 931/ 1625], loss: 0.982, per_step_time: 1473ms, lr: 5.902219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:37,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43101 samples/s/p 1:36:49 } +2024-07-25 23:35:40,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 933/ 1625], loss: 1.223, per_step_time: 1474ms, lr: 5.897553e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:40,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.42701 samples/s/p 1:36:50 } +2024-07-25 23:35:43,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 935/ 1625], loss: 1.269, per_step_time: 1470ms, lr: 5.8928836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:43,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.44010 samples/s/p 1:36:34 } +2024-07-25 23:35:46,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 937/ 1625], loss: 1.066, 
per_step_time: 1471ms, lr: 5.8882206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:46,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43655 samples/s/p 1:36:34 } +2024-07-25 23:35:49,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 939/ 1625], loss: 1.164, per_step_time: 1473ms, lr: 5.883558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:49,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43007 samples/s/p 1:36:38 } +2024-07-25 23:35:52,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 941/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 5.8788933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:52,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43155 samples/s/p 1:36:34 } +2024-07-25 23:35:55,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 943/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 5.8742357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:55,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43709 samples/s/p 1:36:25 } +2024-07-25 23:35:58,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 945/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 5.8695773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:58,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43087 samples/s/p 1:36:29 } +2024-07-25 23:36:01,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 947/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 5.8649184e-06, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 23:36:01,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43785 samples/s/p 1:36:18 } +2024-07-25 23:36:04,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 949/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 5.8602677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:04,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43379 samples/s/p 1:36:20 } +2024-07-25 23:36:07,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 951/ 1625], loss: 1.111, per_step_time: 1471ms, lr: 5.8556143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:07,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43574 samples/s/p 1:36:15 } +2024-07-25 23:36:10,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 953/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 5.8509636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:10,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43647 samples/s/p 1:36:11 } +2024-07-25 23:36:13,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 955/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 5.8463143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:13,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43762 samples/s/p 1:36:07 } +2024-07-25 23:36:16,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 957/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 5.8416667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:16,137 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43334 samples/s/p 1:36:08 } +2024-07-25 23:36:19,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 959/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 5.8370215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:19,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43244 samples/s/p 1:36:06 } +2024-07-25 23:36:22,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 961/ 1625], loss: 1.304, per_step_time: 1472ms, lr: 5.8323767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:22,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43157 samples/s/p 1:36:04 } +2024-07-25 23:36:24,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 963/ 1625], loss: 1.170, per_step_time: 1473ms, lr: 5.8277355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:24,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.42748 samples/s/p 1:36:06 } +2024-07-25 23:36:27,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 965/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 5.8230953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:27,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.42961 samples/s/p 1:36:01 } +2024-07-25 23:36:30,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 967/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 5.818457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:30,903 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.43278 samples/s/p 1:35:54 } +2024-07-25 23:36:33,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 969/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 5.8138203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:33,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.43886 samples/s/p 1:35:45 } +2024-07-25 23:36:36,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 971/ 1625], loss: 1.117, per_step_time: 1470ms, lr: 5.809185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:36,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.44016 samples/s/p 1:35:41 } +2024-07-25 23:36:39,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 973/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 5.8045516e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:39,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.43659 samples/s/p 1:35:41 } +2024-07-25 23:36:42,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 975/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 5.799921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:42,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.43271 samples/s/p 1:35:42 } +2024-07-25 23:36:45,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 977/ 1625], loss: 1.011, per_step_time: 1472ms, lr: 5.795291e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:45,653 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 76.0% |██████████████████████████████████████ | 5.43371 samples/s/p 1:35:38 } +2024-07-25 23:36:48,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 979/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 5.790663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:48,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.43549 samples/s/p 1:35:34 } +2024-07-25 23:36:51,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 981/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 5.78604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:51,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.43378 samples/s/p 1:35:33 } +2024-07-25 23:36:54,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 983/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 5.7814163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:54,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.43625 samples/s/p 1:35:27 } +2024-07-25 23:36:57,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 985/ 1625], loss: 1.071, per_step_time: 1470ms, lr: 5.7767907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:57,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.44121 samples/s/p 1:35:19 } +2024-07-25 23:37:00,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 987/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 5.7721727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:00,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ 
| 5.43663 samples/s/p 1:35:21 } +2024-07-25 23:37:03,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 989/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 5.7675543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:03,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.43605 samples/s/p 1:35:18 } +2024-07-25 23:37:06,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 991/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 5.7629345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:06,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.43723 samples/s/p 1:35:14 } +2024-07-25 23:37:09,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 993/ 1625], loss: 1.059, per_step_time: 1472ms, lr: 5.758322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:09,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.43286 samples/s/p 1:35:16 } +2024-07-25 23:37:12,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 995/ 1625], loss: 1.058, per_step_time: 1469ms, lr: 5.7537086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:12,200 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.44290 samples/s/p 1:35:02 } +2024-07-25 23:37:15,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 997/ 1625], loss: 1.046, per_step_time: 1473ms, lr: 5.749097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:15,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.42955 samples/s/p 1:35:13 } +2024-07-25 
23:37:18,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 999/ 1625], loss: 1.326, per_step_time: 1471ms, lr: 5.7444868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:18,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.43483 samples/s/p 1:35:05 } +2024-07-25 23:37:21,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1001/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 5.7398797e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:21,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.43884 samples/s/p 1:34:58 } +2024-07-25 23:37:24,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1003/ 1625], loss: 0.999, per_step_time: 1470ms, lr: 5.735274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:24,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.44057 samples/s/p 1:34:53 } +2024-07-25 23:37:26,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1005/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 5.730669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:26,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.43771 samples/s/p 1:34:53 } +2024-07-25 23:37:29,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1007/ 1625], loss: 1.062, per_step_time: 1472ms, lr: 5.726067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:29,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.43343 samples/s/p 1:34:55 } +2024-07-25 23:37:32,857 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1009/ 1625], loss: 1.149, per_step_time: 1473ms, lr: 5.7214656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:32,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.42934 samples/s/p 1:34:56 } +2024-07-25 23:37:35,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1011/ 1625], loss: 1.017, per_step_time: 1469ms, lr: 5.716867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:35,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.44223 samples/s/p 1:34:40 } +2024-07-25 23:37:38,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1013/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 5.7122697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:38,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.43726 samples/s/p 1:34:42 } +2024-07-25 23:37:41,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1015/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 5.7076745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:41,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.43567 samples/s/p 1:34:40 } +2024-07-25 23:37:44,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1017/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 5.7030807e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:44,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43358 samples/s/p 1:34:40 } +2024-07-25 23:37:47,609 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1019/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 5.698489e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:47,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43083 samples/s/p 1:34:40 } +2024-07-25 23:37:50,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1021/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 5.693899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:50,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43672 samples/s/p 1:34:31 } +2024-07-25 23:37:53,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1023/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 5.6893105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:53,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43648 samples/s/p 1:34:28 } +2024-07-25 23:37:56,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1025/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 5.684727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:56,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43579 samples/s/p 1:34:26 } +2024-07-25 23:37:59,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1027/ 1625], loss: 0.913, per_step_time: 1475ms, lr: 5.6801396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:59,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.42368 samples/s/p 1:34:35 } +2024-07-25 23:38:02,372 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1029/ 1625], loss: 1.008, per_step_time: 1474ms, lr: 5.675557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:02,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.42728 samples/s/p 1:34:29 } +2024-07-25 23:38:05,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1031/ 1625], loss: 1.226, per_step_time: 1474ms, lr: 5.670979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:05,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.42697 samples/s/p 1:34:26 } +2024-07-25 23:38:08,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1033/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 5.6663994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:08,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43798 samples/s/p 1:34:12 } +2024-07-25 23:38:11,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1035/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 5.6618196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:11,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43584 samples/s/p 1:34:11 } +2024-07-25 23:38:14,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1037/ 1625], loss: 1.022, per_step_time: 1470ms, lr: 5.6572476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:14,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.44031 samples/s/p 1:34:03 } +2024-07-25 23:38:17,128 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1039/ 1625], loss: 1.094, per_step_time: 1473ms, lr: 5.652674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:17,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.42991 samples/s/p 1:34:11 } +2024-07-25 23:38:20,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1041/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 5.648102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:20,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43764 samples/s/p 1:34:00 } +2024-07-25 23:38:23,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1043/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 5.643532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:23,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43687 samples/s/p 1:33:58 } +2024-07-25 23:38:25,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1045/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 5.6389636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:25,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43602 samples/s/p 1:33:56 } +2024-07-25 23:38:28,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1047/ 1625], loss: 0.976, per_step_time: 1471ms, lr: 5.6343974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:28,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43564 samples/s/p 1:33:53 } +2024-07-25 23:38:31,879 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1049/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 5.629833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:31,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43696 samples/s/p 1:33:49 } +2024-07-25 23:38:34,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1051/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 5.6252698e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:34,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43347 samples/s/p 1:33:50 } +2024-07-25 23:38:37,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1053/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 5.620709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:37,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43568 samples/s/p 1:33:45 } +2024-07-25 23:38:40,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1055/ 1625], loss: 1.000, per_step_time: 1471ms, lr: 5.616151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:40,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43678 samples/s/p 1:33:40 } +2024-07-25 23:38:43,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1057/ 1625], loss: 0.878, per_step_time: 1472ms, lr: 5.6115937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:43,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43188 samples/s/p 1:33:43 } +2024-07-25 23:38:46,635 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1059/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 5.607038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:46,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43432 samples/s/p 1:33:37 } +2024-07-25 23:38:49,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1061/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 5.602484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:49,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43628 samples/s/p 1:33:32 } +2024-07-25 23:38:52,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1063/ 1625], loss: 1.260, per_step_time: 1470ms, lr: 5.597932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:52,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.44019 samples/s/p 1:33:25 } +2024-07-25 23:38:55,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1065/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 5.593383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:55,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.44041 samples/s/p 1:33:22 } +2024-07-25 23:38:58,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1067/ 1625], loss: 1.397, per_step_time: 1472ms, lr: 5.588834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:58,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.43280 samples/s/p 1:33:27 } +2024-07-25 23:39:01,394 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1069/ 1625], loss: 1.022, per_step_time: 1476ms, lr: 5.5842916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:01,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.42001 samples/s/p 1:33:37 } +2024-07-25 23:39:04,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1071/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 5.5797436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:04,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.43667 samples/s/p 1:33:17 } +2024-07-25 23:39:07,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1073/ 1625], loss: 1.202, per_step_time: 1473ms, lr: 5.575201e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:07,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.43106 samples/s/p 1:33:20 } +2024-07-25 23:39:10,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1075/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 5.570663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:10,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.43561 samples/s/p 1:33:12 } +2024-07-25 23:39:13,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1077/ 1625], loss: 1.080, per_step_time: 1470ms, lr: 5.566121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:13,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.43983 samples/s/p 1:33:05 } +2024-07-25 23:39:16,150 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1079/ 1625], loss: 1.103, per_step_time: 1473ms, lr: 5.5615847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:16,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.42982 samples/s/p 1:33:12 } +2024-07-25 23:39:19,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1081/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 5.5570517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:19,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.44009 samples/s/p 1:32:59 } +2024-07-25 23:39:22,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1083/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 5.5525184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:22,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43445 samples/s/p 1:33:02 } +2024-07-25 23:39:24,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1085/ 1625], loss: 0.930, per_step_time: 1470ms, lr: 5.5479873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:24,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.44168 samples/s/p 1:32:51 } +2024-07-25 23:39:27,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1087/ 1625], loss: 0.904, per_step_time: 1471ms, lr: 5.5434575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:27,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43612 samples/s/p 1:32:54 } +2024-07-25 23:39:30,895 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1089/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 5.5389296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:30,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43820 samples/s/p 1:32:49 } +2024-07-25 23:39:33,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1091/ 1625], loss: 1.421, per_step_time: 1471ms, lr: 5.5344026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:33,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43598 samples/s/p 1:32:48 } +2024-07-25 23:39:36,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1093/ 1625], loss: 1.225, per_step_time: 1473ms, lr: 5.5298788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:36,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43098 samples/s/p 1:32:51 } +2024-07-25 23:39:39,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1095/ 1625], loss: 1.285, per_step_time: 1471ms, lr: 5.5253563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:39,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43691 samples/s/p 1:32:41 } +2024-07-25 23:39:42,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1097/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 5.520836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:42,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43743 samples/s/p 1:32:38 } +2024-07-25 23:39:45,649 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1099/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 5.516317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:45,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43363 samples/s/p 1:32:39 } +2024-07-25 23:39:48,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1101/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 5.5118003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:48,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43062 samples/s/p 1:32:39 } +2024-07-25 23:39:51,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1103/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 5.507285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:51,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.42798 samples/s/p 1:32:39 } +2024-07-25 23:39:54,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1105/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 5.502772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:54,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43500 samples/s/p 1:32:29 } +2024-07-25 23:39:57,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1107/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 5.4982634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:57,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43219 samples/s/p 1:32:29 } +2024-07-25 23:40:00,413 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1109/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 5.493752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:00,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43316 samples/s/p 1:32:25 } +2024-07-25 23:40:03,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1111/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 5.489244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:03,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43847 samples/s/p 1:32:16 } +2024-07-25 23:40:06,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1113/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 5.484741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:06,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43286 samples/s/p 1:32:19 } +2024-07-25 23:40:09,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1115/ 1625], loss: 1.126, per_step_time: 1470ms, lr: 5.4802344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:09,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.44154 samples/s/p 1:32:07 } +2024-07-25 23:40:12,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1117/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 5.475732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:12,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43832 samples/s/p 1:32:08 } +2024-07-25 23:40:15,161 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1119/ 1625], loss: 1.333, per_step_time: 1472ms, lr: 5.471234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:15,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43462 samples/s/p 1:32:08 } +2024-07-25 23:40:18,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1121/ 1625], loss: 0.987, per_step_time: 1472ms, lr: 5.466733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:18,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43322 samples/s/p 1:32:07 } +2024-07-25 23:40:21,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1123/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 5.4622396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:21,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43486 samples/s/p 1:32:02 } +2024-07-25 23:40:24,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1125/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 5.4577445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:24,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.44169 samples/s/p 1:31:52 } +2024-07-25 23:40:26,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1127/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 5.4532497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:26,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43767 samples/s/p 1:31:54 } +2024-07-25 23:40:29,913 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1129/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 5.4487605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:29,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43348 samples/s/p 1:31:55 } +2024-07-25 23:40:32,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1131/ 1625], loss: 1.124, per_step_time: 1473ms, lr: 5.4442717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:32,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43061 samples/s/p 1:31:55 } +2024-07-25 23:40:35,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1133/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 5.439784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:35,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43388 samples/s/p 1:31:49 } +2024-07-25 23:40:38,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1135/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 5.4352986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:38,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43304 samples/s/p 1:31:47 } +2024-07-25 23:40:41,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1137/ 1625], loss: 1.360, per_step_time: 1470ms, lr: 5.430815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:41,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43948 samples/s/p 1:31:37 } +2024-07-25 23:40:44,671 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1139/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 5.4263337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:44,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43051 samples/s/p 1:31:43 } +2024-07-25 23:40:47,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1141/ 1625], loss: 1.304, per_step_time: 1470ms, lr: 5.4218544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:47,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.44174 samples/s/p 1:31:29 } +2024-07-25 23:40:50,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1143/ 1625], loss: 1.033, per_step_time: 1470ms, lr: 5.4173765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:50,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43874 samples/s/p 1:31:29 } +2024-07-25 23:40:53,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1145/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 5.4129005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:53,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43622 samples/s/p 1:31:29 } +2024-07-25 23:40:56,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1147/ 1625], loss: 1.098, per_step_time: 1476ms, lr: 5.4084253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:56,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.41847 samples/s/p 1:31:44 } +2024-07-25 23:40:59,429 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1149/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 5.4039533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:59,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43476 samples/s/p 1:31:24 } +2024-07-25 23:41:02,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1151/ 1625], loss: 1.111, per_step_time: 1473ms, lr: 5.3994845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:02,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43031 samples/s/p 1:31:26 } +2024-07-25 23:41:05,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1153/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 5.3950143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:05,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43618 samples/s/p 1:31:17 } +2024-07-25 23:41:08,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1155/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 5.390547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:08,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.42877 samples/s/p 1:31:21 } +2024-07-25 23:41:11,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1157/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 5.386085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:11,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43422 samples/s/p 1:31:13 } +2024-07-25 23:41:14,186 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1159/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 5.3816193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:14,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43979 samples/s/p 1:31:04 } +2024-07-25 23:41:17,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1161/ 1625], loss: 1.161, per_step_time: 1470ms, lr: 5.377158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:17,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43939 samples/s/p 1:31:02 } +2024-07-25 23:41:20,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1163/ 1625], loss: 1.136, per_step_time: 1470ms, lr: 5.372701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:20,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43939 samples/s/p 1:30:59 } +2024-07-25 23:41:23,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1165/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 5.368241e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:23,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43326 samples/s/p 1:31:02 } +2024-07-25 23:41:25,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1167/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 5.363788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:25,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43442 samples/s/p 1:30:58 } +2024-07-25 23:41:28,936 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1169/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 5.359334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:28,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43693 samples/s/p 1:30:53 } +2024-07-25 23:41:31,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1171/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 5.3548797e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:31,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43770 samples/s/p 1:30:49 } +2024-07-25 23:41:34,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1173/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 5.350432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:34,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43164 samples/s/p 1:30:52 } +2024-07-25 23:41:37,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1175/ 1625], loss: 1.012, per_step_time: 1471ms, lr: 5.3459844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:37,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43633 samples/s/p 1:30:44 } +2024-07-25 23:41:40,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1177/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 5.341535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:40,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43142 samples/s/p 1:30:46 } +2024-07-25 23:41:43,691 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1179/ 1625], loss: 1.292, per_step_time: 1471ms, lr: 5.3370936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:43,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43659 samples/s/p 1:30:38 } +2024-07-25 23:41:46,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1181/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 5.3326517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:46,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43087 samples/s/p 1:30:41 } +2024-07-25 23:41:49,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1183/ 1625], loss: 1.112, per_step_time: 1474ms, lr: 5.328211e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:49,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.42436 samples/s/p 1:30:45 } +2024-07-25 23:41:52,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1185/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 5.323772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:52,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43806 samples/s/p 1:30:28 } +2024-07-25 23:41:55,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1187/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 5.319335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:55,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43584 samples/s/p 1:30:27 } +2024-07-25 23:41:58,451 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1189/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 5.3149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:58,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43582 samples/s/p 1:30:24 } +2024-07-25 23:42:01,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1191/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 5.3104673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:01,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43117 samples/s/p 1:30:26 } +2024-07-25 23:42:04,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1193/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 5.306036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:04,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43204 samples/s/p 1:30:22 } +2024-07-25 23:42:07,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1195/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 5.301609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:07,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43493 samples/s/p 1:30:16 } +2024-07-25 23:42:10,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1197/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 5.2971795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:10,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43640 samples/s/p 1:30:12 } +2024-07-25 23:42:13,207 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1199/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 5.2927535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:13,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43940 samples/s/p 1:30:06 } +2024-07-25 23:42:16,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1201/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 5.288333e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:16,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43895 samples/s/p 1:30:03 } +2024-07-25 23:42:19,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1203/ 1625], loss: 1.358, per_step_time: 1473ms, lr: 5.2839086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:19,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43037 samples/s/p 1:30:09 } +2024-07-25 23:42:22,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1205/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 5.2794885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:22,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43577 samples/s/p 1:30:01 } +2024-07-25 23:42:25,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1207/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 5.275073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:25,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43485 samples/s/p 1:29:59 } +2024-07-25 23:42:27,961 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1209/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 5.270654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:27,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43518 samples/s/p 1:29:55 } +2024-07-25 23:42:30,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1211/ 1625], loss: 0.974, per_step_time: 1474ms, lr: 5.266243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:30,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.42380 samples/s/p 1:30:04 } +2024-07-25 23:42:33,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1213/ 1625], loss: 1.045, per_step_time: 1471ms, lr: 5.2618298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:33,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43782 samples/s/p 1:29:47 } +2024-07-25 23:42:36,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1215/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 5.257417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43642 samples/s/p 1:29:45 } +2024-07-25 23:42:39,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1217/ 1625], loss: 0.947, per_step_time: 1471ms, lr: 5.253011e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:39,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43591 samples/s/p 1:29:43 } +2024-07-25 23:42:42,721 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1219/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 5.248604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:42,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43262 samples/s/p 1:29:43 } +2024-07-25 23:42:45,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1221/ 1625], loss: 1.082, per_step_time: 1473ms, lr: 5.244197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:45,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.42790 samples/s/p 1:29:45 } +2024-07-25 23:42:48,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1223/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 5.2397972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:48,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43108 samples/s/p 1:29:39 } +2024-07-25 23:42:51,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1225/ 1625], loss: 1.260, per_step_time: 1473ms, lr: 5.2353953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:51,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.42959 samples/s/p 1:29:37 } +2024-07-25 23:42:51,585 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 23:43:27,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1227/ 1625], loss: 0.972, per_step_time: 2101ms, lr: 5.230997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:27,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 3.80696 samples/s/p 2:07:45 } +2024-07-25 23:43:30,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1229/ 1625], loss: 1.169, per_step_time: 1473ms, lr: 5.226599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:30,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.42791 samples/s/p 1:29:33 } +2024-07-25 23:43:33,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1231/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 5.222204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:33,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43568 samples/s/p 1:29:23 } +2024-07-25 23:43:36,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1233/ 1625], loss: 1.239, per_step_time: 1473ms, lr: 5.21781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:36,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.42967 samples/s/p 1:29:26 } +2024-07-25 23:43:39,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1235/ 1625], loss: 0.976, per_step_time: 1472ms, lr: 5.2134196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:39,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43406 samples/s/p 1:29:18 } +2024-07-25 23:43:41,997 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1237/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 5.20903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:41,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43256 samples/s/p 1:29:17 } +2024-07-25 23:43:44,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1239/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 5.204644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:44,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43742 samples/s/p 1:29:09 } +2024-07-25 23:43:47,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1241/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 5.200256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:47,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43680 samples/s/p 1:29:07 } +2024-07-25 23:43:50,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1243/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 5.1958723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:50,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43037 samples/s/p 1:29:10 } +2024-07-25 23:43:53,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1245/ 1625], loss: 0.898, per_step_time: 1471ms, lr: 5.1914926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:53,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43681 samples/s/p 1:29:01 } +2024-07-25 23:43:56,751 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1247/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 5.1871107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:56,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43593 samples/s/p 1:28:59 } +2024-07-25 23:43:59,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1249/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 5.1827324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:59,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43598 samples/s/p 1:28:56 } +2024-07-25 23:44:02,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1251/ 1625], loss: 1.108, per_step_time: 1476ms, lr: 5.178358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:02,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.41734 samples/s/p 1:29:11 } +2024-07-25 23:44:05,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1253/ 1625], loss: 1.395, per_step_time: 1472ms, lr: 5.1739808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:05,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43376 samples/s/p 1:28:52 } +2024-07-25 23:44:08,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1255/ 1625], loss: 1.357, per_step_time: 1470ms, lr: 5.169611e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:08,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43850 samples/s/p 1:28:45 } +2024-07-25 23:44:11,515 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1257/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 5.1652405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:11,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43514 samples/s/p 1:28:45 } +2024-07-25 23:44:14,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1259/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 5.1608695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:14,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43962 samples/s/p 1:28:38 } +2024-07-25 23:44:17,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1261/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 5.1565053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:17,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43542 samples/s/p 1:28:39 } +2024-07-25 23:44:20,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1263/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 5.1521397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:20,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43522 samples/s/p 1:28:36 } +2024-07-25 23:44:23,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1265/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 5.147777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:23,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.44082 samples/s/p 1:28:28 } +2024-07-25 23:44:26,266 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1267/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 5.143416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:26,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.42869 samples/s/p 1:28:36 } +2024-07-25 23:44:29,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1269/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 5.1390575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:29,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.44103 samples/s/p 1:28:21 } +2024-07-25 23:44:32,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1271/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 5.1346997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:32,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43760 samples/s/p 1:28:22 } +2024-07-25 23:44:35,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1273/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 5.1303446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:35,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43594 samples/s/p 1:28:21 } +2024-07-25 23:44:38,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1275/ 1625], loss: 1.031, per_step_time: 1471ms, lr: 5.1259904e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:38,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43657 samples/s/p 1:28:17 } +2024-07-25 23:44:41,019 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1277/ 1625], loss: 1.221, per_step_time: 1473ms, lr: 5.12164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:41,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.42859 samples/s/p 1:28:22 } +2024-07-25 23:44:43,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1279/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 5.1172897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:43,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.43399 samples/s/p 1:28:14 } +2024-07-25 23:44:46,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1281/ 1625], loss: 1.144, per_step_time: 1473ms, lr: 5.1129427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:46,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.43066 samples/s/p 1:28:14 } +2024-07-25 23:44:49,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1283/ 1625], loss: 0.895, per_step_time: 1470ms, lr: 5.108599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:49,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.44045 samples/s/p 1:28:01 } +2024-07-25 23:44:52,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1285/ 1625], loss: 1.070, per_step_time: 1470ms, lr: 5.1042534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:53,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.43943 samples/s/p 1:27:59 } +2024-07-25 23:44:56,468 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1287/ 1625], loss: 1.298, per_step_time: 1474ms, lr: 5.099911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:56,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.42410 samples/s/p 1:28:11 } +2024-07-25 23:44:59,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1289/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 5.095573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:59,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.43393 samples/s/p 1:27:59 } +2024-07-25 23:45:02,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1291/ 1625], loss: 1.193, per_step_time: 1475ms, lr: 5.091233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:02,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.42071 samples/s/p 1:28:09 } +2024-07-25 23:45:05,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1293/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 5.086899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:05,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.43117 samples/s/p 1:27:56 } +2024-07-25 23:45:08,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1295/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 5.082565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:08,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.44083 samples/s/p 1:27:43 } +2024-07-25 23:45:11,232 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1297/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 5.07823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:11,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.43198 samples/s/p 1:27:49 } +2024-07-25 23:45:14,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1299/ 1625], loss: 1.252, per_step_time: 1475ms, lr: 5.073902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:14,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.42330 samples/s/p 1:27:55 } +2024-07-25 23:45:17,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1301/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 5.0695744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:17,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.43425 samples/s/p 1:27:41 } +2024-07-25 23:45:20,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1303/ 1625], loss: 1.122, per_step_time: 1475ms, lr: 5.0652447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:20,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.42173 samples/s/p 1:27:50 } +2024-07-25 23:45:23,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1305/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 5.0609233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:23,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.43813 samples/s/p 1:27:31 } +2024-07-25 23:45:25,997 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1307/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 5.0566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:25,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.44006 samples/s/p 1:27:27 } +2024-07-25 23:45:28,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1309/ 1625], loss: 1.139, per_step_time: 1477ms, lr: 5.05228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:28,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.41412 samples/s/p 1:27:49 } +2024-07-25 23:45:31,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1311/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 5.0479603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:31,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43614 samples/s/p 1:27:24 } +2024-07-25 23:45:34,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1313/ 1625], loss: 1.139, per_step_time: 1473ms, lr: 5.043644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:34,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43101 samples/s/p 1:27:26 } +2024-07-25 23:45:37,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1315/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 5.0393287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:37,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43060 samples/s/p 1:27:24 } +2024-07-25 23:45:40,770 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1317/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 5.035016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:40,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43363 samples/s/p 1:27:18 } +2024-07-25 23:45:43,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1319/ 1625], loss: 1.213, per_step_time: 1473ms, lr: 5.030705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:43,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.42839 samples/s/p 1:27:20 } +2024-07-25 23:45:46,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1321/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 5.0263957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:46,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.42996 samples/s/p 1:27:16 } +2024-07-25 23:45:49,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1323/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 5.0220883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:49,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43814 samples/s/p 1:27:05 } +2024-07-25 23:45:52,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1325/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 5.017783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:52,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.43274 samples/s/p 1:27:07 } +2024-07-25 23:45:55,534 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1327/ 1625], loss: 1.387, per_step_time: 1473ms, lr: 5.01348e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:55,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.42777 samples/s/p 1:27:09 } +2024-07-25 23:45:58,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1329/ 1625], loss: 1.257, per_step_time: 1474ms, lr: 5.0091776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:58,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.42628 samples/s/p 1:27:07 } +2024-07-25 23:46:01,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1331/ 1625], loss: 1.132, per_step_time: 1474ms, lr: 5.004879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:01,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.42672 samples/s/p 1:27:04 } +2024-07-25 23:46:04,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1333/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 5.000584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:04,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.43266 samples/s/p 1:26:55 } +2024-07-25 23:46:07,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1335/ 1625], loss: 1.113, per_step_time: 1474ms, lr: 4.9962855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:07,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.42463 samples/s/p 1:27:00 } +2024-07-25 23:46:10,304 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1337/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 4.9919945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:10,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.43842 samples/s/p 1:26:44 } +2024-07-25 23:46:13,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1339/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 4.9877026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:13,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.43371 samples/s/p 1:26:46 } +2024-07-25 23:46:16,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1341/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 4.9834107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:16,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43630 samples/s/p 1:26:40 } +2024-07-25 23:46:19,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1343/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 4.9791247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:19,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.42971 samples/s/p 1:26:43 } +2024-07-25 23:46:22,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1345/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 4.9748396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:22,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43619 samples/s/p 1:26:34 } +2024-07-25 23:46:25,061 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1347/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 4.9705527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:25,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43637 samples/s/p 1:26:31 } +2024-07-25 23:46:28,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1349/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 4.966273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:28,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43307 samples/s/p 1:26:31 } +2024-07-25 23:46:30,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1351/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 4.961993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:30,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43280 samples/s/p 1:26:29 } +2024-07-25 23:46:33,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1353/ 1625], loss: 1.288, per_step_time: 1471ms, lr: 4.957715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:33,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43736 samples/s/p 1:26:21 } +2024-07-25 23:46:36,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1355/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 4.9534397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:36,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43656 samples/s/p 1:26:19 } +2024-07-25 23:46:39,818 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1357/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 4.949165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:39,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43104 samples/s/p 1:26:22 } +2024-07-25 23:46:42,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1359/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 4.9448927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:42,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43895 samples/s/p 1:26:11 } +2024-07-25 23:46:45,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1361/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 4.9406226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:45,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43759 samples/s/p 1:26:09 } +2024-07-25 23:46:48,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1363/ 1625], loss: 1.276, per_step_time: 1472ms, lr: 4.936354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:48,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43466 samples/s/p 1:26:09 } +2024-07-25 23:46:51,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1365/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 4.932088e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:51,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43787 samples/s/p 1:26:03 } +2024-07-25 23:46:54,569 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1367/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 4.9278233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:54,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43307 samples/s/p 1:26:05 } +2024-07-25 23:46:57,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1369/ 1625], loss: 1.018, per_step_time: 1471ms, lr: 4.92356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:57,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43598 samples/s/p 1:25:59 } +2024-07-25 23:47:00,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1371/ 1625], loss: 1.051, per_step_time: 1473ms, lr: 4.919299e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:00,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43030 samples/s/p 1:26:02 } +2024-07-25 23:47:03,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1373/ 1625], loss: 1.125, per_step_time: 1483ms, lr: 4.915041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:03,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.39440 samples/s/p 1:26:33 } +2024-07-25 23:47:06,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1375/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 4.9107844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:06,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43903 samples/s/p 1:25:47 } +2024-07-25 23:47:09,348 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1377/ 1625], loss: 1.025, per_step_time: 1473ms, lr: 4.9065297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:09,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43104 samples/s/p 1:25:52 } +2024-07-25 23:47:12,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1379/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 4.9022765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:12,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43282 samples/s/p 1:25:47 } +2024-07-25 23:47:15,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1381/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 4.8980287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:15,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43884 samples/s/p 1:25:39 } +2024-07-25 23:47:18,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1383/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 4.8937773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:18,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43465 samples/s/p 1:25:40 } +2024-07-25 23:47:21,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1385/ 1625], loss: 1.080, per_step_time: 1472ms, lr: 4.8895304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:21,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43340 samples/s/p 1:25:38 } +2024-07-25 23:47:24,106 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1387/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 4.8852876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:24,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.42931 samples/s/p 1:25:39 } +2024-07-25 23:47:27,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1389/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 4.881045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:27,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43632 samples/s/p 1:25:29 } +2024-07-25 23:47:30,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1391/ 1625], loss: 1.335, per_step_time: 1473ms, lr: 4.8768015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:30,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43005 samples/s/p 1:25:32 } +2024-07-25 23:47:32,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1393/ 1625], loss: 1.173, per_step_time: 1473ms, lr: 4.8725647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:32,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43032 samples/s/p 1:25:29 } +2024-07-25 23:47:35,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1395/ 1625], loss: 1.056, per_step_time: 1470ms, lr: 4.8683273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:35,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.44108 samples/s/p 1:25:16 } +2024-07-25 23:47:38,859 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1397/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 4.8640923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:38,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43952 samples/s/p 1:25:15 } +2024-07-25 23:47:41,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1399/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 4.85986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:41,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43126 samples/s/p 1:25:19 } +2024-07-25 23:47:44,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1401/ 1625], loss: 1.302, per_step_time: 1473ms, lr: 4.8556276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:44,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43063 samples/s/p 1:25:17 } +2024-07-25 23:47:47,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1403/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 4.851399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:47,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43258 samples/s/p 1:25:12 } +2024-07-25 23:47:50,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1405/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 4.8471716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:50,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43395 samples/s/p 1:25:08 } +2024-07-25 23:47:53,621 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1407/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 4.8429465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:53,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43236 samples/s/p 1:25:07 } +2024-07-25 23:47:56,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1409/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 4.8387237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:56,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43768 samples/s/p 1:24:59 } +2024-07-25 23:47:59,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1411/ 1625], loss: 1.067, per_step_time: 1471ms, lr: 4.8345014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:59,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43616 samples/s/p 1:24:57 } +2024-07-25 23:48:02,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1413/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 4.8302823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:02,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43433 samples/s/p 1:24:56 } +2024-07-25 23:48:05,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1415/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 4.8260645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:05,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43885 samples/s/p 1:24:49 } +2024-07-25 23:48:08,372 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1417/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 4.8218494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:08,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43411 samples/s/p 1:24:50 } +2024-07-25 23:48:11,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1419/ 1625], loss: 1.362, per_step_time: 1471ms, lr: 4.817638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:11,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43505 samples/s/p 1:24:46 } +2024-07-25 23:48:14,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1421/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 4.8134248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:14,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43723 samples/s/p 1:24:42 } +2024-07-25 23:48:17,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1423/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 4.809215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:17,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43690 samples/s/p 1:24:39 } +2024-07-25 23:48:20,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1425/ 1625], loss: 0.984, per_step_time: 1472ms, lr: 4.8050097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:20,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43385 samples/s/p 1:24:39 } +2024-07-25 23:48:23,124 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1427/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 4.8008023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:23,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43682 samples/s/p 1:24:33 } +2024-07-25 23:48:26,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1429/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 4.796598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:26,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43546 samples/s/p 1:24:31 } +2024-07-25 23:48:29,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1431/ 1625], loss: 0.991, per_step_time: 1470ms, lr: 4.792399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:29,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.44050 samples/s/p 1:24:24 } +2024-07-25 23:48:31,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1433/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 4.7881967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:31,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43418 samples/s/p 1:24:27 } +2024-07-25 23:48:34,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1435/ 1625], loss: 1.359, per_step_time: 1471ms, lr: 4.7840017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:34,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43589 samples/s/p 1:24:22 } +2024-07-25 23:48:37,876 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1437/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 4.7798057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:37,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43574 samples/s/p 1:24:19 } +2024-07-25 23:48:40,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1439/ 1625], loss: 0.954, per_step_time: 1473ms, lr: 4.775612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:40,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.42993 samples/s/p 1:24:22 } +2024-07-25 23:48:43,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1441/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 4.7714207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:43,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43159 samples/s/p 1:24:17 } +2024-07-25 23:48:46,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1443/ 1625], loss: 1.316, per_step_time: 1473ms, lr: 4.7672306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:46,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43050 samples/s/p 1:24:15 } +2024-07-25 23:48:49,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1445/ 1625], loss: 1.288, per_step_time: 1474ms, lr: 4.7630424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:49,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.42705 samples/s/p 1:24:16 } +2024-07-25 23:48:52,640 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1447/ 1625], loss: 1.345, per_step_time: 1471ms, lr: 4.758857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:52,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43651 samples/s/p 1:24:04 } +2024-07-25 23:48:55,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1449/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 4.7546737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:55,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43036 samples/s/p 1:24:07 } +2024-07-25 23:48:58,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1451/ 1625], loss: 1.057, per_step_time: 1473ms, lr: 4.7504914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:58,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43022 samples/s/p 1:24:04 } +2024-07-25 23:49:01,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1453/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 4.746311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:01,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.42920 samples/s/p 1:24:02 } +2024-07-25 23:49:04,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1455/ 1625], loss: 0.988, per_step_time: 1471ms, lr: 4.742134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:04,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.43840 samples/s/p 1:23:50 } +2024-07-25 23:49:07,399 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1457/ 1625], loss: 1.376, per_step_time: 1470ms, lr: 4.737958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:07,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.43872 samples/s/p 1:23:47 } +2024-07-25 23:49:10,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1459/ 1625], loss: 1.180, per_step_time: 1475ms, lr: 4.7337835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:10,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.42255 samples/s/p 1:23:59 } +2024-07-25 23:49:13,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1461/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 4.7296116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:13,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.43479 samples/s/p 1:23:45 } +2024-07-25 23:49:16,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1463/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 4.7254443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:16,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.43930 samples/s/p 1:23:38 } +2024-07-25 23:49:19,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1465/ 1625], loss: 1.030, per_step_time: 1470ms, lr: 4.721274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:19,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.44051 samples/s/p 1:23:34 } +2024-07-25 23:49:22,151 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1467/ 1625], loss: 1.141, per_step_time: 1469ms, lr: 4.7171084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:22,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.44417 samples/s/p 1:23:27 } +2024-07-25 23:49:25,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1469/ 1625], loss: 1.019, per_step_time: 1469ms, lr: 4.712947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:25,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.44426 samples/s/p 1:23:24 } +2024-07-25 23:49:28,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1471/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 4.708782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:28,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43583 samples/s/p 1:23:29 } +2024-07-25 23:49:31,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1473/ 1625], loss: 1.039, per_step_time: 1475ms, lr: 4.7046224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:31,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.42355 samples/s/p 1:23:38 } +2024-07-25 23:49:33,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1475/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 4.700467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:33,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.42772 samples/s/p 1:23:31 } +2024-07-25 23:49:36,912 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1477/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 4.6963078e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:36,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43209 samples/s/p 1:23:24 } +2024-07-25 23:49:39,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1479/ 1625], loss: 1.274, per_step_time: 1471ms, lr: 4.692157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:39,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43689 samples/s/p 1:23:16 } +2024-07-25 23:49:42,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1481/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 4.688005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:42,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43347 samples/s/p 1:23:17 } +2024-07-25 23:49:45,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1483/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 4.6838522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:45,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43602 samples/s/p 1:23:11 } +2024-07-25 23:49:48,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1485/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 4.6797063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:48,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43366 samples/s/p 1:23:11 } +2024-07-25 23:49:51,670 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1487/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 4.6755604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:51,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.42847 samples/s/p 1:23:12 } +2024-07-25 23:49:54,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1489/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 4.6714163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:54,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43386 samples/s/p 1:23:05 } +2024-07-25 23:49:57,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1491/ 1625], loss: 1.251, per_step_time: 1473ms, lr: 4.667274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:57,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43094 samples/s/p 1:23:04 } +2024-07-25 23:50:00,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1493/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 4.663134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:00,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43888 samples/s/p 1:22:54 } +2024-07-25 23:50:03,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1495/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 4.6589967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:03,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43340 samples/s/p 1:22:56 } +2024-07-25 23:50:06,426 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1497/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 4.6548603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:06,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43589 samples/s/p 1:22:51 } +2024-07-25 23:50:09,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1499/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 4.6507257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:09,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43668 samples/s/p 1:22:47 } +2024-07-25 23:50:12,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1501/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 4.6465934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:12,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43225 samples/s/p 1:22:48 } +2024-07-25 23:50:15,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1503/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 4.6424643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:15,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43430 samples/s/p 1:22:44 } +2024-07-25 23:50:18,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1505/ 1625], loss: 1.027, per_step_time: 1472ms, lr: 4.6383366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:18,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43304 samples/s/p 1:22:42 } +2024-07-25 23:50:21,184 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1507/ 1625], loss: 1.265, per_step_time: 1473ms, lr: 4.634212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:21,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43035 samples/s/p 1:22:41 } +2024-07-25 23:50:24,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1509/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 4.630086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:24,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43602 samples/s/p 1:22:33 } +2024-07-25 23:50:27,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1511/ 1625], loss: 1.060, per_step_time: 1471ms, lr: 4.6259643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:27,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43541 samples/s/p 1:22:31 } +2024-07-25 23:50:30,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1513/ 1625], loss: 1.123, per_step_time: 1482ms, lr: 4.621846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:30,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.39710 samples/s/p 1:23:03 } +2024-07-25 23:50:33,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1515/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 4.617726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:33,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43946 samples/s/p 1:22:21 } +2024-07-25 23:50:35,959 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1517/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 4.6136106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:35,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43006 samples/s/p 1:22:27 } +2024-07-25 23:50:38,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1519/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 4.6094983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:38,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43787 samples/s/p 1:22:17 } +2024-07-25 23:50:41,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1521/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 4.6053838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:41,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.44073 samples/s/p 1:22:11 } +2024-07-25 23:50:44,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1523/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 4.6012765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:44,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43047 samples/s/p 1:22:18 } +2024-07-25 23:50:47,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1525/ 1625], loss: 1.379, per_step_time: 1472ms, lr: 4.5971688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:47,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43198 samples/s/p 1:22:13 } +2024-07-25 23:50:50,713 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1527/ 1625], loss: 1.326, per_step_time: 1472ms, lr: 4.593061e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:50,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43299 samples/s/p 1:22:09 } +2024-07-25 23:50:53,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1529/ 1625], loss: 1.167, per_step_time: 1470ms, lr: 4.588959e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:53,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43908 samples/s/p 1:22:01 } +2024-07-25 23:50:56,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1531/ 1625], loss: 1.281, per_step_time: 1475ms, lr: 4.5848574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:56,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.42365 samples/s/p 1:22:12 } +2024-07-25 23:50:59,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1533/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 4.5807546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:59,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.44058 samples/s/p 1:21:54 } +2024-07-25 23:51:02,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1535/ 1625], loss: 1.014, per_step_time: 1471ms, lr: 4.5766587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:02,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43618 samples/s/p 1:21:55 } +2024-07-25 23:51:05,469 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1537/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 4.5725637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:05,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43481 samples/s/p 1:21:53 } +2024-07-25 23:51:08,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1539/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 4.568469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:08,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43696 samples/s/p 1:21:48 } +2024-07-25 23:51:11,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1541/ 1625], loss: 1.297, per_step_time: 1470ms, lr: 4.5643774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:11,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.44026 samples/s/p 1:21:42 } +2024-07-25 23:51:14,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1543/ 1625], loss: 0.955, per_step_time: 1471ms, lr: 4.560288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:14,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43639 samples/s/p 1:21:43 } +2024-07-25 23:51:17,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1545/ 1625], loss: 1.237, per_step_time: 1473ms, lr: 4.5561997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:17,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.42883 samples/s/p 1:21:47 } +2024-07-25 23:51:20,222 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1547/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 4.5521147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:20,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43348 samples/s/p 1:21:39 } +2024-07-25 23:51:23,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1549/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 4.548031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:23,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43713 samples/s/p 1:21:33 } +2024-07-25 23:51:26,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1551/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 4.5439515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:26,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43487 samples/s/p 1:21:32 } +2024-07-25 23:51:29,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1553/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 4.5398697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:29,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43557 samples/s/p 1:21:29 } +2024-07-25 23:51:32,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1555/ 1625], loss: 0.990, per_step_time: 1471ms, lr: 4.535792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:32,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43614 samples/s/p 1:21:25 } +2024-07-25 23:51:34,976 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1557/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 4.531719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:34,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43254 samples/s/p 1:21:26 } +2024-07-25 23:51:37,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1559/ 1625], loss: 1.250, per_step_time: 1469ms, lr: 4.527643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:37,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.44375 samples/s/p 1:21:13 } +2024-07-25 23:51:40,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1561/ 1625], loss: 1.327, per_step_time: 1470ms, lr: 4.523571e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:40,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43850 samples/s/p 1:21:14 } +2024-07-25 23:51:43,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1563/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 4.519503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:43,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43211 samples/s/p 1:21:17 } +2024-07-25 23:51:46,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1565/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 4.5154343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:46,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43013 samples/s/p 1:21:16 } +2024-07-25 23:51:49,728 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1567/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 4.51137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:49,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43651 samples/s/p 1:21:07 } +2024-07-25 23:51:52,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1569/ 1625], loss: 1.290, per_step_time: 1469ms, lr: 4.5073075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:52,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.44434 samples/s/p 1:20:57 } +2024-07-25 23:51:55,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1571/ 1625], loss: 0.994, per_step_time: 1470ms, lr: 4.503243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:55,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.43865 samples/s/p 1:21:00 } +2024-07-25 23:51:58,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1573/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 4.4991866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:58,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.43465 samples/s/p 1:21:00 } +2024-07-25 23:52:01,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1575/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 4.495129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:01,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.43971 samples/s/p 1:20:53 } +2024-07-25 23:52:04,474 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1577/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 4.491073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:04,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.43533 samples/s/p 1:20:54 } +2024-07-25 23:52:07,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1579/ 1625], loss: 1.230, per_step_time: 1470ms, lr: 4.4870203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:07,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.43981 samples/s/p 1:20:47 } +2024-07-25 23:52:10,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1581/ 1625], loss: 1.312, per_step_time: 1471ms, lr: 4.482969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:10,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.43559 samples/s/p 1:20:48 } +2024-07-25 23:52:13,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1583/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 4.47892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:13,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.42939 samples/s/p 1:20:50 } +2024-07-25 23:52:16,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1585/ 1625], loss: 1.316, per_step_time: 1471ms, lr: 4.474872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:16,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43585 samples/s/p 1:20:41 } +2024-07-25 23:52:19,229 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1587/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 4.4708277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:19,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43277 samples/s/p 1:20:41 } +2024-07-25 23:52:22,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1589/ 1625], loss: 1.270, per_step_time: 1474ms, lr: 4.4667863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:22,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.42598 samples/s/p 1:20:44 } +2024-07-25 23:52:25,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1591/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 4.4627423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:25,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43308 samples/s/p 1:20:35 } +2024-07-25 23:52:28,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1593/ 1625], loss: 1.184, per_step_time: 1473ms, lr: 4.4587036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:28,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.42993 samples/s/p 1:20:35 } +2024-07-25 23:52:31,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1595/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 4.454668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:31,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43297 samples/s/p 1:20:29 } +2024-07-25 23:52:33,991 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1597/ 1625], loss: 1.201, per_step_time: 1471ms, lr: 4.4506323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:33,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43803 samples/s/p 1:20:22 } +2024-07-25 23:52:36,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1599/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 4.4465987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:36,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43256 samples/s/p 1:20:24 } +2024-07-25 23:52:39,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1601/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 4.4425697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:39,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43046 samples/s/p 1:20:23 } +2024-07-25 23:52:42,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1603/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 4.4385383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:42,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.42888 samples/s/p 1:20:21 } +2024-07-25 23:52:45,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1605/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 4.4345143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:45,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43393 samples/s/p 1:20:14 } +2024-07-25 23:52:48,751 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1607/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 4.4304898e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:48,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43883 samples/s/p 1:20:06 } +2024-07-25 23:52:51,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1609/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 4.426465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:51,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43504 samples/s/p 1:20:07 } +2024-07-25 23:52:54,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1611/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 4.4224466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:54,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43300 samples/s/p 1:20:06 } +2024-07-25 23:52:57,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1613/ 1625], loss: 1.323, per_step_time: 1471ms, lr: 4.418427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:57,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43711 samples/s/p 1:19:59 } +2024-07-25 23:53:00,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1615/ 1625], loss: 1.067, per_step_time: 1471ms, lr: 4.414409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:00,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43842 samples/s/p 1:19:55 } +2024-07-25 23:53:03,504 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1617/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 4.4103963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:03,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.43324 samples/s/p 1:19:57 } +2024-07-25 23:53:06,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1619/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 4.4063836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:06,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.43808 samples/s/p 1:19:49 } +2024-07-25 23:53:09,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1621/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 4.402373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:09,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.43569 samples/s/p 1:19:49 } +2024-07-25 23:53:12,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1623/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 4.3983646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:12,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.43274 samples/s/p 1:19:48 } +2024-07-25 23:53:15,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1625/ 1625], loss: 1.001, per_step_time: 1472ms, lr: 4.394358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:15,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.43444 samples/s/p 1:19:44 } +2024-07-25 23:53:18,262 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 2/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 4.3903538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:18,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.42789 samples/s/p 1:19:47 } +2024-07-25 23:53:21,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 4/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 4.3863524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:21,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.43241 samples/s/p 1:19:40 } +2024-07-25 23:53:24,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 6/ 1625], loss: 1.149, per_step_time: 1474ms, lr: 4.3823516e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:24,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.42612 samples/s/p 1:19:42 } +2024-07-25 23:53:27,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 8/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 4.3783525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:27,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.43569 samples/s/p 1:19:31 } +2024-07-25 23:53:30,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 10/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 4.374357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:30,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43784 samples/s/p 1:19:26 } +2024-07-25 23:53:33,021 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 12/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 4.3703635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:33,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43391 samples/s/p 1:19:27 } +2024-07-25 23:53:35,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 14/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 4.366374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:35,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43599 samples/s/p 1:19:22 } +2024-07-25 23:53:38,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 16/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 4.362382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:38,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43178 samples/s/p 1:19:23 } +2024-07-25 23:53:41,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 18/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 4.358393e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:41,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43810 samples/s/p 1:19:14 } +2024-07-25 23:53:44,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 20/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 4.35441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:44,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43416 samples/s/p 1:19:15 } +2024-07-25 23:53:47,783 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 22/ 1625], loss: 1.292, per_step_time: 1475ms, lr: 4.350423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:47,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.42171 samples/s/p 1:19:23 } +2024-07-25 23:53:50,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 24/ 1625], loss: 1.074, per_step_time: 1473ms, lr: 4.3464447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:50,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.42907 samples/s/p 1:19:13 } +2024-07-25 23:53:53,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 26/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 4.342464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:53,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43526 samples/s/p 1:19:05 } +2024-07-25 23:53:56,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 28/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 4.338484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:56,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43919 samples/s/p 1:18:58 } +2024-07-25 23:53:59,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 30/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 4.334511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:59,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43734 samples/s/p 1:18:57 } +2024-07-25 23:54:02,533 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 32/ 1625], loss: 1.037, per_step_time: 1469ms, lr: 4.330538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:02,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.44316 samples/s/p 1:18:49 } +2024-07-25 23:54:05,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 34/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 4.326564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:05,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43497 samples/s/p 1:18:53 } +2024-07-25 23:54:08,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 36/ 1625], loss: 1.078, per_step_time: 1474ms, lr: 4.3225964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:08,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.42671 samples/s/p 1:18:58 } +2024-07-25 23:54:11,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 38/ 1625], loss: 1.167, per_step_time: 1474ms, lr: 4.318629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:11,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.42553 samples/s/p 1:18:56 } +2024-07-25 23:54:14,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 40/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 4.3146647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:14,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43576 samples/s/p 1:18:44 } +2024-07-25 23:54:17,294 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 42/ 1625], loss: 1.137, per_step_time: 1470ms, lr: 4.310701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:17,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43987 samples/s/p 1:18:37 } +2024-07-25 23:54:20,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 44/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 4.3067403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:20,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43523 samples/s/p 1:18:38 } +2024-07-25 23:54:23,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 46/ 1625], loss: 1.282, per_step_time: 1474ms, lr: 4.3027812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:23,200 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.42722 samples/s/p 1:18:42 } +2024-07-25 23:54:26,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 48/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 4.2988236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:26,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43536 samples/s/p 1:18:32 } +2024-07-25 23:54:29,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 50/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 4.2948686e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:29,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43252 samples/s/p 1:18:32 } +2024-07-25 23:54:32,051 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 52/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 4.2909155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:32,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43923 samples/s/p 1:18:23 } +2024-07-25 23:54:34,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 54/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 4.286965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:34,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.44072 samples/s/p 1:18:19 } +2024-07-25 23:54:37,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 56/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 4.283017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:37,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43485 samples/s/p 1:18:21 } +2024-07-25 23:54:40,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 58/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 4.2790707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:40,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43312 samples/s/p 1:18:20 } +2024-07-25 23:54:43,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 60/ 1625], loss: 1.024, per_step_time: 1472ms, lr: 4.2751253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:43,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43346 samples/s/p 1:18:16 } +2024-07-25 23:54:46,801 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 62/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 4.2711836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:46,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43925 samples/s/p 1:18:08 } +2024-07-25 23:54:49,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 64/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 4.267245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:49,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43984 samples/s/p 1:18:05 } +2024-07-25 23:54:52,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 66/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 4.263304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:52,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43287 samples/s/p 1:18:08 } +2024-07-25 23:54:55,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 68/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 4.2593706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:55,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43105 samples/s/p 1:18:07 } +2024-07-25 23:54:58,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 70/ 1625], loss: 1.109, per_step_time: 1473ms, lr: 4.2554357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:58,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43001 samples/s/p 1:18:05 } +2024-07-25 23:55:01,559 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 72/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 4.2515017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:01,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43388 samples/s/p 1:17:58 } +2024-07-25 23:55:04,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 74/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 4.2475735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:04,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43657 samples/s/p 1:17:53 } +2024-07-25 23:55:07,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 76/ 1625], loss: 1.153, per_step_time: 1470ms, lr: 4.2436454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:07,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.44036 samples/s/p 1:17:47 } +2024-07-25 23:55:10,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 78/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 4.2397182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:10,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43860 samples/s/p 1:17:45 } +2024-07-25 23:55:13,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 80/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 4.235796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:13,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43455 samples/s/p 1:17:46 } +2024-07-25 23:55:16,307 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 82/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 4.231874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:16,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43759 samples/s/p 1:17:40 } +2024-07-25 23:55:19,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 84/ 1625], loss: 1.051, per_step_time: 1473ms, lr: 4.2279544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:19,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.42878 samples/s/p 1:17:45 } +2024-07-25 23:55:22,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 86/ 1625], loss: 1.093, per_step_time: 1478ms, lr: 4.2240367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:22,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.41252 samples/s/p 1:17:56 } +2024-07-25 23:55:25,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 88/ 1625], loss: 1.113, per_step_time: 1473ms, lr: 4.220122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:25,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.42860 samples/s/p 1:17:39 } +2024-07-25 23:55:28,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 90/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 4.2162083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:28,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43165 samples/s/p 1:17:34 } +2024-07-25 23:55:31,084 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 92/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 4.2122965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:31,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43123 samples/s/p 1:17:31 } +2024-07-25 23:55:34,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 94/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 4.2083875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:34,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43562 samples/s/p 1:17:24 } +2024-07-25 23:55:36,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 96/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 4.2044812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:36,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43558 samples/s/p 1:17:22 } +2024-07-25 23:55:39,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 98/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 4.2005754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:39,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43579 samples/s/p 1:17:18 } +2024-07-25 23:55:42,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 100/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 4.1966723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:42,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43769 samples/s/p 1:17:14 } +2024-07-25 23:55:45,836 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 102/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 4.192771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:45,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43302 samples/s/p 1:17:15 } +2024-07-25 23:55:48,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 104/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 4.1888734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:48,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43196 samples/s/p 1:17:13 } +2024-07-25 23:55:51,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 106/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 4.1849753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:51,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43651 samples/s/p 1:17:06 } +2024-07-25 23:55:54,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 108/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 4.181081e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:54,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43314 samples/s/p 1:17:06 } +2024-07-25 23:55:57,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 110/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 4.177189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:57,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43292 samples/s/p 1:17:03 } +2024-07-25 23:56:00,596 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 112/ 1625], loss: 1.520, per_step_time: 1473ms, lr: 4.1733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:00,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43060 samples/s/p 1:17:02 } +2024-07-25 23:56:03,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 114/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 4.1694116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:03,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43537 samples/s/p 1:16:55 } +2024-07-25 23:56:06,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 116/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 4.1655235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:06,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.44042 samples/s/p 1:16:48 } +2024-07-25 23:56:09,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 118/ 1625], loss: 1.146, per_step_time: 1470ms, lr: 4.1616418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:09,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43865 samples/s/p 1:16:47 } +2024-07-25 23:56:12,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 120/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 4.1577587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:12,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43120 samples/s/p 1:16:50 } +2024-07-25 23:56:15,343 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 122/ 1625], loss: 1.139, per_step_time: 1469ms, lr: 4.15388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:15,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.44486 samples/s/p 1:16:35 } +2024-07-25 23:56:18,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 124/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 4.150001e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:18,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.42804 samples/s/p 1:16:47 } +2024-07-25 23:56:21,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 126/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 4.146126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:21,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.43502 samples/s/p 1:16:38 } +2024-07-25 23:56:24,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 128/ 1625], loss: 0.937, per_step_time: 1473ms, lr: 4.1422522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:24,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.42880 samples/s/p 1:16:40 } +2024-07-25 23:56:27,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 130/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 4.13838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:27,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.44070 samples/s/p 1:16:27 } +2024-07-25 23:56:30,100 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 132/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 4.134511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:30,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.43752 samples/s/p 1:16:27 } +2024-07-25 23:56:33,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 134/ 1625], loss: 1.021, per_step_time: 1470ms, lr: 4.1306434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:33,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.44023 samples/s/p 1:16:22 } +2024-07-25 23:56:35,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 136/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 4.126778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:35,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.43615 samples/s/p 1:16:22 } +2024-07-25 23:56:38,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 138/ 1625], loss: 1.129, per_step_time: 1473ms, lr: 4.122915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:38,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.42930 samples/s/p 1:16:25 } +2024-07-25 23:56:41,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 140/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 4.1190533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:41,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43976 samples/s/p 1:16:13 } +2024-07-25 23:56:44,865 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 142/ 1625], loss: 1.094, per_step_time: 1478ms, lr: 4.1151943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:44,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.41168 samples/s/p 1:16:34 } +2024-07-25 23:56:47,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 144/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 4.111337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:47,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43741 samples/s/p 1:16:09 } +2024-07-25 23:56:50,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 146/ 1625], loss: 1.277, per_step_time: 1473ms, lr: 4.1074827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:50,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43038 samples/s/p 1:16:12 } +2024-07-25 23:56:53,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 148/ 1625], loss: 1.280, per_step_time: 1476ms, lr: 4.1036305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:53,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.41980 samples/s/p 1:16:18 } +2024-07-25 23:56:56,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 150/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 4.099782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:56,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43455 samples/s/p 1:16:03 } +2024-07-25 23:56:59,626 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 152/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 4.0959317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:59,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43874 samples/s/p 1:15:56 } +2024-07-25 23:57:02,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 154/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 4.092085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:02,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43012 samples/s/p 1:16:01 } +2024-07-25 23:57:05,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 156/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 4.0882423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:05,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43425 samples/s/p 1:15:54 } +2024-07-25 23:57:08,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 158/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 4.084398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:08,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43940 samples/s/p 1:15:47 } +2024-07-25 23:57:11,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 160/ 1625], loss: 1.077, per_step_time: 1473ms, lr: 4.080558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:11,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43106 samples/s/p 1:15:51 } +2024-07-25 23:57:14,383 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 162/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 4.076722e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:14,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43613 samples/s/p 1:15:44 } +2024-07-25 23:57:17,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 164/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 4.072886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:17,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43405 samples/s/p 1:15:43 } +2024-07-25 23:57:20,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 166/ 1625], loss: 0.903, per_step_time: 1471ms, lr: 4.069052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:20,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43777 samples/s/p 1:15:37 } +2024-07-25 23:57:23,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 168/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 4.0652208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:23,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43655 samples/s/p 1:15:35 } +2024-07-25 23:57:26,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 170/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 4.0613913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:26,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43558 samples/s/p 1:15:33 } +2024-07-25 23:57:29,134 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 172/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 4.0575633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:29,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43608 samples/s/p 1:15:29 } +2024-07-25 23:57:32,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 174/ 1625], loss: 1.329, per_step_time: 1482ms, lr: 4.0537384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:32,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.39578 samples/s/p 1:16:00 } +2024-07-25 23:57:35,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 176/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 4.0499153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:35,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.44169 samples/s/p 1:15:19 } +2024-07-25 23:57:38,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 178/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 4.0460936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:38,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43767 samples/s/p 1:15:19 } +2024-07-25 23:57:40,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 180/ 1625], loss: 0.991, per_step_time: 1471ms, lr: 4.0422756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:40,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43537 samples/s/p 1:15:18 } +2024-07-25 23:57:43,904 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 182/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 4.038459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:43,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43624 samples/s/p 1:15:14 } +2024-07-25 23:57:46,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 184/ 1625], loss: 1.053, per_step_time: 1472ms, lr: 4.034644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:46,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43287 samples/s/p 1:15:14 } +2024-07-25 23:57:49,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 186/ 1625], loss: 1.000, per_step_time: 1472ms, lr: 4.030831e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:49,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43363 samples/s/p 1:15:11 } +2024-07-25 23:57:52,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 188/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 4.027021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:52,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43969 samples/s/p 1:15:03 } +2024-07-25 23:57:55,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 190/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 4.023212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:55,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43535 samples/s/p 1:15:03 } +2024-07-25 23:57:58,665 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 192/ 1625], loss: 1.094, per_step_time: 1475ms, lr: 4.019406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:58,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.42105 samples/s/p 1:15:12 } +2024-07-25 23:58:01,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 194/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 4.015604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:01,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43290 samples/s/p 1:14:59 } +2024-07-25 23:58:04,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 196/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 4.0118007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:04,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43752 samples/s/p 1:14:53 } +2024-07-25 23:58:07,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 198/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 4.0080004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:07,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43709 samples/s/p 1:14:50 } +2024-07-25 23:58:10,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 200/ 1625], loss: 1.201, per_step_time: 1471ms, lr: 4.0042046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:10,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43630 samples/s/p 1:14:48 } +2024-07-25 23:58:13,417 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 202/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 4.000406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:13,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43630 samples/s/p 1:14:45 } +2024-07-25 23:58:16,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 204/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 3.9966126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:16,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43451 samples/s/p 1:14:43 } +2024-07-25 23:58:19,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 206/ 1625], loss: 1.207, per_step_time: 1470ms, lr: 3.9928236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:19,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.44169 samples/s/p 1:14:35 } +2024-07-25 23:58:22,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 208/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 3.9890315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:22,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43339 samples/s/p 1:14:38 } +2024-07-25 23:58:25,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 210/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 3.9852466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:25,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43433 samples/s/p 1:14:35 } +2024-07-25 23:58:28,171 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 212/ 1625], loss: 1.047, per_step_time: 1472ms, lr: 3.9814613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:28,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43345 samples/s/p 1:14:33 } +2024-07-25 23:58:31,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 214/ 1625], loss: 1.071, per_step_time: 1470ms, lr: 3.977679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:31,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43916 samples/s/p 1:14:25 } +2024-07-25 23:58:34,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 216/ 1625], loss: 1.060, per_step_time: 1471ms, lr: 3.973899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:34,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43818 samples/s/p 1:14:23 } +2024-07-25 23:58:37,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 218/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 3.9701185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:37,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43299 samples/s/p 1:14:24 } +2024-07-25 23:58:39,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 220/ 1625], loss: 1.015, per_step_time: 1472ms, lr: 3.9663437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:39,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.43325 samples/s/p 1:14:21 } +2024-07-25 23:58:42,923 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 222/ 1625], loss: 1.308, per_step_time: 1471ms, lr: 3.9625684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:42,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.43551 samples/s/p 1:14:16 } +2024-07-25 23:58:45,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 224/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 3.958796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:45,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.43638 samples/s/p 1:14:12 } +2024-07-25 23:58:48,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 226/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 3.955026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:48,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.43955 samples/s/p 1:14:07 } +2024-07-25 23:58:51,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 228/ 1625], loss: 1.006, per_step_time: 1471ms, lr: 3.951258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:51,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.43593 samples/s/p 1:14:07 } +2024-07-25 23:58:54,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 230/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 3.947492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:54,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.44217 samples/s/p 1:13:59 } +2024-07-25 23:58:57,666 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 232/ 1625], loss: 1.048, per_step_time: 1470ms, lr: 3.943728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:57,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.44105 samples/s/p 1:13:57 } +2024-07-25 23:59:00,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 234/ 1625], loss: 1.132, per_step_time: 1469ms, lr: 3.939966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:00,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.44325 samples/s/p 1:13:52 } +2024-07-25 23:59:03,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 236/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 3.936207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:03,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.44085 samples/s/p 1:13:51 } +2024-07-25 23:59:06,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 238/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 3.9324523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:06,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43420 samples/s/p 1:13:54 } +2024-07-25 23:59:09,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 240/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 3.928695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:09,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43407 samples/s/p 1:13:51 } +2024-07-25 23:59:12,414 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 242/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 3.9249417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:12,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43328 samples/s/p 1:13:48 } +2024-07-25 23:59:15,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 244/ 1625], loss: 0.906, per_step_time: 1471ms, lr: 3.9211923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:15,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43783 samples/s/p 1:13:42 } +2024-07-25 23:59:18,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 246/ 1625], loss: 1.091, per_step_time: 1473ms, lr: 3.9174415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:18,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43043 samples/s/p 1:13:45 } +2024-07-25 23:59:21,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 248/ 1625], loss: 1.137, per_step_time: 1482ms, lr: 3.913695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:21,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.39769 samples/s/p 1:14:09 } +2024-07-25 23:59:24,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 250/ 1625], loss: 1.101, per_step_time: 1473ms, lr: 3.9099527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:24,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.42761 samples/s/p 1:13:41 } +2024-07-25 23:59:27,185 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 252/ 1625], loss: 1.115, per_step_time: 1467ms, lr: 3.906208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:27,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.45037 samples/s/p 1:13:20 } +2024-07-25 23:59:30,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 254/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 3.90247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:30,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43633 samples/s/p 1:13:28 } +2024-07-25 23:59:33,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 256/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 3.898732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:33,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43765 samples/s/p 1:13:24 } +2024-07-25 23:59:36,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 258/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 3.894994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:36,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43608 samples/s/p 1:13:23 } +2024-07-25 23:59:38,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 260/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 3.891262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:38,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43910 samples/s/p 1:13:17 } +2024-07-25 23:59:41,934 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 262/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 3.88753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:41,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43692 samples/s/p 1:13:16 } +2024-07-25 23:59:44,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 264/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 3.8838007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:44,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43430 samples/s/p 1:13:15 } +2024-07-25 23:59:47,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 266/ 1625], loss: 0.961, per_step_time: 1471ms, lr: 3.880073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:47,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43777 samples/s/p 1:13:10 } +2024-07-25 23:59:50,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 268/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 3.8763483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:50,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43132 samples/s/p 1:13:12 } +2024-07-25 23:59:53,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 270/ 1625], loss: 0.994, per_step_time: 1471ms, lr: 3.872625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:53,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43789 samples/s/p 1:13:04 } +2024-07-25 23:59:56,690 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 272/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 3.868904e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:56,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43051 samples/s/p 1:13:07 } +2024-07-25 23:59:59,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 274/ 1625], loss: 1.012, per_step_time: 1472ms, lr: 3.865185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:59,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43453 samples/s/p 1:13:00 } +2024-07-26 00:00:02,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 276/ 1625], loss: 1.265, per_step_time: 1473ms, lr: 3.861469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:02,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.42965 samples/s/p 1:13:01 } +2024-07-26 00:00:05,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 278/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 3.8577537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:05,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.44146 samples/s/p 1:12:49 } +2024-07-26 00:00:08,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 280/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 3.8540416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:08,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43708 samples/s/p 1:12:49 } +2024-07-26 00:00:11,441 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 282/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 3.8503335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:11,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43939 samples/s/p 1:12:45 } +2024-07-26 00:00:14,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 284/ 1625], loss: 1.117, per_step_time: 1473ms, lr: 3.8466233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:14,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.42991 samples/s/p 1:12:49 } +2024-07-26 00:00:17,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 286/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 3.8429175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:17,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43204 samples/s/p 1:12:45 } +2024-07-26 00:00:20,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 288/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 3.839216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:20,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43103 samples/s/p 1:12:43 } +2024-07-26 00:00:23,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 290/ 1625], loss: 0.970, per_step_time: 1473ms, lr: 3.8355124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:23,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43064 samples/s/p 1:12:40 } +2024-07-26 00:00:26,201 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 292/ 1625], loss: 1.233, per_step_time: 1469ms, lr: 3.8318144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:26,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.44305 samples/s/p 1:12:27 } +2024-07-26 00:00:29,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 294/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 3.828117e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:29,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43117 samples/s/p 1:12:34 } +2024-07-26 00:00:32,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 296/ 1625], loss: 1.280, per_step_time: 1472ms, lr: 3.8244198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:32,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43304 samples/s/p 1:12:29 } +2024-07-26 00:00:35,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 298/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 3.820728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:35,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43774 samples/s/p 1:12:22 } +2024-07-26 00:00:38,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 300/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 3.817038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:38,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43429 samples/s/p 1:12:22 } +2024-07-26 00:00:40,957 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 302/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 3.8133467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:40,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43632 samples/s/p 1:12:18 } +2024-07-26 00:00:43,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 304/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 3.8096632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:43,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43294 samples/s/p 1:12:17 } +2024-07-26 00:00:46,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 306/ 1625], loss: 1.247, per_step_time: 1475ms, lr: 3.8059788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:46,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.42195 samples/s/p 1:12:23 } +2024-07-26 00:00:49,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 308/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 3.802295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:49,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43482 samples/s/p 1:12:10 } +2024-07-26 00:00:52,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 310/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 3.798616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:52,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43470 samples/s/p 1:12:07 } +2024-07-26 00:00:55,728 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 312/ 1625], loss: 1.136, per_step_time: 1475ms, lr: 3.7949385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:55,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.42201 samples/s/p 1:12:14 } +2024-07-26 00:00:58,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 314/ 1625], loss: 1.327, per_step_time: 1473ms, lr: 3.7912619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:58,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.42992 samples/s/p 1:12:05 } +2024-07-26 00:01:01,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 316/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 3.7875889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:01,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43513 samples/s/p 1:11:58 } +2024-07-26 00:01:04,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 318/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 3.7839172e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:04,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.43184 samples/s/p 1:11:58 } +2024-07-26 00:01:07,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 320/ 1625], loss: 1.129, per_step_time: 1470ms, lr: 3.7802492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:07,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.44036 samples/s/p 1:11:48 } +2024-07-26 00:01:10,483 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 322/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 3.7765808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:10,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.43959 samples/s/p 1:11:46 } +2024-07-26 00:01:13,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 324/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 3.772916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:13,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.43608 samples/s/p 1:11:46 } +2024-07-26 00:01:16,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 326/ 1625], loss: 1.304, per_step_time: 1470ms, lr: 3.7692557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:16,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.44036 samples/s/p 1:11:39 } +2024-07-26 00:01:19,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 328/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 3.7655932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:19,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.43479 samples/s/p 1:11:41 } +2024-07-26 00:01:22,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 330/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 3.7619338e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:22,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.44013 samples/s/p 1:11:34 } +2024-07-26 00:01:25,233 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 332/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 3.75828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:25,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.43174 samples/s/p 1:11:37 } +2024-07-26 00:01:28,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 334/ 1625], loss: 1.120, per_step_time: 1470ms, lr: 3.7546238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:28,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.44146 samples/s/p 1:11:27 } +2024-07-26 00:01:31,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 336/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 3.750974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:31,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.44036 samples/s/p 1:11:25 } +2024-07-26 00:01:34,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 338/ 1625], loss: 1.289, per_step_time: 1472ms, lr: 3.7473242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:34,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43447 samples/s/p 1:11:26 } +2024-07-26 00:01:37,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 340/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 3.7436744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:37,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43414 samples/s/p 1:11:24 } +2024-07-26 00:01:39,982 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 342/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 3.740031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:39,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43577 samples/s/p 1:11:19 } +2024-07-26 00:01:42,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 344/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 3.736388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:42,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43255 samples/s/p 1:11:19 } +2024-07-26 00:01:45,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 346/ 1625], loss: 0.863, per_step_time: 1471ms, lr: 3.732745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:45,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43507 samples/s/p 1:11:14 } +2024-07-26 00:01:48,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 348/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 3.7291084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:48,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43753 samples/s/p 1:11:09 } +2024-07-26 00:01:51,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 350/ 1625], loss: 1.044, per_step_time: 1473ms, lr: 3.7254713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:51,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.42955 samples/s/p 1:11:12 } +2024-07-26 00:01:54,740 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 352/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 3.721836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:54,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.43501 samples/s/p 1:11:05 } +2024-07-26 00:01:57,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 354/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 3.7182035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:57,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.43164 samples/s/p 1:11:05 } +2024-07-26 00:02:00,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 356/ 1625], loss: 1.363, per_step_time: 1475ms, lr: 3.7145737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:00,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.42222 samples/s/p 1:11:09 } +2024-07-26 00:02:03,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 358/ 1625], loss: 1.143, per_step_time: 1473ms, lr: 3.7109462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:03,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.42783 samples/s/p 1:11:02 } +2024-07-26 00:02:06,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 360/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 3.70732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:06,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.43804 samples/s/p 1:10:51 } +2024-07-26 00:02:09,504 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 362/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 3.7036962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:09,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.43612 samples/s/p 1:10:50 } +2024-07-26 00:02:12,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 364/ 1625], loss: 1.313, per_step_time: 1475ms, lr: 3.7000773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:12,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.42370 samples/s/p 1:10:56 } +2024-07-26 00:02:15,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 366/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 3.6964552e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:15,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.43744 samples/s/p 1:10:43 } +2024-07-26 00:02:18,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 368/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 3.6928382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:18,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.43374 samples/s/p 1:10:43 } +2024-07-26 00:02:21,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 370/ 1625], loss: 1.399, per_step_time: 1474ms, lr: 3.6892257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:21,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.42720 samples/s/p 1:10:45 } +2024-07-26 00:02:24,272 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 372/ 1625], loss: 1.125, per_step_time: 1473ms, lr: 3.6856104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:24,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.42815 samples/s/p 1:10:41 } +2024-07-26 00:02:27,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 374/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 3.6819997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:27,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.43600 samples/s/p 1:10:32 } +2024-07-26 00:02:30,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 376/ 1625], loss: 1.207, per_step_time: 1473ms, lr: 3.678394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:30,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.43073 samples/s/p 1:10:33 } +2024-07-26 00:02:33,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 378/ 1625], loss: 1.106, per_step_time: 1473ms, lr: 3.6747856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:33,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.42873 samples/s/p 1:10:32 } +2024-07-26 00:02:36,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 380/ 1625], loss: 1.104, per_step_time: 1474ms, lr: 3.671183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:36,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.42579 samples/s/p 1:10:31 } +2024-07-26 00:02:39,037 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 382/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 3.667582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:39,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43334 samples/s/p 1:10:22 } +2024-07-26 00:02:41,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 384/ 1625], loss: 1.105, per_step_time: 1474ms, lr: 3.6639794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:41,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.42408 samples/s/p 1:10:27 } +2024-07-26 00:02:44,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 386/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 3.6603833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:44,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43354 samples/s/p 1:10:16 } +2024-07-26 00:02:47,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 388/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 3.656788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:47,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43321 samples/s/p 1:10:14 } +2024-07-26 00:02:50,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 390/ 1625], loss: 1.160, per_step_time: 1473ms, lr: 3.6531942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:50,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43032 samples/s/p 1:10:13 } +2024-07-26 00:02:53,801 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 392/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 3.6496049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:53,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43678 samples/s/p 1:10:05 } +2024-07-26 00:02:56,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 394/ 1625], loss: 0.928, per_step_time: 1473ms, lr: 3.6460156e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:56,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.42780 samples/s/p 1:10:09 } +2024-07-26 00:02:59,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 396/ 1625], loss: 1.022, per_step_time: 1472ms, lr: 3.642429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:59,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43386 samples/s/p 1:10:01 } +2024-07-26 00:03:02,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 398/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 3.638845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:02,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43822 samples/s/p 1:09:55 } +2024-07-26 00:03:05,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 400/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 3.6352626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:05,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43728 samples/s/p 1:09:53 } +2024-07-26 00:03:08,559 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 402/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 3.6316828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:08,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43237 samples/s/p 1:09:54 } +2024-07-26 00:03:11,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 404/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 3.6281049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:11,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43428 samples/s/p 1:09:49 } +2024-07-26 00:03:14,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 406/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 3.6245292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:14,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43093 samples/s/p 1:09:49 } +2024-07-26 00:03:17,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 408/ 1625], loss: 1.059, per_step_time: 1473ms, lr: 3.6209553e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:17,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43108 samples/s/p 1:09:46 } +2024-07-26 00:03:20,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 410/ 1625], loss: 1.160, per_step_time: 1473ms, lr: 3.6173842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:20,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.42849 samples/s/p 1:09:45 } +2024-07-26 00:03:23,323 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 412/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 3.613815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:23,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43177 samples/s/p 1:09:39 } +2024-07-26 00:03:26,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 414/ 1625], loss: 1.053, per_step_time: 1472ms, lr: 3.6102506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:26,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43209 samples/s/p 1:09:36 } +2024-07-26 00:03:29,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 416/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 3.606684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:29,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43209 samples/s/p 1:09:33 } +2024-07-26 00:03:32,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 418/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 3.6031215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:32,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43274 samples/s/p 1:09:30 } +2024-07-26 00:03:35,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 420/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 3.5995631e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:35,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43253 samples/s/p 1:09:27 } +2024-07-26 00:03:38,083 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 422/ 1625], loss: 1.059, per_step_time: 1471ms, lr: 3.5960024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:38,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43550 samples/s/p 1:09:22 } +2024-07-26 00:03:41,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 424/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 3.5924495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:41,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43467 samples/s/p 1:09:19 } +2024-07-26 00:03:43,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 426/ 1625], loss: 1.199, per_step_time: 1473ms, lr: 3.5888947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:43,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43098 samples/s/p 1:09:19 } +2024-07-26 00:03:46,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 428/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 3.5853418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:46,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43550 samples/s/p 1:09:13 } +2024-07-26 00:03:49,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 430/ 1625], loss: 1.095, per_step_time: 1473ms, lr: 3.5817948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:49,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43005 samples/s/p 1:09:14 } +2024-07-26 00:03:52,841 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 432/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 3.5782468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:52,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43763 samples/s/p 1:09:05 } +2024-07-26 00:03:55,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 434/ 1625], loss: 1.134, per_step_time: 1473ms, lr: 3.5747025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:55,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.42981 samples/s/p 1:09:08 } +2024-07-26 00:03:58,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 436/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 3.57116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:58,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43454 samples/s/p 1:09:02 } +2024-07-26 00:04:01,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 438/ 1625], loss: 1.138, per_step_time: 1474ms, lr: 3.567619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:01,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.42531 samples/s/p 1:09:06 } +2024-07-26 00:04:04,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 440/ 1625], loss: 0.942, per_step_time: 1471ms, lr: 3.5640805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:04,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43838 samples/s/p 1:08:53 } +2024-07-26 00:04:07,604 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 442/ 1625], loss: 1.173, per_step_time: 1473ms, lr: 3.5605449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:07,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43077 samples/s/p 1:08:56 } +2024-07-26 00:04:10,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 444/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 3.557011e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:10,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43365 samples/s/p 1:08:51 } +2024-07-26 00:04:13,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 446/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 3.5534795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:13,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43113 samples/s/p 1:08:50 } +2024-07-26 00:04:16,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 448/ 1625], loss: 1.162, per_step_time: 1485ms, lr: 3.5499497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:16,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.38433 samples/s/p 1:09:23 } +2024-07-26 00:04:19,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 450/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 3.5464218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:19,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43569 samples/s/p 1:08:40 } +2024-07-26 00:04:22,389 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 452/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 3.5428975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:22,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43462 samples/s/p 1:08:38 } +2024-07-26 00:04:25,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 454/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 3.5393746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:25,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43629 samples/s/p 1:08:34 } +2024-07-26 00:04:28,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 456/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 3.5358544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:28,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43632 samples/s/p 1:08:31 } +2024-07-26 00:04:31,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 458/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 3.532336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:31,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43380 samples/s/p 1:08:30 } +2024-07-26 00:04:34,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 460/ 1625], loss: 1.344, per_step_time: 1476ms, lr: 3.5288194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:34,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.41839 samples/s/p 1:08:39 } +2024-07-26 00:04:37,152 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 462/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 3.525307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:37,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43307 samples/s/p 1:08:25 } +2024-07-26 00:04:40,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 464/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 3.5217954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:40,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43259 samples/s/p 1:08:22 } +2024-07-26 00:04:43,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 466/ 1625], loss: 1.228, per_step_time: 1475ms, lr: 3.5182838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:43,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.42353 samples/s/p 1:08:26 } +2024-07-26 00:04:46,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 468/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 3.5147787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:46,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43773 samples/s/p 1:08:12 } +2024-07-26 00:04:48,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 470/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 3.511273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:48,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43871 samples/s/p 1:08:09 } +2024-07-26 00:04:51,906 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 472/ 1625], loss: 1.018, per_step_time: 1469ms, lr: 3.5077683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:51,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.44230 samples/s/p 1:08:03 } +2024-07-26 00:04:54,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 474/ 1625], loss: 1.285, per_step_time: 1469ms, lr: 3.50427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:54,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.44390 samples/s/p 1:07:59 } +2024-07-26 00:04:57,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 476/ 1625], loss: 1.278, per_step_time: 1470ms, lr: 3.5007715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:57,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43873 samples/s/p 1:08:00 } +2024-07-26 00:05:00,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 478/ 1625], loss: 1.040, per_step_time: 1472ms, lr: 3.4972754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:00,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43140 samples/s/p 1:08:02 } +2024-07-26 00:05:03,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 480/ 1625], loss: 0.944, per_step_time: 1471ms, lr: 3.4937802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:03,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43594 samples/s/p 1:07:56 } +2024-07-26 00:05:06,653 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 482/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 3.4902887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:06,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.44008 samples/s/p 1:07:50 } +2024-07-26 00:05:09,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 484/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 3.4867994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:09,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43822 samples/s/p 1:07:48 } +2024-07-26 00:05:12,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 486/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 3.4833124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:12,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43439 samples/s/p 1:07:48 } +2024-07-26 00:05:15,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 488/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 3.4798268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:15,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43356 samples/s/p 1:07:46 } +2024-07-26 00:05:18,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 490/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 3.4763439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:18,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43454 samples/s/p 1:07:42 } +2024-07-26 00:05:21,410 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 492/ 1625], loss: 1.010, per_step_time: 1472ms, lr: 3.4728632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:21,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43139 samples/s/p 1:07:42 } +2024-07-26 00:05:24,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 494/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 3.4693844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:24,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43659 samples/s/p 1:07:35 } +2024-07-26 00:05:27,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 496/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 3.4659074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:27,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43493 samples/s/p 1:07:33 } +2024-07-26 00:05:30,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 498/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 3.4624331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:30,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43129 samples/s/p 1:07:33 } +2024-07-26 00:05:33,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 500/ 1625], loss: 1.072, per_step_time: 1470ms, lr: 3.4589616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:33,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43930 samples/s/p 1:07:24 } +2024-07-26 00:05:36,166 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 502/ 1625], loss: 1.184, per_step_time: 1473ms, lr: 3.4554914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:36,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43028 samples/s/p 1:07:28 } +2024-07-26 00:05:39,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 504/ 1625], loss: 1.095, per_step_time: 1474ms, lr: 3.452024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:39,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.42615 samples/s/p 1:07:28 } +2024-07-26 00:05:42,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 506/ 1625], loss: 1.169, per_step_time: 1472ms, lr: 3.448562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:42,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43414 samples/s/p 1:07:19 } +2024-07-26 00:05:45,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 508/ 1625], loss: 1.050, per_step_time: 1473ms, lr: 3.4450968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:45,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43039 samples/s/p 1:07:19 } +2024-07-26 00:05:47,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 510/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 3.4416348e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:47,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43203 samples/s/p 1:07:15 } +2024-07-26 00:05:50,933 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 512/ 1625], loss: 1.109, per_step_time: 1473ms, lr: 3.4381792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:50,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.42962 samples/s/p 1:07:14 } +2024-07-26 00:05:53,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 514/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 3.4347222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:53,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43365 samples/s/p 1:07:08 } +2024-07-26 00:05:56,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 516/ 1625], loss: 1.178, per_step_time: 1474ms, lr: 3.431267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:56,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.42499 samples/s/p 1:07:11 } +2024-07-26 00:05:59,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 518/ 1625], loss: 1.259, per_step_time: 1473ms, lr: 3.4278169e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:59,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.42819 samples/s/p 1:07:06 } +2024-07-26 00:06:02,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 520/ 1625], loss: 1.023, per_step_time: 1472ms, lr: 3.4243667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:02,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43361 samples/s/p 1:06:59 } +2024-07-26 00:06:05,698 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 522/ 1625], loss: 1.001, per_step_time: 1471ms, lr: 3.4209197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:05,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43518 samples/s/p 1:06:55 } +2024-07-26 00:06:08,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 524/ 1625], loss: 0.867, per_step_time: 1471ms, lr: 3.417474e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:08,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43523 samples/s/p 1:06:52 } +2024-07-26 00:06:11,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 526/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 3.4140307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:11,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43781 samples/s/p 1:06:47 } +2024-07-26 00:06:14,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 528/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 3.4105901e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:14,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43620 samples/s/p 1:06:45 } +2024-07-26 00:06:17,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 530/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 3.4071522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:17,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43670 samples/s/p 1:06:42 } +2024-07-26 00:06:20,449 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 532/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 3.4037148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:20,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43564 samples/s/p 1:06:40 } +2024-07-26 00:06:23,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 534/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 3.400282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:23,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43756 samples/s/p 1:06:35 } +2024-07-26 00:06:26,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 536/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 3.39685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:26,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43454 samples/s/p 1:06:35 } +2024-07-26 00:06:29,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 538/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 3.3934198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:29,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43764 samples/s/p 1:06:29 } +2024-07-26 00:06:32,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 540/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 3.3899928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:32,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43639 samples/s/p 1:06:27 } +2024-07-26 00:06:35,196 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 542/ 1625], loss: 1.121, per_step_time: 1469ms, lr: 3.386568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:35,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.44239 samples/s/p 1:06:20 } +2024-07-26 00:06:38,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 544/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 3.3831452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:38,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43556 samples/s/p 1:06:22 } +2024-07-26 00:06:41,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 546/ 1625], loss: 1.099, per_step_time: 1473ms, lr: 3.3797246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:41,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43031 samples/s/p 1:06:23 } +2024-07-26 00:06:44,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 548/ 1625], loss: 1.089, per_step_time: 1468ms, lr: 3.3763054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:44,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.44763 samples/s/p 1:06:07 } +2024-07-26 00:06:46,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 550/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 3.3728916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:46,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43362 samples/s/p 1:06:15 } +2024-07-26 00:06:49,948 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 552/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 3.369476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:49,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43180 samples/s/p 1:06:13 } +2024-07-26 00:06:52,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 554/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 3.366064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:52,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43752 samples/s/p 1:06:06 } +2024-07-26 00:06:55,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 556/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 3.3626561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:55,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43384 samples/s/p 1:06:06 } +2024-07-26 00:06:58,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 558/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 3.3592482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:58,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43188 samples/s/p 1:06:04 } +2024-07-26 00:07:01,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 560/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 3.3558422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:01,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43874 samples/s/p 1:05:56 } +2024-07-26 00:07:04,703 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 562/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 3.3524425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:04,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43319 samples/s/p 1:05:57 } +2024-07-26 00:07:07,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 564/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 3.3490414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:07,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43287 samples/s/p 1:05:55 } +2024-07-26 00:07:10,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 566/ 1625], loss: 1.083, per_step_time: 1473ms, lr: 3.345643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:10,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.42817 samples/s/p 1:05:55 } +2024-07-26 00:07:13,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 568/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 3.3422466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:13,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43394 samples/s/p 1:05:48 } +2024-07-26 00:07:16,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 570/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 3.3388533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:16,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.44026 samples/s/p 1:05:40 } +2024-07-26 00:07:19,461 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 572/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 3.3354622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:19,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43368 samples/s/p 1:05:42 } +2024-07-26 00:07:22,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 574/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 3.3320725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:22,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43555 samples/s/p 1:05:38 } +2024-07-26 00:07:25,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 576/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 3.3286851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:25,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43232 samples/s/p 1:05:37 } +2024-07-26 00:07:28,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 578/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 3.325301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:28,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43532 samples/s/p 1:05:32 } +2024-07-26 00:07:31,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 580/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 3.321918e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:31,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43318 samples/s/p 1:05:31 } +2024-07-26 00:07:34,221 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 582/ 1625], loss: 1.174, per_step_time: 1473ms, lr: 3.318538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:34,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.42995 samples/s/p 1:05:30 } +2024-07-26 00:07:37,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 584/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 3.3151605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:37,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43152 samples/s/p 1:05:26 } +2024-07-26 00:07:40,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 586/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 3.3117835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:40,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43411 samples/s/p 1:05:21 } +2024-07-26 00:07:43,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 588/ 1625], loss: 1.052, per_step_time: 1471ms, lr: 3.3084107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:43,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43708 samples/s/p 1:05:16 } +2024-07-26 00:07:46,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 590/ 1625], loss: 1.147, per_step_time: 1473ms, lr: 3.3050396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:46,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.42973 samples/s/p 1:05:19 } +2024-07-26 00:07:48,977 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 592/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 3.3016709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:48,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.44005 samples/s/p 1:05:08 } +2024-07-26 00:07:51,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 594/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 3.2983044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:51,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43466 samples/s/p 1:05:09 } +2024-07-26 00:07:54,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 596/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 3.2949383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:54,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43005 samples/s/p 1:05:10 } +2024-07-26 00:07:57,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 598/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 3.2915755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:57,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43550 samples/s/p 1:05:03 } +2024-07-26 00:08:00,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 600/ 1625], loss: 1.328, per_step_time: 1472ms, lr: 3.2882176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:00,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43201 samples/s/p 1:05:02 } +2024-07-26 00:08:03,732 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 602/ 1625], loss: 1.340, per_step_time: 1470ms, lr: 3.2848575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:03,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.44090 samples/s/p 1:04:53 } +2024-07-26 00:08:06,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 604/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 3.281505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:06,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43698 samples/s/p 1:04:53 } +2024-07-26 00:08:09,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 606/ 1625], loss: 1.069, per_step_time: 1473ms, lr: 3.2781509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:09,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.42745 samples/s/p 1:04:57 } +2024-07-26 00:08:12,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 608/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 3.274798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:12,589 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43264 samples/s/p 1:04:50 } +2024-07-26 00:08:15,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 610/ 1625], loss: 1.189, per_step_time: 1470ms, lr: 3.271452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:15,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43858 samples/s/p 1:04:43 } +2024-07-26 00:08:18,488 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 612/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 3.2681055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:18,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43693 samples/s/p 1:04:41 } +2024-07-26 00:08:21,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 614/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 3.2647613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:21,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43674 samples/s/p 1:04:38 } +2024-07-26 00:08:24,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 616/ 1625], loss: 1.279, per_step_time: 1472ms, lr: 3.2614184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:24,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43166 samples/s/p 1:04:39 } +2024-07-26 00:08:27,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 618/ 1625], loss: 1.291, per_step_time: 1470ms, lr: 3.2580788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:27,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43893 samples/s/p 1:04:31 } +2024-07-26 00:08:30,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 620/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 3.2547418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:30,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43716 samples/s/p 1:04:29 } +2024-07-26 00:08:33,239 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 622/ 1625], loss: 1.304, per_step_time: 1471ms, lr: 3.2514067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:33,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43799 samples/s/p 1:04:26 } +2024-07-26 00:08:36,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 624/ 1625], loss: 1.032, per_step_time: 1471ms, lr: 3.2480734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:36,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43719 samples/s/p 1:04:23 } +2024-07-26 00:08:39,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 626/ 1625], loss: 1.105, per_step_time: 1470ms, lr: 3.2447433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:39,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.44190 samples/s/p 1:04:17 } +2024-07-26 00:08:42,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 628/ 1625], loss: 1.020, per_step_time: 1470ms, lr: 3.241415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:42,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.43895 samples/s/p 1:04:16 } +2024-07-26 00:08:45,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 630/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 3.2380885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:45,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.43549 samples/s/p 1:04:16 } +2024-07-26 00:08:47,990 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 632/ 1625], loss: 1.199, per_step_time: 1473ms, lr: 3.2347662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:47,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.42748 samples/s/p 1:04:18 } +2024-07-26 00:08:50,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 634/ 1625], loss: 1.274, per_step_time: 1473ms, lr: 3.2314433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:50,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.42936 samples/s/p 1:04:14 } +2024-07-26 00:08:53,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 636/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 3.2281246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:53,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.43469 samples/s/p 1:04:07 } +2024-07-26 00:08:56,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 638/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 3.224808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:56,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.43571 samples/s/p 1:04:04 } +2024-07-26 00:08:59,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 640/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 3.221492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:59,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.42882 samples/s/p 1:04:06 } +2024-07-26 00:09:02,754 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 642/ 1625], loss: 1.075, per_step_time: 1473ms, lr: 3.2181792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:02,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.42957 samples/s/p 1:04:02 } +2024-07-26 00:09:05,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 644/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 3.214871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:05,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.43559 samples/s/p 1:03:55 } +2024-07-26 00:09:08,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 646/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 3.2115609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:08,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.43428 samples/s/p 1:03:53 } +2024-07-26 00:09:11,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 648/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 3.2082567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:11,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.43779 samples/s/p 1:03:48 } +2024-07-26 00:09:14,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 650/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 3.2049534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:14,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.43552 samples/s/p 1:03:46 } +2024-07-26 00:09:17,503 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 652/ 1625], loss: 1.200, per_step_time: 1469ms, lr: 3.20165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:17,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.44368 samples/s/p 1:03:38 } +2024-07-26 00:09:20,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 654/ 1625], loss: 1.020, per_step_time: 1471ms, lr: 3.1983536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:20,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.43751 samples/s/p 1:03:39 } +2024-07-26 00:09:23,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 656/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 3.1950567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:23,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.43203 samples/s/p 1:03:40 } +2024-07-26 00:09:26,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 658/ 1625], loss: 1.274, per_step_time: 1471ms, lr: 3.1917602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:26,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.43499 samples/s/p 1:03:35 } +2024-07-26 00:09:29,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 660/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 3.1884701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:29,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43400 samples/s/p 1:03:33 } +2024-07-26 00:09:32,257 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 662/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 3.1851805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:32,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43680 samples/s/p 1:03:28 } +2024-07-26 00:09:35,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 664/ 1625], loss: 0.933, per_step_time: 1478ms, lr: 3.1818931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:35,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.41056 samples/s/p 1:03:43 } +2024-07-26 00:09:38,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 666/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 3.1786071e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:38,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43346 samples/s/p 1:03:24 } +2024-07-26 00:09:41,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 668/ 1625], loss: 1.047, per_step_time: 1473ms, lr: 3.1753243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:41,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.42992 samples/s/p 1:03:24 } +2024-07-26 00:09:44,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 670/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 3.1720447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:44,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43159 samples/s/p 1:03:19 } +2024-07-26 00:09:47,037 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 672/ 1625], loss: 1.009, per_step_time: 1475ms, lr: 3.1687646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:47,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.42167 samples/s/p 1:03:23 } +2024-07-26 00:09:49,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 674/ 1625], loss: 1.014, per_step_time: 1472ms, lr: 3.1654881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:49,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43349 samples/s/p 1:03:12 } +2024-07-26 00:09:52,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 676/ 1625], loss: 1.079, per_step_time: 1473ms, lr: 3.1622171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:52,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.42987 samples/s/p 1:03:12 } +2024-07-26 00:09:55,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 678/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 3.1589434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:55,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43977 samples/s/p 1:03:02 } +2024-07-26 00:09:58,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 680/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 3.1556738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:58,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43681 samples/s/p 1:03:01 } +2024-07-26 00:10:01,792 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 682/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 3.1524087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:01,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43394 samples/s/p 1:03:00 } +2024-07-26 00:10:04,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 684/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 3.1491418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:04,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43546 samples/s/p 1:02:56 } +2024-07-26 00:10:07,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 686/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 3.1458799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:07,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43648 samples/s/p 1:02:53 } +2024-07-26 00:10:10,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 688/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 3.1426216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:10,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43398 samples/s/p 1:02:51 } +2024-07-26 00:10:13,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 690/ 1625], loss: 1.115, per_step_time: 1469ms, lr: 3.1393615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:13,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.44321 samples/s/p 1:02:42 } +2024-07-26 00:10:16,542 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 692/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 3.1361074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:16,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43651 samples/s/p 1:02:44 } +2024-07-26 00:10:19,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 694/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 3.1328536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:19,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43887 samples/s/p 1:02:39 } +2024-07-26 00:10:22,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 696/ 1625], loss: 1.155, per_step_time: 1473ms, lr: 3.1296004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:22,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.42923 samples/s/p 1:02:43 } +2024-07-26 00:10:25,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 698/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 3.1263544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:25,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43560 samples/s/p 1:02:35 } +2024-07-26 00:10:28,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 700/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 3.123107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:28,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43619 samples/s/p 1:02:32 } +2024-07-26 00:10:31,296 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 702/ 1625], loss: 1.047, per_step_time: 1472ms, lr: 3.119862e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:31,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43454 samples/s/p 1:02:30 } +2024-07-26 00:10:34,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 704/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 3.116621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:34,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43282 samples/s/p 1:02:29 } +2024-07-26 00:10:37,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 706/ 1625], loss: 1.163, per_step_time: 1473ms, lr: 3.1133818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:37,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43049 samples/s/p 1:02:27 } +2024-07-26 00:10:40,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 708/ 1625], loss: 1.261, per_step_time: 1470ms, lr: 3.110144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:40,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43980 samples/s/p 1:02:18 } +2024-07-26 00:10:43,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 710/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 3.106909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:43,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.44013 samples/s/p 1:02:15 } +2024-07-26 00:10:46,050 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 712/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 3.1036766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:46,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43272 samples/s/p 1:02:17 } +2024-07-26 00:10:49,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 714/ 1625], loss: 1.361, per_step_time: 1472ms, lr: 3.100446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:49,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43146 samples/s/p 1:02:15 } +2024-07-26 00:10:51,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 716/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 3.0972174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:51,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43189 samples/s/p 1:02:12 } +2024-07-26 00:10:54,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 718/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 3.093991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:54,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43474 samples/s/p 1:02:07 } +2024-07-26 00:10:57,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 720/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 3.090769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:57,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43726 samples/s/p 1:02:02 } +2024-07-26 00:11:00,812 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 722/ 1625], loss: 1.131, per_step_time: 1474ms, lr: 3.0875462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:00,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.42519 samples/s/p 1:02:07 } +2024-07-26 00:11:03,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 724/ 1625], loss: 1.065, per_step_time: 1472ms, lr: 3.0843275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:03,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43263 samples/s/p 1:01:59 } +2024-07-26 00:11:06,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 726/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 3.0811125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:06,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43669 samples/s/p 1:01:54 } +2024-07-26 00:11:09,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 728/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 3.0778956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:09,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43374 samples/s/p 1:01:53 } +2024-07-26 00:11:12,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 730/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 3.0746833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:12,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43556 samples/s/p 1:01:48 } +2024-07-26 00:11:15,572 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 732/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 3.071475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:15,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.42811 samples/s/p 1:01:51 } +2024-07-26 00:11:18,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 734/ 1625], loss: 1.249, per_step_time: 1474ms, lr: 3.0682659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:18,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.42514 samples/s/p 1:01:50 } +2024-07-26 00:11:21,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 736/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 3.0650622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:21,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.42976 samples/s/p 1:01:44 } +2024-07-26 00:11:24,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 738/ 1625], loss: 1.250, per_step_time: 1471ms, lr: 3.0618598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:24,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43605 samples/s/p 1:01:36 } +2024-07-26 00:11:27,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 740/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 3.058657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:27,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43686 samples/s/p 1:01:33 } +2024-07-26 00:11:30,332 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 742/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 3.0554602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:30,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43498 samples/s/p 1:01:31 } +2024-07-26 00:11:33,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 744/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 3.0522642e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:33,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43503 samples/s/p 1:01:28 } +2024-07-26 00:11:36,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 746/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 3.0490683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:36,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.42847 samples/s/p 1:01:30 } +2024-07-26 00:11:39,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 748/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 3.045879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:39,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43448 samples/s/p 1:01:23 } +2024-07-26 00:11:42,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 750/ 1625], loss: 1.126, per_step_time: 1473ms, lr: 3.042689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:42,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.42973 samples/s/p 1:01:23 } +2024-07-26 00:11:45,092 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 752/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 3.0395022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:45,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43748 samples/s/p 1:01:15 } +2024-07-26 00:11:48,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 754/ 1625], loss: 1.324, per_step_time: 1471ms, lr: 3.0363185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:48,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43510 samples/s/p 1:01:13 } +2024-07-26 00:11:50,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 756/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 3.0331362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:50,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.44184 samples/s/p 1:01:06 } +2024-07-26 00:11:53,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 758/ 1625], loss: 1.239, per_step_time: 1472ms, lr: 3.0299557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:53,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.43113 samples/s/p 1:01:10 } +2024-07-26 00:11:56,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 760/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 3.026778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:56,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.42898 samples/s/p 1:01:09 } +2024-07-26 00:11:59,849 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 762/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 3.0236024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:59,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.43314 samples/s/p 1:01:03 } +2024-07-26 00:12:02,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 764/ 1625], loss: 1.068, per_step_time: 1473ms, lr: 3.0204305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:02,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.42865 samples/s/p 1:01:03 } +2024-07-26 00:12:05,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 766/ 1625], loss: 1.281, per_step_time: 1470ms, lr: 3.0172578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:05,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.43871 samples/s/p 1:00:53 } +2024-07-26 00:12:08,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 768/ 1625], loss: 1.183, per_step_time: 1468ms, lr: 3.0140895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:08,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.44605 samples/s/p 1:00:45 } +2024-07-26 00:12:11,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 770/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 3.0109254e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:11,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.43303 samples/s/p 1:00:51 } +2024-07-26 00:12:14,596 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 772/ 1625], loss: 1.137, per_step_time: 1470ms, lr: 3.0077595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:14,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.44170 samples/s/p 1:00:42 } +2024-07-26 00:12:17,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 774/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 3.004599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:17,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43607 samples/s/p 1:00:43 } +2024-07-26 00:12:20,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 776/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 3.0014398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:20,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.44042 samples/s/p 1:00:37 } +2024-07-26 00:12:23,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 778/ 1625], loss: 1.340, per_step_time: 1472ms, lr: 2.9982812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:23,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43402 samples/s/p 1:00:39 } +2024-07-26 00:12:26,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 780/ 1625], loss: 1.123, per_step_time: 1470ms, lr: 2.9951293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:26,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.44054 samples/s/p 1:00:31 } +2024-07-26 00:12:29,345 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 782/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 2.9919756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:29,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43490 samples/s/p 1:00:32 } +2024-07-26 00:12:32,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 784/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 2.9888242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:32,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43411 samples/s/p 1:00:30 } +2024-07-26 00:12:35,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 786/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 2.9856783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:35,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43691 samples/s/p 1:00:25 } +2024-07-26 00:12:38,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 788/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 2.9825324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:38,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43370 samples/s/p 1:00:24 } +2024-07-26 00:12:41,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 790/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 2.9793891e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:41,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43262 samples/s/p 1:00:22 } +2024-07-26 00:12:44,099 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 792/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 2.9762482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:44,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43850 samples/s/p 1:00:15 } +2024-07-26 00:12:47,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 794/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.97311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:47,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43259 samples/s/p 1:00:16 } +2024-07-26 00:12:50,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 796/ 1625], loss: 1.261, per_step_time: 1473ms, lr: 2.9699736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:50,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.42888 samples/s/p 1:00:16 } +2024-07-26 00:12:52,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 798/ 1625], loss: 1.240, per_step_time: 1470ms, lr: 2.96684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:52,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.44176 samples/s/p 1:00:04 } +2024-07-26 00:12:55,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 800/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 2.9637085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:55,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43474 samples/s/p 1:00:06 } +2024-07-26 00:12:58,855 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 802/ 1625], loss: 1.042, per_step_time: 1472ms, lr: 2.960579e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:58,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43433 samples/s/p 1:00:03 } +2024-07-26 00:13:01,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 804/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.9574521e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:01,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43343 samples/s/p 1:00:01 } +2024-07-26 00:13:04,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 806/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 2.954328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:04,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.42774 samples/s/p 1:00:02 } +2024-07-26 00:13:07,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 808/ 1625], loss: 1.087, per_step_time: 1473ms, lr: 2.9512053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:07,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43064 samples/s/p 0:59:57 } +2024-07-26 00:13:10,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 810/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 2.9480843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:10,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.44164 samples/s/p 0:59:47 } +2024-07-26 00:13:13,613 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 812/ 1625], loss: 1.103, per_step_time: 1471ms, lr: 2.944967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:13,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43501 samples/s/p 0:59:48 } +2024-07-26 00:13:16,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 814/ 1625], loss: 1.246, per_step_time: 1473ms, lr: 2.941853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:16,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.42747 samples/s/p 0:59:50 } +2024-07-26 00:13:19,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 816/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.9387393e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:19,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43248 samples/s/p 0:59:44 } +2024-07-26 00:13:22,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 818/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 2.9356302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:22,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43307 samples/s/p 0:59:41 } +2024-07-26 00:13:25,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 820/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.9325206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:25,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43273 samples/s/p 0:59:38 } +2024-07-26 00:13:28,376 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 822/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.9294138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:28,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43317 samples/s/p 0:59:35 } +2024-07-26 00:13:31,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 824/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 2.926312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:31,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43240 samples/s/p 0:59:32 } +2024-07-26 00:13:34,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 826/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.9232092e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:34,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43385 samples/s/p 0:59:28 } +2024-07-26 00:13:37,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 828/ 1625], loss: 1.355, per_step_time: 1473ms, lr: 2.9201092e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:37,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43072 samples/s/p 0:59:27 } +2024-07-26 00:13:40,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 830/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 2.9170133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:40,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43326 samples/s/p 0:59:23 } +2024-07-26 00:13:43,136 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 832/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 2.91392e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:43,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43282 samples/s/p 0:59:20 } +2024-07-26 00:13:46,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 834/ 1625], loss: 1.292, per_step_time: 1471ms, lr: 2.9108269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:46,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43831 samples/s/p 0:59:14 } +2024-07-26 00:13:49,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 836/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 2.9077378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:49,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43957 samples/s/p 0:59:10 } +2024-07-26 00:13:51,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 838/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 2.9046491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:51,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43836 samples/s/p 0:59:08 } +2024-07-26 00:13:54,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 840/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.9015653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:54,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43620 samples/s/p 0:59:06 } +2024-07-26 00:13:57,883 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 842/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.8984814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:57,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43652 samples/s/p 0:59:03 } +2024-07-26 00:14:00,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 844/ 1625], loss: 1.302, per_step_time: 1473ms, lr: 2.8954005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:00,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43047 samples/s/p 0:59:04 } +2024-07-26 00:14:03,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 846/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 2.8923228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:03,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43594 samples/s/p 0:58:57 } +2024-07-26 00:14:06,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 848/ 1625], loss: 1.067, per_step_time: 1471ms, lr: 2.8892468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:06,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43767 samples/s/p 0:58:53 } +2024-07-26 00:14:09,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 850/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 2.8861737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:09,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43721 samples/s/p 0:58:51 } +2024-07-26 00:14:12,638 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 852/ 1625], loss: 1.092, per_step_time: 1473ms, lr: 2.8831018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:12,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.42975 samples/s/p 0:58:53 } +2024-07-26 00:14:15,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 854/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 2.8800328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:15,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43164 samples/s/p 0:58:48 } +2024-07-26 00:14:18,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 856/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 2.8769664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:18,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43215 samples/s/p 0:58:45 } +2024-07-26 00:14:21,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 858/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 2.8739028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:21,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43834 samples/s/p 0:58:38 } +2024-07-26 00:14:24,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 860/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 2.8708405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:24,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43821 samples/s/p 0:58:35 } +2024-07-26 00:14:27,394 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 862/ 1625], loss: 1.150, per_step_time: 1472ms, lr: 2.8677819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:27,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43297 samples/s/p 0:58:36 } +2024-07-26 00:14:30,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 864/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 2.864725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:30,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43519 samples/s/p 0:58:31 } +2024-07-26 00:14:33,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 866/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 2.861669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:33,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43560 samples/s/p 0:58:28 } +2024-07-26 00:14:36,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 868/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.8586173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:36,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43348 samples/s/p 0:58:27 } +2024-07-26 00:14:39,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 870/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 2.8555673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:39,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43637 samples/s/p 0:58:22 } +2024-07-26 00:14:42,148 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 872/ 1625], loss: 1.303, per_step_time: 1472ms, lr: 2.8525174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:42,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43477 samples/s/p 0:58:20 } +2024-07-26 00:14:45,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 874/ 1625], loss: 1.195, per_step_time: 1469ms, lr: 2.8494742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:45,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.44366 samples/s/p 0:58:11 } +2024-07-26 00:14:48,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 876/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 2.846431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:48,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43546 samples/s/p 0:58:14 } +2024-07-26 00:14:50,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 878/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.8433897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:50,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43587 samples/s/p 0:58:10 } +2024-07-26 00:14:53,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 880/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 2.840351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:53,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43205 samples/s/p 0:58:10 } +2024-07-26 00:14:56,898 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 882/ 1625], loss: 1.040, per_step_time: 1471ms, lr: 2.8373138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:56,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43712 samples/s/p 0:58:04 } +2024-07-26 00:14:59,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 884/ 1625], loss: 1.003, per_step_time: 1471ms, lr: 2.834281e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:59,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43785 samples/s/p 0:58:00 } +2024-07-26 00:15:02,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 886/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 2.8312493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:02,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43517 samples/s/p 0:57:59 } +2024-07-26 00:15:05,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 888/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 2.8282202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:05,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43953 samples/s/p 0:57:53 } +2024-07-26 00:15:08,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 890/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 2.8251925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:08,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43240 samples/s/p 0:57:55 } +2024-07-26 00:15:11,649 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 892/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.8221684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:11,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43639 samples/s/p 0:57:49 } +2024-07-26 00:15:14,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 894/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 2.8191462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:14,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43993 samples/s/p 0:57:44 } +2024-07-26 00:15:17,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 896/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 2.8161264e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:17,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43882 samples/s/p 0:57:42 } +2024-07-26 00:15:20,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 898/ 1625], loss: 1.000, per_step_time: 1470ms, lr: 2.8131085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:20,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.44151 samples/s/p 0:57:37 } +2024-07-26 00:15:23,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 900/ 1625], loss: 1.073, per_step_time: 1472ms, lr: 2.810094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:23,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43190 samples/s/p 0:57:41 } +2024-07-26 00:15:26,399 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 902/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.8070801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:26,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43121 samples/s/p 0:57:38 } +2024-07-26 00:15:29,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 904/ 1625], loss: 0.917, per_step_time: 1471ms, lr: 2.8040708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:29,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43637 samples/s/p 0:57:32 } +2024-07-26 00:15:32,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 906/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 2.801064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:32,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43572 samples/s/p 0:57:29 } +2024-07-26 00:15:35,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 908/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 2.7980554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:35,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43792 samples/s/p 0:57:25 } +2024-07-26 00:15:38,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 910/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 2.795052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:38,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43405 samples/s/p 0:57:24 } +2024-07-26 00:15:41,155 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 912/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 2.7920532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:41,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.42823 samples/s/p 0:57:25 } +2024-07-26 00:15:44,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 914/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.7890542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:44,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43243 samples/s/p 0:57:20 } +2024-07-26 00:15:47,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 916/ 1625], loss: 0.870, per_step_time: 1472ms, lr: 2.7860576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:47,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43212 samples/s/p 0:57:17 } +2024-07-26 00:15:50,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 918/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.7830638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:50,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43523 samples/s/p 0:57:12 } +2024-07-26 00:15:52,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 920/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.7800718e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:52,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43583 samples/s/p 0:57:09 } +2024-07-26 00:15:55,911 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 922/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 2.7770823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:55,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43618 samples/s/p 0:57:05 } +2024-07-26 00:15:58,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 924/ 1625], loss: 1.066, per_step_time: 1472ms, lr: 2.7740953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:58,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43316 samples/s/p 0:57:04 } +2024-07-26 00:16:01,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 926/ 1625], loss: 1.031, per_step_time: 1472ms, lr: 2.771111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:01,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43368 samples/s/p 0:57:01 } +2024-07-26 00:16:04,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 928/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.7681276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:04,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43248 samples/s/p 0:56:59 } +2024-07-26 00:16:07,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 930/ 1625], loss: 0.997, per_step_time: 1472ms, lr: 2.7651486e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:07,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43451 samples/s/p 0:56:55 } +2024-07-26 00:16:10,667 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 932/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.7621702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:10,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43823 samples/s/p 0:56:49 } +2024-07-26 00:16:13,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 934/ 1625], loss: 1.073, per_step_time: 1473ms, lr: 2.7591964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:13,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.42951 samples/s/p 0:56:52 } +2024-07-26 00:16:16,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 936/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.7562223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:16,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43239 samples/s/p 0:56:47 } +2024-07-26 00:16:19,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 938/ 1625], loss: 1.038, per_step_time: 1470ms, lr: 2.7532528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:19,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43872 samples/s/p 0:56:40 } +2024-07-26 00:16:22,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 940/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 2.750283e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:22,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43536 samples/s/p 0:56:39 } +2024-07-26 00:16:25,431 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 942/ 1625], loss: 1.108, per_step_time: 1475ms, lr: 2.747317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:25,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.42050 samples/s/p 0:56:46 } +2024-07-26 00:16:28,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 944/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.744356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:28,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43319 samples/s/p 0:56:35 } +2024-07-26 00:16:31,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 946/ 1625], loss: 0.959, per_step_time: 1470ms, lr: 2.7413932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:31,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43938 samples/s/p 0:56:28 } +2024-07-26 00:16:34,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 948/ 1625], loss: 0.966, per_step_time: 1471ms, lr: 2.738434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:34,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43716 samples/s/p 0:56:27 } +2024-07-26 00:16:37,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 950/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 2.735479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:37,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.44107 samples/s/p 0:56:21 } +2024-07-26 00:16:40,180 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 952/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 2.732524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:40,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43399 samples/s/p 0:56:23 } +2024-07-26 00:16:43,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 954/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.7295719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:43,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43264 samples/s/p 0:56:21 } +2024-07-26 00:16:46,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 956/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.7266237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:46,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43407 samples/s/p 0:56:17 } +2024-07-26 00:16:49,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 958/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 2.7236756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:49,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43126 samples/s/p 0:56:16 } +2024-07-26 00:16:51,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 960/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.720732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:51,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43134 samples/s/p 0:56:13 } +2024-07-26 00:16:54,939 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 962/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 2.7177894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:54,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43767 samples/s/p 0:56:06 } +2024-07-26 00:16:57,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 964/ 1625], loss: 1.026, per_step_time: 1471ms, lr: 2.714848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:57,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43599 samples/s/p 0:56:04 } +2024-07-26 00:17:00,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 966/ 1625], loss: 1.189, per_step_time: 1470ms, lr: 2.7119122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:00,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.44148 samples/s/p 0:55:57 } +2024-07-26 00:17:03,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 968/ 1625], loss: 0.983, per_step_time: 1472ms, lr: 2.7089773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:03,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.43376 samples/s/p 0:55:59 } +2024-07-26 00:17:06,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 970/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 2.7060437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:06,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.43531 samples/s/p 0:55:55 } +2024-07-26 00:17:09,693 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 972/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.703113e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:09,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.42956 samples/s/p 0:55:56 } +2024-07-26 00:17:12,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 974/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 2.700185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:12,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.43785 samples/s/p 0:55:48 } +2024-07-26 00:17:15,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 976/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.6972593e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:15,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.43323 samples/s/p 0:55:48 } +2024-07-26 00:17:18,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 978/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 2.6943355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:18,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.43211 samples/s/p 0:55:46 } +2024-07-26 00:17:21,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 980/ 1625], loss: 1.079, per_step_time: 1473ms, lr: 2.6914145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:21,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.43099 samples/s/p 0:55:43 } +2024-07-26 00:17:24,449 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 982/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 2.6884966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:24,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.43757 samples/s/p 0:55:36 } +2024-07-26 00:17:27,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 984/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 2.6855796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:27,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43571 samples/s/p 0:55:34 } +2024-07-26 00:17:30,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 986/ 1625], loss: 1.115, per_step_time: 1474ms, lr: 2.6826654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:30,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.42674 samples/s/p 0:55:37 } +2024-07-26 00:17:33,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 988/ 1625], loss: 1.194, per_step_time: 1474ms, lr: 2.679756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:33,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.42681 samples/s/p 0:55:34 } +2024-07-26 00:17:36,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 990/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 2.6768446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:36,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43349 samples/s/p 0:55:27 } +2024-07-26 00:17:39,212 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 992/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 2.673938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:39,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43611 samples/s/p 0:55:22 } +2024-07-26 00:17:42,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 994/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 2.671035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:42,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43652 samples/s/p 0:55:19 } +2024-07-26 00:17:45,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 996/ 1625], loss: 1.190, per_step_time: 1474ms, lr: 2.668131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:45,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.42717 samples/s/p 0:55:22 } +2024-07-26 00:17:48,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 998/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 2.6652315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:48,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43851 samples/s/p 0:55:12 } +2024-07-26 00:17:51,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1000/ 1625], loss: 1.319, per_step_time: 1469ms, lr: 2.662336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:51,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.44293 samples/s/p 0:55:07 } +2024-07-26 00:17:51,014 - 
mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-26 00:18:27,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1002/ 1625], loss: 1.150, per_step_time: 2156ms, lr: 2.659439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:27,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 3.70931 samples/s/p 1:20:48 } +2024-07-26 00:18:29,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1004/ 1625], loss: 1.076, per_step_time: 1474ms, lr: 2.656548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:29,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.42495 samples/s/p 0:55:12 } +2024-07-26 00:18:32,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1006/ 1625], loss: 1.134, per_step_time: 1469ms, lr: 2.653658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:32,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.44513 samples/s/p 0:54:56 } +2024-07-26 00:18:35,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1008/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.6507678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:35,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.43705 samples/s/p 0:54:58 } +2024-07-26 00:18:38,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1010/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.6478838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:38,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% 
|███████████████████████████████████████████ | 5.43280 samples/s/p 0:54:58 } +2024-07-26 00:18:41,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1012/ 1625], loss: 0.992, per_step_time: 1471ms, lr: 2.6450007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:41,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.43603 samples/s/p 0:54:53 } +2024-07-26 00:18:44,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1014/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.6421183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:44,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.43800 samples/s/p 0:54:49 } +2024-07-26 00:18:47,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1016/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.639241e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:47,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.43326 samples/s/p 0:54:49 } +2024-07-26 00:18:50,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1018/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 2.6363648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:50,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.44174 samples/s/p 0:54:41 } +2024-07-26 00:18:53,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1020/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 2.633492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:53,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% 
|███████████████████████████████████████████ | 5.43574 samples/s/p 0:54:41 } +2024-07-26 00:18:56,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1022/ 1625], loss: 1.070, per_step_time: 1470ms, lr: 2.6306209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:56,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.44026 samples/s/p 0:54:36 } +2024-07-26 00:18:59,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1024/ 1625], loss: 1.351, per_step_time: 1472ms, lr: 2.6277507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:59,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.43283 samples/s/p 0:54:37 } +2024-07-26 00:19:02,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1026/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 2.6248856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:02,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.43668 samples/s/p 0:54:32 } +2024-07-26 00:19:05,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1028/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.6220205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:05,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.43418 samples/s/p 0:54:31 } +2024-07-26 00:19:08,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1030/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.619159e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:08,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% 
|███████████████████████████████████████████ | 5.43403 samples/s/p 0:54:28 } +2024-07-26 00:19:11,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1032/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 2.616301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:11,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43171 samples/s/p 0:54:26 } +2024-07-26 00:19:14,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1034/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 2.613442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:14,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43158 samples/s/p 0:54:23 } +2024-07-26 00:19:17,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1036/ 1625], loss: 1.320, per_step_time: 1472ms, lr: 2.6105872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:17,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43345 samples/s/p 0:54:19 } +2024-07-26 00:19:20,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1038/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 2.6077369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:20,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43241 samples/s/p 0:54:17 } +2024-07-26 00:19:23,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1040/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.6048856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:23,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% 
|███████████████████████████████████████████ | 5.43311 samples/s/p 0:54:14 } +2024-07-26 00:19:26,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1042/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 2.6020389e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:26,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43181 samples/s/p 0:54:11 } +2024-07-26 00:19:29,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1044/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.5991944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:29,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43700 samples/s/p 0:54:05 } +2024-07-26 00:19:31,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1046/ 1625], loss: 1.062, per_step_time: 1470ms, lr: 2.5963493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:31,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.44103 samples/s/p 0:54:00 } +2024-07-26 00:19:34,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1048/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 2.593511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:34,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43119 samples/s/p 0:54:03 } +2024-07-26 00:19:37,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1050/ 1625], loss: 1.452, per_step_time: 1471ms, lr: 2.590673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:37,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% 
|███████████████████████████████████████████ | 5.43737 samples/s/p 0:53:56 } +2024-07-26 00:19:40,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1052/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 2.5878362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:40,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.42955 samples/s/p 0:53:58 } +2024-07-26 00:19:43,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1054/ 1625], loss: 1.117, per_step_time: 1473ms, lr: 2.585004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:43,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.43024 samples/s/p 0:53:55 } +2024-07-26 00:19:46,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1056/ 1625], loss: 1.037, per_step_time: 1471ms, lr: 2.5821737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:46,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.43523 samples/s/p 0:53:49 } +2024-07-26 00:19:49,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1058/ 1625], loss: 1.155, per_step_time: 1478ms, lr: 2.5793431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:49,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.41139 samples/s/p 0:54:00 } +2024-07-26 00:19:52,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1060/ 1625], loss: 1.268, per_step_time: 1472ms, lr: 2.5765178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:52,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% 
|███████████████████████████████████████████ | 5.43240 samples/s/p 0:53:45 } +2024-07-26 00:19:55,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1062/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 2.573695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:55,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.44089 samples/s/p 0:53:37 } +2024-07-26 00:19:58,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1064/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.5708741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:58,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.43440 samples/s/p 0:53:38 } +2024-07-26 00:20:01,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1066/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 2.568054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:01,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.43286 samples/s/p 0:53:35 } +2024-07-26 00:20:04,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1068/ 1625], loss: 1.254, per_step_time: 1474ms, lr: 2.5652375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:04,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.42688 samples/s/p 0:53:36 } +2024-07-26 00:20:07,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1070/ 1625], loss: 1.088, per_step_time: 1472ms, lr: 2.5624233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:07,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% 
|███████████████████████████████████████████ | 5.43374 samples/s/p 0:53:29 } +2024-07-26 00:20:10,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1072/ 1625], loss: 1.112, per_step_time: 1477ms, lr: 2.5596119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:10,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.41437 samples/s/p 0:53:38 } +2024-07-26 00:20:13,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1074/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 2.556802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:13,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.43720 samples/s/p 0:53:21 } +2024-07-26 00:20:16,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1076/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 2.5539966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:16,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.43262 samples/s/p 0:53:21 } +2024-07-26 00:20:19,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1078/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 2.5511913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:19,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.43898 samples/s/p 0:53:14 } +2024-07-26 00:20:22,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1080/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.5483885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:22,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% 
|███████████████████████████████████████████ | 5.43260 samples/s/p 0:53:15 } +2024-07-26 00:20:25,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1082/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 2.54559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:25,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.42926 samples/s/p 0:53:14 } +2024-07-26 00:20:28,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1084/ 1625], loss: 1.008, per_step_time: 1469ms, lr: 2.5427914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:28,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.44244 samples/s/p 0:53:03 } +2024-07-26 00:20:31,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1086/ 1625], loss: 1.048, per_step_time: 1473ms, lr: 2.5399972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:31,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.43005 samples/s/p 0:53:08 } +2024-07-26 00:20:33,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1088/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.5372049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:33,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.43247 samples/s/p 0:53:03 } +2024-07-26 00:20:36,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1090/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 2.5344134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:36,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% 
|███████████████████████████████████████████ | 5.43952 samples/s/p 0:52:56 } +2024-07-26 00:20:39,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1092/ 1625], loss: 1.072, per_step_time: 1474ms, lr: 2.5316276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:39,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.42707 samples/s/p 0:53:01 } +2024-07-26 00:20:42,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1094/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 2.5288423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:42,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.43344 samples/s/p 0:52:54 } +2024-07-26 00:20:45,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1096/ 1625], loss: 1.088, per_step_time: 1476ms, lr: 2.5260574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:45,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.41836 samples/s/p 0:53:00 } +2024-07-26 00:20:48,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1098/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 2.523278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:48,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.43186 samples/s/p 0:52:49 } +2024-07-26 00:20:51,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1100/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 2.5204995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:51,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% 
|███████████████████████████████████████████ | 5.42899 samples/s/p 0:52:48 } +2024-07-26 00:20:54,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1102/ 1625], loss: 1.340, per_step_time: 1473ms, lr: 2.5177233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:54,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.42887 samples/s/p 0:52:45 } +2024-07-26 00:20:57,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1104/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.514951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:57,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.43407 samples/s/p 0:52:39 } +2024-07-26 00:21:00,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1106/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.512179e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:00,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.43606 samples/s/p 0:52:35 } +2024-07-26 00:21:03,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1108/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 2.50941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:03,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.42997 samples/s/p 0:52:35 } +2024-07-26 00:21:06,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1110/ 1625], loss: 1.096, per_step_time: 1473ms, lr: 2.5066433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:06,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% 
|███████████████████████████████████████████ | 5.43101 samples/s/p 0:52:32 } +2024-07-26 00:21:09,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1112/ 1625], loss: 1.253, per_step_time: 1469ms, lr: 2.5038803e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:09,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.44395 samples/s/p 0:52:21 } +2024-07-26 00:21:12,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1114/ 1625], loss: 1.314, per_step_time: 1472ms, lr: 2.501119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:12,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43469 samples/s/p 0:52:24 } +2024-07-26 00:21:15,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1116/ 1625], loss: 1.298, per_step_time: 1471ms, lr: 2.4983597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:15,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43531 samples/s/p 0:52:20 } +2024-07-26 00:21:18,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1118/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.4956034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:18,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43685 samples/s/p 0:52:17 } +2024-07-26 00:21:21,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1120/ 1625], loss: 1.251, per_step_time: 1474ms, lr: 2.49285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:21,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% 
|███████████████████████████████████████████ | 5.42619 samples/s/p 0:52:20 } +2024-07-26 00:21:24,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1122/ 1625], loss: 1.030, per_step_time: 1472ms, lr: 2.4900962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:24,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43244 samples/s/p 0:52:13 } +2024-07-26 00:21:27,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1124/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 2.487347e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:27,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43144 samples/s/p 0:52:11 } +2024-07-26 00:21:30,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1126/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.4846013e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:30,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43113 samples/s/p 0:52:08 } +2024-07-26 00:21:33,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1128/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 2.4818555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:33,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43838 samples/s/p 0:52:01 } +2024-07-26 00:21:35,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1130/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 2.4791148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:35,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% 
|███████████████████████████████████████████ | 5.42795 samples/s/p 0:52:04 } +2024-07-26 00:21:38,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1132/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 2.4763742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:38,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43635 samples/s/p 0:51:56 } +2024-07-26 00:21:41,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1134/ 1625], loss: 1.130, per_step_time: 1473ms, lr: 2.4736355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:41,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43046 samples/s/p 0:51:57 } +2024-07-26 00:21:44,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1136/ 1625], loss: 1.156, per_step_time: 1473ms, lr: 2.4709016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:44,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43079 samples/s/p 0:51:54 } +2024-07-26 00:21:47,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1138/ 1625], loss: 1.050, per_step_time: 1472ms, lr: 2.468169e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:47,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43301 samples/s/p 0:51:49 } +2024-07-26 00:21:50,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1140/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 2.4654378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:50,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% 
|███████████████████████████████████████████ | 5.43163 samples/s/p 0:51:47 } +2024-07-26 00:21:53,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1142/ 1625], loss: 1.329, per_step_time: 1473ms, lr: 2.462711e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:53,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43072 samples/s/p 0:51:45 } +2024-07-26 00:21:56,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1144/ 1625], loss: 0.891, per_step_time: 1471ms, lr: 2.4599851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:56,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43804 samples/s/p 0:51:38 } +2024-07-26 00:21:59,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1146/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 2.4572619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:59,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.43371 samples/s/p 0:51:37 } +2024-07-26 00:22:02,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1148/ 1625], loss: 1.045, per_step_time: 1473ms, lr: 2.454542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:02,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.42994 samples/s/p 0:51:36 } +2024-07-26 00:22:05,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1150/ 1625], loss: 1.039, per_step_time: 1470ms, lr: 2.451823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:05,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% 
|███████████████████████████████████████████ | 5.43904 samples/s/p 0:51:28 } +2024-07-26 00:22:08,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1152/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.4491073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:08,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.43672 samples/s/p 0:51:27 } +2024-07-26 00:22:11,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1154/ 1625], loss: 1.103, per_step_time: 1474ms, lr: 2.4463939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:11,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.42546 samples/s/p 0:51:30 } +2024-07-26 00:22:14,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1156/ 1625], loss: 0.980, per_step_time: 1470ms, lr: 2.4436843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:14,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.43942 samples/s/p 0:51:19 } +2024-07-26 00:22:17,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1158/ 1625], loss: 1.250, per_step_time: 1471ms, lr: 2.4409746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:17,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.43582 samples/s/p 0:51:18 } +2024-07-26 00:22:20,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1160/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 2.438269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:20,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% 
|███████████████████████████████████████████ | 5.43466 samples/s/p 0:51:16 } +2024-07-26 00:22:23,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1162/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 2.4355654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:23,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43476 samples/s/p 0:51:13 } +2024-07-26 00:22:26,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1164/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 2.4328629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:26,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43405 samples/s/p 0:51:11 } +2024-07-26 00:22:29,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1166/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 2.4301635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:29,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43492 samples/s/p 0:51:07 } +2024-07-26 00:22:32,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1168/ 1625], loss: 1.249, per_step_time: 1474ms, lr: 2.427468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:32,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.42430 samples/s/p 0:51:10 } +2024-07-26 00:22:34,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1170/ 1625], loss: 1.032, per_step_time: 1470ms, lr: 2.424775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:34,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% 
|███████████████████████████████████████████ | 5.43910 samples/s/p 0:50:59 } +2024-07-26 00:22:37,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1172/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.4220817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:37,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43321 samples/s/p 0:50:59 } +2024-07-26 00:22:40,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1174/ 1625], loss: 1.028, per_step_time: 1470ms, lr: 2.4193941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:40,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43938 samples/s/p 0:50:53 } +2024-07-26 00:22:43,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1176/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 2.416707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:43,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.44040 samples/s/p 0:50:49 } +2024-07-26 00:22:46,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1178/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 2.4140209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:46,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43393 samples/s/p 0:50:50 } +2024-07-26 00:22:49,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1180/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 2.41134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:49,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% 
|███████████████████████████████████████████ | 5.43735 samples/s/p 0:50:45 } +2024-07-26 00:22:52,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1182/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 2.4086607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:52,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.44182 samples/s/p 0:50:40 } +2024-07-26 00:22:55,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1184/ 1625], loss: 1.029, per_step_time: 1472ms, lr: 2.4059823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:55,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.43425 samples/s/p 0:50:41 } +2024-07-26 00:22:58,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1186/ 1625], loss: 1.133, per_step_time: 1474ms, lr: 2.4033093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:58,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.42389 samples/s/p 0:50:44 } +2024-07-26 00:23:01,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1188/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 2.4006358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:01,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.43465 samples/s/p 0:50:35 } +2024-07-26 00:23:04,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1190/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 2.3979662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:04,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% 
|███████████████████████████████████████████ | 5.43075 samples/s/p 0:50:34 } +2024-07-26 00:23:07,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1192/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 2.3952991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:07,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.43620 samples/s/p 0:50:28 } +2024-07-26 00:23:10,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1194/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 2.3926336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:10,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.43592 samples/s/p 0:50:25 } +2024-07-26 00:23:13,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1196/ 1625], loss: 1.041, per_step_time: 1472ms, lr: 2.3899709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:13,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43380 samples/s/p 0:50:24 } +2024-07-26 00:23:16,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1198/ 1625], loss: 0.980, per_step_time: 1472ms, lr: 2.38731e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:16,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43429 samples/s/p 0:50:20 } +2024-07-26 00:23:19,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1200/ 1625], loss: 1.066, per_step_time: 1484ms, lr: 2.3846521e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:19,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% 
|███████████████████████████████████████████ | 5.38913 samples/s/p 0:50:43 } +2024-07-26 00:23:22,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1202/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 2.3819962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:22,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43278 samples/s/p 0:50:15 } +2024-07-26 00:23:25,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1204/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 2.3793439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:25,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43992 samples/s/p 0:50:08 } +2024-07-26 00:23:28,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1206/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 2.3766931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:28,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43616 samples/s/p 0:50:08 } +2024-07-26 00:23:31,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1208/ 1625], loss: 1.045, per_step_time: 1471ms, lr: 2.374045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:31,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43646 samples/s/p 0:50:04 } +2024-07-26 00:23:34,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1210/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.3713997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:34,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% 
|███████████████████████████████████████████ | 5.43131 samples/s/p 0:50:04 } +2024-07-26 00:23:36,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1212/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 2.3687567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:36,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43794 samples/s/p 0:49:58 } +2024-07-26 00:23:39,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1214/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 2.3661146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:39,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43338 samples/s/p 0:49:57 } +2024-07-26 00:23:42,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1216/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 2.363476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:42,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43363 samples/s/p 0:49:54 } +2024-07-26 00:23:45,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1218/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.3608425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:45,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43239 samples/s/p 0:49:52 } +2024-07-26 00:23:48,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1220/ 1625], loss: 1.270, per_step_time: 1473ms, lr: 2.3582083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:48,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% 
|███████████████████████████████████████████ | 5.43007 samples/s/p 0:49:50 } +2024-07-26 00:23:51,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1222/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 2.3555756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:51,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43845 samples/s/p 0:49:43 } +2024-07-26 00:23:54,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1224/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 2.3529483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:54,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43337 samples/s/p 0:49:43 } +2024-07-26 00:23:57,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1226/ 1625], loss: 1.151, per_step_time: 1474ms, lr: 2.3503226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:57,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.42654 samples/s/p 0:49:43 } +2024-07-26 00:24:00,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1228/ 1625], loss: 1.219, per_step_time: 1473ms, lr: 2.3476969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:00,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.42936 samples/s/p 0:49:39 } +2024-07-26 00:24:03,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1230/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 2.3450757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:03,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% 
|███████████████████████████████████████████ | 5.43098 samples/s/p 0:49:35 } +2024-07-26 00:24:06,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1232/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 2.3424568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:06,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.43544 samples/s/p 0:49:30 } +2024-07-26 00:24:09,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1234/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 2.3398406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:09,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.44056 samples/s/p 0:49:24 } +2024-07-26 00:24:12,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1236/ 1625], loss: 0.972, per_step_time: 1470ms, lr: 2.3372272e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:12,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.44088 samples/s/p 0:49:21 } +2024-07-26 00:24:15,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1238/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.3346147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:15,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.43793 samples/s/p 0:49:19 } +2024-07-26 00:24:18,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1240/ 1625], loss: 1.348, per_step_time: 1472ms, lr: 2.3320054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:18,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% 
|███████████████████████████████████████████ | 5.43371 samples/s/p 0:49:19 } +2024-07-26 00:24:21,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1242/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 2.3293978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:21,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.43072 samples/s/p 0:49:17 } +2024-07-26 00:24:24,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1244/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.326794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:24,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43235 samples/s/p 0:49:14 } +2024-07-26 00:24:27,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1246/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 2.3241914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:27,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43728 samples/s/p 0:49:08 } +2024-07-26 00:24:30,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1248/ 1625], loss: 1.277, per_step_time: 1474ms, lr: 2.3215916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:30,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.42583 samples/s/p 0:49:11 } +2024-07-26 00:24:33,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1250/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.3189946e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:33,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% 
|███████████████████████████████████████████ | 5.43123 samples/s/p 0:49:05 } +2024-07-26 00:24:36,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1252/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 2.3164002e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:36,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43215 samples/s/p 0:49:02 } +2024-07-26 00:24:38,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1254/ 1625], loss: 1.057, per_step_time: 1472ms, lr: 2.3138073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:38,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43457 samples/s/p 0:48:58 } +2024-07-26 00:24:41,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1256/ 1625], loss: 1.316, per_step_time: 1474ms, lr: 2.3112189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:41,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.42675 samples/s/p 0:48:59 } +2024-07-26 00:24:44,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1258/ 1625], loss: 0.945, per_step_time: 1472ms, lr: 2.3086304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:44,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43209 samples/s/p 0:48:53 } +2024-07-26 00:24:47,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1260/ 1625], loss: 1.120, per_step_time: 1470ms, lr: 2.3060452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:47,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% 
|███████████████████████████████████████████ | 5.44072 samples/s/p 0:48:46 } +2024-07-26 00:24:50,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1262/ 1625], loss: 1.269, per_step_time: 1474ms, lr: 2.3034638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:50,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.42708 samples/s/p 0:48:50 } +2024-07-26 00:24:53,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1264/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 2.3008822e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:53,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.43322 samples/s/p 0:48:44 } +2024-07-26 00:24:56,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1266/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.298304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:56,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.43713 samples/s/p 0:48:39 } +2024-07-26 00:24:59,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1268/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.295731e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:59,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.43452 samples/s/p 0:48:37 } +2024-07-26 00:25:02,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1270/ 1625], loss: 0.994, per_step_time: 1470ms, lr: 2.2931574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:02,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% 
|███████████████████████████████████████████ | 5.43947 samples/s/p 0:48:32 } +2024-07-26 00:25:05,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1272/ 1625], loss: 1.139, per_step_time: 1469ms, lr: 2.290587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:05,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.44426 samples/s/p 0:48:26 } +2024-07-26 00:25:08,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1274/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 2.2880185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:08,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.43919 samples/s/p 0:48:26 } +2024-07-26 00:25:11,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1276/ 1625], loss: 1.382, per_step_time: 1473ms, lr: 2.2854533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:11,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.42995 samples/s/p 0:48:28 } +2024-07-26 00:25:14,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1278/ 1625], loss: 1.060, per_step_time: 1472ms, lr: 2.2828908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:14,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.43463 samples/s/p 0:48:22 } +2024-07-26 00:25:17,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1280/ 1625], loss: 1.104, per_step_time: 1470ms, lr: 2.28033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:17,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% 
|███████████████████████████████████████████ | 5.44177 samples/s/p 0:48:16 } +2024-07-26 00:25:20,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1282/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 2.2777717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:20,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.44031 samples/s/p 0:48:13 } +2024-07-26 00:25:23,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1284/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.275216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:23,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.43718 samples/s/p 0:48:12 } +2024-07-26 00:25:26,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1286/ 1625], loss: 1.319, per_step_time: 1473ms, lr: 2.2726622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:26,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.42760 samples/s/p 0:48:14 } +2024-07-26 00:25:29,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1288/ 1625], loss: 1.039, per_step_time: 1471ms, lr: 2.2701108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:29,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.43628 samples/s/p 0:48:07 } +2024-07-26 00:25:32,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1290/ 1625], loss: 1.171, per_step_time: 1470ms, lr: 2.267563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:32,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% 
|███████████████████████████████████████████ | 5.43863 samples/s/p 0:48:03 } +2024-07-26 00:25:35,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1292/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 2.265017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:35,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.43687 samples/s/p 0:48:01 } +2024-07-26 00:25:37,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1294/ 1625], loss: 1.176, per_step_time: 1472ms, lr: 2.2624724e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:37,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.43457 samples/s/p 0:47:59 } +2024-07-26 00:25:40,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1296/ 1625], loss: 1.243, per_step_time: 1474ms, lr: 2.2599315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:40,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.42527 samples/s/p 0:48:01 } +2024-07-26 00:25:43,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1298/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 2.2573931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:43,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.43709 samples/s/p 0:47:52 } +2024-07-26 00:25:46,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1300/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.254859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:46,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% 
|████████████████████████████████████████████ | 5.43473 samples/s/p 0:47:50 } +2024-07-26 00:25:49,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1302/ 1625], loss: 1.332, per_step_time: 1473ms, lr: 2.2523225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:49,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.42862 samples/s/p 0:47:50 } +2024-07-26 00:25:52,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1304/ 1625], loss: 0.976, per_step_time: 1471ms, lr: 2.2497911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:52,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.43534 samples/s/p 0:47:44 } +2024-07-26 00:25:55,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1306/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.2472648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:55,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.43285 samples/s/p 0:47:42 } +2024-07-26 00:25:58,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1308/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 2.244736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:58,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.43911 samples/s/p 0:47:36 } +2024-07-26 00:26:01,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1310/ 1625], loss: 1.267, per_step_time: 1475ms, lr: 2.2422114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:01,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% 
|████████████████████████████████████████████ | 5.42215 samples/s/p 0:47:42 } +2024-07-26 00:26:04,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1312/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 2.239692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:04,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.43035 samples/s/p 0:47:35 } +2024-07-26 00:26:07,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1314/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.237171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:07,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.43514 samples/s/p 0:47:29 } +2024-07-26 00:26:10,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1316/ 1625], loss: 1.257, per_step_time: 1474ms, lr: 2.234656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:10,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.42400 samples/s/p 0:47:32 } +2024-07-26 00:26:13,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1318/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.2321428e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:13,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.43197 samples/s/p 0:47:25 } +2024-07-26 00:26:16,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1320/ 1625], loss: 1.291, per_step_time: 1472ms, lr: 2.2296304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:16,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% 
|████████████████████████████████████████████ | 5.43238 samples/s/p 0:47:22 } +2024-07-26 00:26:19,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1322/ 1625], loss: 1.075, per_step_time: 1475ms, lr: 2.2271213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:19,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.42355 samples/s/p 0:47:23 } +2024-07-26 00:26:22,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1324/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.224614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:22,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.43128 samples/s/p 0:47:16 } +2024-07-26 00:26:25,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1326/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.2221093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:25,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43136 samples/s/p 0:47:13 } +2024-07-26 00:26:28,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1328/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 2.2196073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:28,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43183 samples/s/p 0:47:10 } +2024-07-26 00:26:31,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1330/ 1625], loss: 1.076, per_step_time: 1474ms, lr: 2.217108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:31,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% 
|████████████████████████████████████████████ | 5.42579 samples/s/p 0:47:10 } +2024-07-26 00:26:34,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1332/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 2.21461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:34,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43498 samples/s/p 0:47:03 } +2024-07-26 00:26:37,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1334/ 1625], loss: 1.391, per_step_time: 1471ms, lr: 2.2121158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:37,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43704 samples/s/p 0:46:59 } +2024-07-26 00:26:39,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1336/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.2096242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:39,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43490 samples/s/p 0:46:57 } +2024-07-26 00:26:42,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1338/ 1625], loss: 1.244, per_step_time: 1471ms, lr: 2.2071342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:42,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43480 samples/s/p 0:46:54 } +2024-07-26 00:26:45,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1340/ 1625], loss: 1.295, per_step_time: 1472ms, lr: 2.204648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:45,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% 
|████████████████████████████████████████████ | 5.43346 samples/s/p 0:46:52 } +2024-07-26 00:26:48,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1342/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 2.2021622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:48,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43872 samples/s/p 0:46:46 } +2024-07-26 00:26:51,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1344/ 1625], loss: 1.084, per_step_time: 1473ms, lr: 2.1996816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:51,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43021 samples/s/p 0:46:47 } +2024-07-26 00:26:54,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1346/ 1625], loss: 1.029, per_step_time: 1472ms, lr: 2.1971996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:54,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43354 samples/s/p 0:46:43 } +2024-07-26 00:26:57,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1348/ 1625], loss: 1.028, per_step_time: 1472ms, lr: 2.1947226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:57,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43352 samples/s/p 0:46:40 } +2024-07-26 00:27:00,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1350/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 2.192249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:00,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% 
|████████████████████████████████████████████ | 5.43379 samples/s/p 0:46:37 } +2024-07-26 00:27:03,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1352/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 2.1897754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:03,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43475 samples/s/p 0:46:33 } +2024-07-26 00:27:06,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1354/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.1873045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:06,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43629 samples/s/p 0:46:30 } +2024-07-26 00:27:09,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1356/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.1848386e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:09,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43484 samples/s/p 0:46:27 } +2024-07-26 00:27:12,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1358/ 1625], loss: 1.043, per_step_time: 1470ms, lr: 2.182372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:12,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43867 samples/s/p 0:46:23 } +2024-07-26 00:27:15,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1360/ 1625], loss: 1.318, per_step_time: 1469ms, lr: 2.1799106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:15,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% 
|████████████████████████████████████████████ | 5.44393 samples/s/p 0:46:17 } +2024-07-26 00:27:18,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1362/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 2.1774501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:18,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43358 samples/s/p 0:46:19 } +2024-07-26 00:27:21,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1364/ 1625], loss: 1.409, per_step_time: 1472ms, lr: 2.1749913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:21,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43331 samples/s/p 0:46:16 } +2024-07-26 00:27:24,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1366/ 1625], loss: 1.025, per_step_time: 1472ms, lr: 2.1725377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:24,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43370 samples/s/p 0:46:13 } +2024-07-26 00:27:27,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1368/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.1700848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:27,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43129 samples/s/p 0:46:12 } +2024-07-26 00:27:30,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1370/ 1625], loss: 1.246, per_step_time: 1473ms, lr: 2.1676337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:30,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% 
|████████████████████████████████████████████ | 5.42937 samples/s/p 0:46:10 } +2024-07-26 00:27:33,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1372/ 1625], loss: 1.053, per_step_time: 1470ms, lr: 2.1651854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:33,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43874 samples/s/p 0:46:02 } +2024-07-26 00:27:36,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1374/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.1627402e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:36,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43692 samples/s/p 0:46:00 } +2024-07-26 00:27:39,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1376/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 2.160297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:39,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43592 samples/s/p 0:45:57 } +2024-07-26 00:27:41,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1378/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 2.1578562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:41,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43398 samples/s/p 0:45:55 } +2024-07-26 00:27:44,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1380/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 2.1554192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:44,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% 
|████████████████████████████████████████████ | 5.43183 samples/s/p 0:45:54 } +2024-07-26 00:27:47,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1382/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.1529827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:47,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43530 samples/s/p 0:45:49 } +2024-07-26 00:27:50,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1384/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.1505498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:50,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43376 samples/s/p 0:45:47 } +2024-07-26 00:27:53,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1386/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 2.1481196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:53,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.42922 samples/s/p 0:45:46 } +2024-07-26 00:27:56,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1388/ 1625], loss: 1.000, per_step_time: 1471ms, lr: 2.1456926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:56,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43516 samples/s/p 0:45:40 } +2024-07-26 00:27:59,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1390/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 2.1432647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:59,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% 
|████████████████████████████████████████████ | 5.44095 samples/s/p 0:45:34 } +2024-07-26 00:28:02,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1392/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.1408423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:02,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.43273 samples/s/p 0:45:36 } +2024-07-26 00:28:05,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1394/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.1384217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:05,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.43601 samples/s/p 0:45:31 } +2024-07-26 00:28:08,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1396/ 1625], loss: 1.053, per_step_time: 1473ms, lr: 2.1360033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:08,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.43000 samples/s/p 0:45:31 } +2024-07-26 00:28:11,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1398/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 2.1335868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:11,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.43777 samples/s/p 0:45:24 } +2024-07-26 00:28:14,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1400/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.1311748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:14,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% 
|████████████████████████████████████████████ | 5.43617 samples/s/p 0:45:22 } +2024-07-26 00:28:17,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1402/ 1625], loss: 0.976, per_step_time: 1471ms, lr: 2.1287624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:17,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.43686 samples/s/p 0:45:19 } +2024-07-26 00:28:20,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1404/ 1625], loss: 1.053, per_step_time: 1473ms, lr: 2.1263554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:20,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.42858 samples/s/p 0:45:20 } +2024-07-26 00:28:23,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1406/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 2.1239493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:23,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43599 samples/s/p 0:45:13 } +2024-07-26 00:28:26,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1408/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 2.1215442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:26,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43498 samples/s/p 0:45:11 } +2024-07-26 00:28:29,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1410/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 2.119145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:29,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% 
|████████████████████████████████████████████ | 5.43794 samples/s/p 0:45:06 } +2024-07-26 00:28:32,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1412/ 1625], loss: 0.981, per_step_time: 1471ms, lr: 2.1167457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:32,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43505 samples/s/p 0:45:05 } +2024-07-26 00:28:35,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1414/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 2.1143492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:35,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43428 samples/s/p 0:45:02 } +2024-07-26 00:28:38,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1416/ 1625], loss: 1.008, per_step_time: 1471ms, lr: 2.111955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:38,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43621 samples/s/p 0:44:58 } +2024-07-26 00:28:40,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1418/ 1625], loss: 0.921, per_step_time: 1471ms, lr: 2.1095645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:40,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43752 samples/s/p 0:44:55 } +2024-07-26 00:28:43,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1420/ 1625], loss: 1.351, per_step_time: 1470ms, lr: 2.1071755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:43,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% 
|████████████████████████████████████████████ | 5.43941 samples/s/p 0:44:51 } +2024-07-26 00:28:46,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1422/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.1047895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:46,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43562 samples/s/p 0:44:50 } +2024-07-26 00:28:49,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1424/ 1625], loss: 0.926, per_step_time: 1470ms, lr: 2.1024048e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:49,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43849 samples/s/p 0:44:46 } +2024-07-26 00:28:52,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1426/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 2.1000246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:52,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43629 samples/s/p 0:44:44 } +2024-07-26 00:28:55,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1428/ 1625], loss: 1.217, per_step_time: 1473ms, lr: 2.0976454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:55,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.42900 samples/s/p 0:44:44 } +2024-07-26 00:28:58,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1430/ 1625], loss: 1.302, per_step_time: 1470ms, lr: 2.0952687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:58,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% 
|████████████████████████████████████████████ | 5.43975 samples/s/p 0:44:36 } +2024-07-26 00:29:01,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1432/ 1625], loss: 0.986, per_step_time: 1472ms, lr: 2.0928962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:01,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43237 samples/s/p 0:44:37 } +2024-07-26 00:29:04,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1434/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.0905238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:04,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43556 samples/s/p 0:44:32 } +2024-07-26 00:29:07,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1436/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 2.088154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:07,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43403 samples/s/p 0:44:30 } +2024-07-26 00:29:10,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1438/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.0857894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:10,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43515 samples/s/p 0:44:27 } +2024-07-26 00:29:13,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1440/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 2.0834239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:13,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% 
|████████████████████████████████████████████ | 5.43535 samples/s/p 0:44:24 } +2024-07-26 00:29:16,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1442/ 1625], loss: 0.973, per_step_time: 1471ms, lr: 2.0810635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:16,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43675 samples/s/p 0:44:20 } +2024-07-26 00:29:19,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1444/ 1625], loss: 1.023, per_step_time: 1472ms, lr: 2.0787043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:19,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43366 samples/s/p 0:44:18 } +2024-07-26 00:29:22,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1446/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 2.0763464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:22,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43496 samples/s/p 0:44:15 } +2024-07-26 00:29:25,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1448/ 1625], loss: 0.923, per_step_time: 1473ms, lr: 2.073995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:25,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43063 samples/s/p 0:44:14 } +2024-07-26 00:29:28,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1450/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.0716423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:28,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% 
|████████████████████████████████████████████ | 5.43216 samples/s/p 0:44:10 } +2024-07-26 00:29:31,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1452/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 2.0692923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:31,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43570 samples/s/p 0:44:06 } +2024-07-26 00:29:34,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1454/ 1625], loss: 1.408, per_step_time: 1472ms, lr: 2.0669459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:34,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43280 samples/s/p 0:44:04 } +2024-07-26 00:29:37,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1456/ 1625], loss: 1.039, per_step_time: 1472ms, lr: 2.0646019e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:37,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43172 samples/s/p 0:44:02 } +2024-07-26 00:29:40,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1458/ 1625], loss: 1.205, per_step_time: 1473ms, lr: 2.0622606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:40,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43023 samples/s/p 0:44:00 } +2024-07-26 00:29:42,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1460/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.059921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:42,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% 
|████████████████████████████████████████████ | 5.43589 samples/s/p 0:43:54 } +2024-07-26 00:29:45,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1462/ 1625], loss: 1.218, per_step_time: 1470ms, lr: 2.0575849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:45,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43866 samples/s/p 0:43:50 } +2024-07-26 00:29:48,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1464/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 2.0552507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:48,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43429 samples/s/p 0:43:49 } +2024-07-26 00:29:51,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1466/ 1625], loss: 1.090, per_step_time: 1473ms, lr: 2.0529178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:51,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.42838 samples/s/p 0:43:49 } +2024-07-26 00:29:54,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1468/ 1625], loss: 1.038, per_step_time: 1473ms, lr: 2.0505895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:54,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43060 samples/s/p 0:43:45 } +2024-07-26 00:29:57,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1470/ 1625], loss: 1.185, per_step_time: 1473ms, lr: 2.048264e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:57,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% 
|████████████████████████████████████████████ | 5.43039 samples/s/p 0:43:42 } +2024-07-26 00:30:00,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1472/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 2.045938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:00,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.42986 samples/s/p 0:43:39 } +2024-07-26 00:30:03,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1474/ 1625], loss: 1.049, per_step_time: 1473ms, lr: 2.0436166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:03,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.42952 samples/s/p 0:43:36 } +2024-07-26 00:30:06,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1476/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 2.0412986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:06,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.43055 samples/s/p 0:43:33 } +2024-07-26 00:30:09,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1478/ 1625], loss: 1.079, per_step_time: 1470ms, lr: 2.0389798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:09,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.44130 samples/s/p 0:43:25 } +2024-07-26 00:30:12,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1480/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 2.0366654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:12,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% 
|████████████████████████████████████████████ | 5.43762 samples/s/p 0:43:24 } +2024-07-26 00:30:15,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1482/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 2.034355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:15,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.44104 samples/s/p 0:43:19 } +2024-07-26 00:30:18,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1484/ 1625], loss: 1.056, per_step_time: 1470ms, lr: 2.032044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:18,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.43897 samples/s/p 0:43:17 } +2024-07-26 00:30:21,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1486/ 1625], loss: 1.227, per_step_time: 1470ms, lr: 2.0297382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:21,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.44073 samples/s/p 0:43:13 } +2024-07-26 00:30:24,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1488/ 1625], loss: 1.273, per_step_time: 1471ms, lr: 2.0274342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:24,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43604 samples/s/p 0:43:13 } +2024-07-26 00:30:27,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1490/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 2.025131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:27,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% 
|████████████████████████████████████████████ | 5.43953 samples/s/p 0:43:08 } +2024-07-26 00:30:30,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1492/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.0228326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:30,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43578 samples/s/p 0:43:07 } +2024-07-26 00:30:33,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1494/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 2.0205355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:33,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43687 samples/s/p 0:43:03 } +2024-07-26 00:30:36,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1496/ 1625], loss: 1.193, per_step_time: 1470ms, lr: 2.0182401e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:36,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.44162 samples/s/p 0:42:58 } +2024-07-26 00:30:39,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1498/ 1625], loss: 1.111, per_step_time: 1471ms, lr: 2.0159487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:39,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43683 samples/s/p 0:42:57 } +2024-07-26 00:30:41,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1500/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.0136595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:41,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% 
|████████████████████████████████████████████ | 5.43740 samples/s/p 0:42:54 } +2024-07-26 00:30:44,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1502/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.0113716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:44,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43415 samples/s/p 0:42:53 } +2024-07-26 00:30:47,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1504/ 1625], loss: 1.056, per_step_time: 1470ms, lr: 2.0090874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:47,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43966 samples/s/p 0:42:47 } +2024-07-26 00:30:50,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1506/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.0068057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:50,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43881 samples/s/p 0:42:45 } +2024-07-26 00:30:53,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1508/ 1625], loss: 1.013, per_step_time: 1470ms, lr: 2.0045259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:53,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43911 samples/s/p 0:42:42 } +2024-07-26 00:30:56,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1510/ 1625], loss: 1.035, per_step_time: 1470ms, lr: 2.0022485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:56,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% 
|████████████████████████████████████████████ | 5.43914 samples/s/p 0:42:39 } +2024-07-26 00:30:59,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1512/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 1.9999738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:59,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43569 samples/s/p 0:42:37 } +2024-07-26 00:31:02,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1514/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 1.9977024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:02,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43735 samples/s/p 0:42:34 } +2024-07-26 00:31:05,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1516/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 1.9954318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:05,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43841 samples/s/p 0:42:30 } +2024-07-26 00:31:08,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1518/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 1.9931658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:08,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.42999 samples/s/p 0:42:31 } +2024-07-26 00:31:11,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1520/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.9909023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:11,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% 
|████████████████████████████████████████████ | 5.43995 samples/s/p 0:42:24 } +2024-07-26 00:31:14,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1522/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 1.988638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:14,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.43621 samples/s/p 0:42:22 } +2024-07-26 00:31:17,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1524/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 1.9863796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:17,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.44184 samples/s/p 0:42:17 } +2024-07-26 00:31:20,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1526/ 1625], loss: 1.031, per_step_time: 1470ms, lr: 1.9841232e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:20,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.44052 samples/s/p 0:42:15 } +2024-07-26 00:31:23,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1528/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 1.9818672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:23,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.43526 samples/s/p 0:42:14 } +2024-07-26 00:31:26,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1530/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 1.9796166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:26,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% 
|████████████████████████████████████████████ | 5.43895 samples/s/p 0:42:09 } +2024-07-26 00:31:29,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1532/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.977366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:29,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.43420 samples/s/p 0:42:09 } +2024-07-26 00:31:32,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1534/ 1625], loss: 1.170, per_step_time: 1473ms, lr: 1.9751183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:32,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.42800 samples/s/p 0:42:09 } +2024-07-26 00:31:35,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1536/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.9728745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:35,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.43524 samples/s/p 0:42:02 } +2024-07-26 00:31:38,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1538/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 1.9706317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:38,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.43293 samples/s/p 0:42:00 } +2024-07-26 00:31:40,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1540/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 1.9683916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:40,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% 
|████████████████████████████████████████████ | 5.43339 samples/s/p 0:41:57 } +2024-07-26 00:31:43,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1542/ 1625], loss: 1.079, per_step_time: 1473ms, lr: 1.9661557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:43,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.43087 samples/s/p 0:41:55 } +2024-07-26 00:31:46,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1544/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 1.9639208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:46,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.42808 samples/s/p 0:41:54 } +2024-07-26 00:31:49,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1546/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 1.9616884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:49,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.43191 samples/s/p 0:41:49 } +2024-07-26 00:31:52,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1548/ 1625], loss: 1.151, per_step_time: 1470ms, lr: 1.9594595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:52,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.44187 samples/s/p 0:41:42 } +2024-07-26 00:31:55,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1550/ 1625], loss: 1.286, per_step_time: 1471ms, lr: 1.9572321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:55,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% 
|████████████████████████████████████████████ | 5.43715 samples/s/p 0:41:41 } +2024-07-26 00:31:58,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1552/ 1625], loss: 1.164, per_step_time: 1473ms, lr: 1.9550075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:58,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43095 samples/s/p 0:41:41 } +2024-07-26 00:32:01,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1554/ 1625], loss: 0.970, per_step_time: 1471ms, lr: 1.9527856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:01,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43805 samples/s/p 0:41:35 } +2024-07-26 00:32:04,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1556/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.9505653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:04,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43544 samples/s/p 0:41:33 } +2024-07-26 00:32:07,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1558/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 1.9483475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:07,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43680 samples/s/p 0:41:29 } +2024-07-26 00:32:10,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1560/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 1.9461334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:10,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% 
|████████████████████████████████████████████ | 5.43088 samples/s/p 0:41:29 } +2024-07-26 00:32:13,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1562/ 1625], loss: 1.074, per_step_time: 1470ms, lr: 1.9439217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:13,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.44014 samples/s/p 0:41:22 } +2024-07-26 00:32:16,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1564/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 1.941711e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:16,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43296 samples/s/p 0:41:22 } +2024-07-26 00:32:19,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1566/ 1625], loss: 1.263, per_step_time: 1476ms, lr: 1.9395043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:19,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.41894 samples/s/p 0:41:26 } +2024-07-26 00:32:22,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1568/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 1.9372997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:22,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43399 samples/s/p 0:41:16 } +2024-07-26 00:32:25,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1570/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 1.9350991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:25,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% 
|████████████████████████████████████████████ | 5.43800 samples/s/p 0:41:11 } +2024-07-26 00:32:28,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1572/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 1.932897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:28,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43435 samples/s/p 0:41:10 } +2024-07-26 00:32:31,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1574/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 1.9307017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:31,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43391 samples/s/p 0:41:07 } +2024-07-26 00:32:34,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1576/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.9285076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:34,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43655 samples/s/p 0:41:03 } +2024-07-26 00:32:37,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1578/ 1625], loss: 1.151, per_step_time: 1470ms, lr: 1.926313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:37,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43869 samples/s/p 0:40:59 } +2024-07-26 00:32:39,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1580/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 1.9241247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:39,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% 
|████████████████████████████████████████████ | 5.43410 samples/s/p 0:40:58 } +2024-07-26 00:32:42,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1582/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 1.921938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:42,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43261 samples/s/p 0:40:56 } +2024-07-26 00:32:45,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1584/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 1.9197541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:45,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43533 samples/s/p 0:40:52 } +2024-07-26 00:32:48,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1586/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 1.917571e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:48,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.44080 samples/s/p 0:40:46 } +2024-07-26 00:32:51,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1588/ 1625], loss: 1.420, per_step_time: 1471ms, lr: 1.9153913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:51,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.43757 samples/s/p 0:40:45 } +2024-07-26 00:32:54,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1590/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 1.913215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:54,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% 
|████████████████████████████████████████████ | 5.43514 samples/s/p 0:40:43 } +2024-07-26 00:32:57,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1592/ 1625], loss: 1.220, per_step_time: 1470ms, lr: 1.9110398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:57,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.43926 samples/s/p 0:40:38 } +2024-07-26 00:33:00,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1594/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 1.908868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:00,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.43937 samples/s/p 0:40:35 } +2024-07-26 00:33:03,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1596/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.9066994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:03,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.43439 samples/s/p 0:40:34 } +2024-07-26 00:33:06,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1598/ 1625], loss: 1.161, per_step_time: 1474ms, lr: 1.904531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:06,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.42679 samples/s/p 0:40:35 } +2024-07-26 00:33:09,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1600/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.9023669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:09,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% 
|████████████████████████████████████████████ | 5.43239 samples/s/p 0:40:29 } +2024-07-26 00:33:12,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1602/ 1625], loss: 1.007, per_step_time: 1472ms, lr: 1.9002052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:12,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43465 samples/s/p 0:40:25 } +2024-07-26 00:33:15,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1604/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 1.8980454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:15,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43448 samples/s/p 0:40:23 } +2024-07-26 00:33:18,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1606/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 1.8958883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:18,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43574 samples/s/p 0:40:19 } +2024-07-26 00:33:21,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1608/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 1.8937328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:21,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43620 samples/s/p 0:40:16 } +2024-07-26 00:33:24,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1610/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 1.8915816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:24,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% 
|████████████████████████████████████████████ | 5.43253 samples/s/p 0:40:15 } +2024-07-26 00:33:27,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1612/ 1625], loss: 1.299, per_step_time: 1472ms, lr: 1.8894331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:27,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43305 samples/s/p 0:40:11 } +2024-07-26 00:33:30,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1614/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 1.8872854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:30,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43471 samples/s/p 0:40:08 } +2024-07-26 00:33:33,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1616/ 1625], loss: 1.144, per_step_time: 1474ms, lr: 1.8851403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:33,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.42724 samples/s/p 0:40:08 } +2024-07-26 00:33:36,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1618/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 1.8829994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:36,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.42981 samples/s/p 0:40:04 } +2024-07-26 00:33:39,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1620/ 1625], loss: 1.160, per_step_time: 1470ms, lr: 1.8808604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:39,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% 
|████████████████████████████████████████████ | 5.43854 samples/s/p 0:39:57 } +2024-07-26 00:33:41,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1622/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 1.8787222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:41,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.43455 samples/s/p 0:39:56 } +2024-07-26 00:33:44,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1624/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 1.8765884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:44,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.43742 samples/s/p 0:39:52 } +2024-07-26 00:33:47,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 1.874457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:47,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.43518 samples/s/p 0:39:50 } +2024-07-26 00:33:50,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 3/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 1.8723283e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:50,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.43409 samples/s/p 0:39:47 } +2024-07-26 00:33:53,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 5/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 1.8702005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:53,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% 
|█████████████████████████████████████████████ | 5.43237 samples/s/p 0:39:45 } +2024-07-26 00:33:56,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 7/ 1625], loss: 1.157, per_step_time: 1475ms, lr: 1.8680762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:56,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.42339 samples/s/p 0:39:46 } +2024-07-26 00:33:59,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 9/ 1625], loss: 1.079, per_step_time: 1472ms, lr: 1.8659543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:59,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.43368 samples/s/p 0:39:39 } +2024-07-26 00:34:02,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 11/ 1625], loss: 1.025, per_step_time: 1470ms, lr: 1.8638343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:02,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.44151 samples/s/p 0:39:32 } +2024-07-26 00:34:05,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 13/ 1625], loss: 1.202, per_step_time: 1474ms, lr: 1.8617186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:05,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.42428 samples/s/p 0:39:37 } +2024-07-26 00:34:08,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 15/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.8596038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:08,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% 
|█████████████████████████████████████████████ | 5.44075 samples/s/p 0:39:27 } +2024-07-26 00:34:11,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 17/ 1625], loss: 0.964, per_step_time: 1470ms, lr: 1.8574915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:11,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.43920 samples/s/p 0:39:25 } +2024-07-26 00:34:14,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 19/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 1.8553835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:14,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.43358 samples/s/p 0:39:24 } +2024-07-26 00:34:17,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 21/ 1625], loss: 1.285, per_step_time: 1469ms, lr: 1.8532755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:17,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.44324 samples/s/p 0:39:17 } +2024-07-26 00:34:20,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 23/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 1.8511719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:20,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.43372 samples/s/p 0:39:18 } +2024-07-26 00:34:23,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 25/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.84907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:23,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% 
|█████████████████████████████████████████████ | 5.43313 samples/s/p 0:39:15 } +2024-07-26 00:34:26,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 27/ 1625], loss: 1.088, per_step_time: 1471ms, lr: 1.8469707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:26,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43717 samples/s/p 0:39:11 } +2024-07-26 00:34:29,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 29/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 1.8448749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:29,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43051 samples/s/p 0:39:11 } +2024-07-26 00:34:32,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 31/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 1.8427816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:32,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43552 samples/s/p 0:39:06 } +2024-07-26 00:34:35,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 33/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 1.8406874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:35,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43561 samples/s/p 0:39:03 } +2024-07-26 00:34:38,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 35/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 1.8385986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:38,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% 
|█████████████████████████████████████████████ | 5.43645 samples/s/p 0:38:59 } +2024-07-26 00:34:40,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 37/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 1.836514e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:40,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43474 samples/s/p 0:38:57 } +2024-07-26 00:34:43,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 39/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.8344285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:43,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43727 samples/s/p 0:38:53 } +2024-07-26 00:34:46,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 41/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 1.8323465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:46,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43460 samples/s/p 0:38:51 } +2024-07-26 00:34:49,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 43/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 1.8302687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:49,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43515 samples/s/p 0:38:48 } +2024-07-26 00:34:52,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 45/ 1625], loss: 1.299, per_step_time: 1471ms, lr: 1.8281928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:52,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% 
|█████████████████████████████████████████████ | 5.43651 samples/s/p 0:38:45 } +2024-07-26 00:34:55,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 47/ 1625], loss: 1.103, per_step_time: 1473ms, lr: 1.8261185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:55,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43000 samples/s/p 0:38:44 } +2024-07-26 00:34:58,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 49/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 1.8240469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:58,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43438 samples/s/p 0:38:40 } +2024-07-26 00:35:01,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 51/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 1.8219787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:01,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43384 samples/s/p 0:38:37 } +2024-07-26 00:35:04,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 53/ 1625], loss: 1.175, per_step_time: 1474ms, lr: 1.8199123e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:04,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.42641 samples/s/p 0:38:37 } +2024-07-26 00:35:07,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 55/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 1.8178475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:07,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% 
|█████████████████████████████████████████████ | 5.43744 samples/s/p 0:38:29 } +2024-07-26 00:35:10,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 57/ 1625], loss: 1.223, per_step_time: 1470ms, lr: 1.8157862e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:10,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.44105 samples/s/p 0:38:25 } +2024-07-26 00:35:13,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 59/ 1625], loss: 0.952, per_step_time: 1471ms, lr: 1.8137284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:13,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.43662 samples/s/p 0:38:24 } +2024-07-26 00:35:16,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 61/ 1625], loss: 1.110, per_step_time: 1473ms, lr: 1.8116714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:16,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.43046 samples/s/p 0:38:24 } +2024-07-26 00:35:19,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 63/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 1.8096171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:19,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.43511 samples/s/p 0:38:19 } +2024-07-26 00:35:22,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 65/ 1625], loss: 0.928, per_step_time: 1472ms, lr: 1.8075671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:22,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% 
|█████████████████████████████████████████████ | 5.43156 samples/s/p 0:38:17 } +2024-07-26 00:35:25,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 67/ 1625], loss: 1.096, per_step_time: 1473ms, lr: 1.8055188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:25,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.42784 samples/s/p 0:38:16 } +2024-07-26 00:35:28,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 69/ 1625], loss: 1.183, per_step_time: 1474ms, lr: 1.8034722e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:28,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.42510 samples/s/p 0:38:14 } +2024-07-26 00:35:31,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 71/ 1625], loss: 1.257, per_step_time: 1473ms, lr: 1.8014273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:31,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.42885 samples/s/p 0:38:09 } +2024-07-26 00:35:34,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 73/ 1625], loss: 1.043, per_step_time: 1471ms, lr: 1.7993868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:34,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.43539 samples/s/p 0:38:04 } +2024-07-26 00:35:37,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 75/ 1625], loss: 0.976, per_step_time: 1474ms, lr: 1.7973497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:37,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% 
|█████████████████████████████████████████████ | 5.42432 samples/s/p 0:38:05 } +2024-07-26 00:35:40,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 77/ 1625], loss: 1.014, per_step_time: 1471ms, lr: 1.7953125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:40,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43757 samples/s/p 0:37:57 } +2024-07-26 00:35:42,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 79/ 1625], loss: 1.228, per_step_time: 1472ms, lr: 1.793279e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:42,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43405 samples/s/p 0:37:56 } +2024-07-26 00:35:45,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 81/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 1.7912497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:45,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43409 samples/s/p 0:37:53 } +2024-07-26 00:35:48,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 83/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 1.7892187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:48,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43244 samples/s/p 0:37:50 } +2024-07-26 00:35:51,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 85/ 1625], loss: 1.025, per_step_time: 1473ms, lr: 1.7871937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:51,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% 
|█████████████████████████████████████████████ | 5.43094 samples/s/p 0:37:48 } +2024-07-26 00:35:54,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 87/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 1.7851713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:54,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43133 samples/s/p 0:37:45 } +2024-07-26 00:35:57,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 89/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 1.783149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:57,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.42858 samples/s/p 0:37:43 } +2024-07-26 00:36:00,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 91/ 1625], loss: 0.966, per_step_time: 1469ms, lr: 1.7811317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:00,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.44338 samples/s/p 0:37:34 } +2024-07-26 00:36:03,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 93/ 1625], loss: 1.217, per_step_time: 1478ms, lr: 1.7791153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:03,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.41223 samples/s/p 0:37:44 } +2024-07-26 00:36:06,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 95/ 1625], loss: 1.083, per_step_time: 1473ms, lr: 1.7771025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:06,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% 
|█████████████████████████████████████████████ | 5.42932 samples/s/p 0:37:34 } +2024-07-26 00:36:09,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 97/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 1.7750922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:09,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.43968 samples/s/p 0:37:27 } +2024-07-26 00:36:12,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 99/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 1.7730837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:12,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.43657 samples/s/p 0:37:25 } +2024-07-26 00:36:15,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 101/ 1625], loss: 0.986, per_step_time: 1471ms, lr: 1.7710777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:15,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.43742 samples/s/p 0:37:22 } +2024-07-26 00:36:18,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 103/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 1.7690743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:18,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.44003 samples/s/p 0:37:18 } +2024-07-26 00:36:21,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 105/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 1.7670752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:21,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% 
|█████████████████████████████████████████████ | 5.43275 samples/s/p 0:37:18 } +2024-07-26 00:36:24,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 107/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 1.7650761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:24,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43723 samples/s/p 0:37:13 } +2024-07-26 00:36:27,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 109/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.7630806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:27,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43655 samples/s/p 0:37:10 } +2024-07-26 00:36:30,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 111/ 1625], loss: 1.137, per_step_time: 1473ms, lr: 1.7610876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:30,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43052 samples/s/p 0:37:10 } +2024-07-26 00:36:33,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 113/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.759098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:33,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43205 samples/s/p 0:37:06 } +2024-07-26 00:36:36,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 115/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 1.7571094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:36,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% 
|█████████████████████████████████████████████ | 5.43290 samples/s/p 0:37:03 } +2024-07-26 00:36:39,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 117/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 1.7551233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:39,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43865 samples/s/p 0:36:58 } +2024-07-26 00:36:42,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 119/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 1.7531424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:42,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43157 samples/s/p 0:36:58 } +2024-07-26 00:36:44,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 121/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 1.7511607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:44,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.44046 samples/s/p 0:36:51 } +2024-07-26 00:36:47,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 123/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.7491832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:47,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43547 samples/s/p 0:36:50 } +2024-07-26 00:36:50,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 125/ 1625], loss: 1.322, per_step_time: 1471ms, lr: 1.7472075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:50,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% 
|█████████████████████████████████████████████ | 5.43751 samples/s/p 0:36:46 } +2024-07-26 00:36:53,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 127/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 1.7452353e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:53,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43573 samples/s/p 0:36:44 } +2024-07-26 00:36:56,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 129/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 1.7432646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:56,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43874 samples/s/p 0:36:40 } +2024-07-26 00:36:59,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 131/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 1.7412976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:59,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43749 samples/s/p 0:36:38 } +2024-07-26 00:37:02,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 133/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 1.7393314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:02,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43748 samples/s/p 0:36:35 } +2024-07-26 00:37:05,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 135/ 1625], loss: 1.207, per_step_time: 1473ms, lr: 1.7373695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:05,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% 
|█████████████████████████████████████████████ | 5.42990 samples/s/p 0:36:35 } +2024-07-26 00:37:08,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 137/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.7354103e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:08,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43211 samples/s/p 0:36:31 } +2024-07-26 00:37:11,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 139/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 1.733451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:11,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43546 samples/s/p 0:36:27 } +2024-07-26 00:37:14,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 141/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 1.7314977e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:14,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43493 samples/s/p 0:36:24 } +2024-07-26 00:37:17,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 143/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.7295454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:17,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43132 samples/s/p 0:36:22 } +2024-07-26 00:37:20,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 145/ 1625], loss: 1.144, per_step_time: 1473ms, lr: 1.7275947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:20,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% 
|█████████████████████████████████████████████ | 5.42978 samples/s/p 0:36:20 } +2024-07-26 00:37:23,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 147/ 1625], loss: 0.965, per_step_time: 1474ms, lr: 1.7256475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:23,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.42488 samples/s/p 0:36:19 } +2024-07-26 00:37:26,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 149/ 1625], loss: 1.017, per_step_time: 1472ms, lr: 1.7237029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:26,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43145 samples/s/p 0:36:14 } +2024-07-26 00:37:29,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 151/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 1.7217609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:29,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.42959 samples/s/p 0:36:11 } +2024-07-26 00:37:32,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 153/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 1.7198215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:32,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43222 samples/s/p 0:36:07 } +2024-07-26 00:37:35,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 155/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 1.7178838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:35,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% 
|█████████████████████████████████████████████ | 5.43220 samples/s/p 0:36:04 } +2024-07-26 00:37:38,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 157/ 1625], loss: 1.014, per_step_time: 1471ms, lr: 1.7159505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:38,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43844 samples/s/p 0:35:59 } +2024-07-26 00:37:41,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 159/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.7140179e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:41,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43370 samples/s/p 0:35:58 } +2024-07-26 00:37:43,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 161/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 1.712088e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:43,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43789 samples/s/p 0:35:53 } +2024-07-26 00:37:46,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 163/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.7101625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:46,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43641 samples/s/p 0:35:51 } +2024-07-26 00:37:49,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 165/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 1.7082368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:49,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% 
|█████████████████████████████████████████████ | 5.43458 samples/s/p 0:35:49 } +2024-07-26 00:37:52,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 167/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 1.7063146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:52,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43628 samples/s/p 0:35:45 } +2024-07-26 00:37:55,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 169/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 1.7043969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:55,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43091 samples/s/p 0:35:44 } +2024-07-26 00:37:58,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 171/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 1.702479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:58,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.43395 samples/s/p 0:35:40 } +2024-07-26 00:38:01,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 173/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 1.7005664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:01,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.43717 samples/s/p 0:35:36 } +2024-07-26 00:38:04,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 175/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.6986538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:04,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% 
|█████████████████████████████████████████████ | 5.43278 samples/s/p 0:35:35 } +2024-07-26 00:38:07,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 177/ 1625], loss: 1.042, per_step_time: 1471ms, lr: 1.6967438e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:07,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.43514 samples/s/p 0:35:31 } +2024-07-26 00:38:10,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 179/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 1.6948381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:10,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.43998 samples/s/p 0:35:26 } +2024-07-26 00:38:13,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 181/ 1625], loss: 1.048, per_step_time: 1469ms, lr: 1.6929341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:13,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.44425 samples/s/p 0:35:21 } +2024-07-26 00:38:16,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 183/ 1625], loss: 1.265, per_step_time: 1470ms, lr: 1.691031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:16,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.43922 samples/s/p 0:35:20 } +2024-07-26 00:38:19,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 185/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 1.6891331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:19,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% 
|█████████████████████████████████████████████ | 5.43506 samples/s/p 0:35:19 } +2024-07-26 00:38:22,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 187/ 1625], loss: 1.160, per_step_time: 1475ms, lr: 1.6872377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:22,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.42162 samples/s/p 0:35:21 } +2024-07-26 00:38:25,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 189/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 1.6853432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:25,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43444 samples/s/p 0:35:13 } +2024-07-26 00:38:28,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 191/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.6834522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:28,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43230 samples/s/p 0:35:11 } +2024-07-26 00:38:31,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 193/ 1625], loss: 1.224, per_step_time: 1474ms, lr: 1.6815638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:31,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.42560 samples/s/p 0:35:11 } +2024-07-26 00:38:34,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 195/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 1.6796771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:34,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% 
|█████████████████████████████████████████████ | 5.43632 samples/s/p 0:35:04 } +2024-07-26 00:38:37,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 197/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 1.6777931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:37,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43422 samples/s/p 0:35:02 } +2024-07-26 00:38:40,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 199/ 1625], loss: 1.009, per_step_time: 1471ms, lr: 1.6759124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:40,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43509 samples/s/p 0:34:58 } +2024-07-26 00:38:43,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 201/ 1625], loss: 1.016, per_step_time: 1470ms, lr: 1.6740352e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:43,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.44150 samples/s/p 0:34:53 } +2024-07-26 00:38:45,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 203/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 1.6721572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:45,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43358 samples/s/p 0:34:53 } +2024-07-26 00:38:48,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 205/ 1625], loss: 1.088, per_step_time: 1472ms, lr: 1.6702834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:48,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% 
|█████████████████████████████████████████████ | 5.43136 samples/s/p 0:34:51 } +2024-07-26 00:38:51,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 207/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.6684139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:51,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.43496 samples/s/p 0:34:47 } +2024-07-26 00:38:54,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 209/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 1.6665446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:54,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.43662 samples/s/p 0:34:43 } +2024-07-26 00:38:57,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 211/ 1625], loss: 1.155, per_step_time: 1473ms, lr: 1.6646795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:57,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.42939 samples/s/p 0:34:43 } +2024-07-26 00:39:00,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 213/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 1.662817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:00,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.43108 samples/s/p 0:34:39 } +2024-07-26 00:39:03,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 215/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.6609554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:03,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% 
|█████████████████████████████████████████████ | 5.43577 samples/s/p 0:34:35 } +2024-07-26 00:39:06,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 217/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 1.659098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:06,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.43984 samples/s/p 0:34:30 } +2024-07-26 00:39:09,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 219/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 1.6572433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:09,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.43505 samples/s/p 0:34:29 } +2024-07-26 00:39:12,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 221/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 1.6553886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:12,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43211 samples/s/p 0:34:27 } +2024-07-26 00:39:15,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 223/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.6535391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:15,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43612 samples/s/p 0:34:23 } +2024-07-26 00:39:18,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 225/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 1.6516913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:18,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% 
|█████████████████████████████████████████████ | 5.44106 samples/s/p 0:34:18 } +2024-07-26 00:39:21,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 227/ 1625], loss: 1.090, per_step_time: 1473ms, lr: 1.6498452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:21,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.42997 samples/s/p 0:34:19 } +2024-07-26 00:39:24,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 229/ 1625], loss: 1.369, per_step_time: 1471ms, lr: 1.6480035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:24,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43501 samples/s/p 0:34:14 } +2024-07-26 00:39:27,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 231/ 1625], loss: 1.009, per_step_time: 1472ms, lr: 1.6461626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:27,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43424 samples/s/p 0:34:12 } +2024-07-26 00:39:30,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 233/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 1.644326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:30,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43489 samples/s/p 0:34:08 } +2024-07-26 00:39:33,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 235/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 1.6424902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:33,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% 
|█████████████████████████████████████████████ | 5.43885 samples/s/p 0:34:04 } +2024-07-26 00:39:36,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 237/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.6406572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:36,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43363 samples/s/p 0:34:03 } +2024-07-26 00:39:39,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 239/ 1625], loss: 1.005, per_step_time: 1471ms, lr: 1.6388275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:39,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43843 samples/s/p 0:33:58 } +2024-07-26 00:39:42,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 241/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.6369995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:42,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43750 samples/s/p 0:33:56 } +2024-07-26 00:39:44,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 243/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 1.6351751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:44,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43499 samples/s/p 0:33:54 } +2024-07-26 00:39:47,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 245/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 1.6333532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:47,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% 
|█████████████████████████████████████████████ | 5.43746 samples/s/p 0:33:50 } +2024-07-26 00:39:50,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 247/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 1.6315331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:50,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43963 samples/s/p 0:33:46 } +2024-07-26 00:39:53,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 249/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 1.6297164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:53,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43188 samples/s/p 0:33:46 } +2024-07-26 00:39:56,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 251/ 1625], loss: 1.268, per_step_time: 1472ms, lr: 1.6279023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:56,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43177 samples/s/p 0:33:43 } +2024-07-26 00:39:59,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 253/ 1625], loss: 0.906, per_step_time: 1473ms, lr: 1.626089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:59,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43070 samples/s/p 0:33:41 } +2024-07-26 00:40:02,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 255/ 1625], loss: 1.126, per_step_time: 1473ms, lr: 1.6242784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:02,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% 
|█████████████████████████████████████████████ | 5.43010 samples/s/p 0:33:38 } +2024-07-26 00:40:05,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 257/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.6224739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:05,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43551 samples/s/p 0:33:33 } +2024-07-26 00:40:08,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 259/ 1625], loss: 1.244, per_step_time: 1471ms, lr: 1.6206675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:08,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43670 samples/s/p 0:33:30 } +2024-07-26 00:40:11,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 261/ 1625], loss: 1.264, per_step_time: 1471ms, lr: 1.618868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:11,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43691 samples/s/p 0:33:27 } +2024-07-26 00:40:14,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 263/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 1.6170687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:14,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43811 samples/s/p 0:33:23 } +2024-07-26 00:40:17,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 265/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.6152701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:17,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% 
|█████████████████████████████████████████████ | 5.43704 samples/s/p 0:33:21 } +2024-07-26 00:40:20,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 267/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 1.6134777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:20,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43950 samples/s/p 0:33:17 } +2024-07-26 00:40:23,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 269/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 1.611686e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:23,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.43624 samples/s/p 0:33:15 } +2024-07-26 00:40:26,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 271/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.609897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:26,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.43298 samples/s/p 0:33:13 } +2024-07-26 00:40:29,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 273/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.6081106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:29,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.43269 samples/s/p 0:33:10 } +2024-07-26 00:40:32,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 275/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.6063259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:32,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% 
|█████████████████████████████████████████████ | 5.43847 samples/s/p 0:33:05 } +2024-07-26 00:40:35,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 277/ 1625], loss: 1.119, per_step_time: 1470ms, lr: 1.6045447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:35,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.43983 samples/s/p 0:33:02 } +2024-07-26 00:40:38,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 279/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 1.6027659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:38,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.44054 samples/s/p 0:32:59 } +2024-07-26 00:40:41,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 281/ 1625], loss: 1.128, per_step_time: 1470ms, lr: 1.6009908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:41,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.44104 samples/s/p 0:32:56 } +2024-07-26 00:40:43,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 283/ 1625], loss: 1.322, per_step_time: 1471ms, lr: 1.5992164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:43,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.43640 samples/s/p 0:32:54 } +2024-07-26 00:40:46,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 285/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.5974456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:46,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% 
|█████████████████████████████████████████████ | 5.43674 samples/s/p 0:32:51 } +2024-07-26 00:40:49,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 287/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 1.5956773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:49,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43917 samples/s/p 0:32:47 } +2024-07-26 00:40:52,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 289/ 1625], loss: 1.068, per_step_time: 1472ms, lr: 1.5939098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:52,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43136 samples/s/p 0:32:47 } +2024-07-26 00:40:55,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 291/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.5921476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:55,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43317 samples/s/p 0:32:44 } +2024-07-26 00:40:58,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 293/ 1625], loss: 1.281, per_step_time: 1470ms, lr: 1.590387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:58,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43947 samples/s/p 0:32:39 } +2024-07-26 00:41:01,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 295/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 1.5886292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:01,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% 
|█████████████████████████████████████████████ | 5.43880 samples/s/p 0:32:36 } +2024-07-26 00:41:04,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 297/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.5868729e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:04,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43393 samples/s/p 0:32:35 } +2024-07-26 00:41:07,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 299/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 1.5851193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:07,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.42995 samples/s/p 0:32:33 } +2024-07-26 00:41:10,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 301/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 1.58337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:10,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.43462 samples/s/p 0:32:28 } +2024-07-26 00:41:13,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 303/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 1.5816208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:13,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.43708 samples/s/p 0:32:25 } +2024-07-26 00:41:16,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 305/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.5798759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:16,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% 
|█████████████████████████████████████████████ | 5.44076 samples/s/p 0:32:20 } +2024-07-26 00:41:19,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 307/ 1625], loss: 1.111, per_step_time: 1471ms, lr: 1.5781335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:19,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.43517 samples/s/p 0:32:19 } +2024-07-26 00:41:22,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 309/ 1625], loss: 1.203, per_step_time: 1473ms, lr: 1.5763919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:22,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.43020 samples/s/p 0:32:18 } +2024-07-26 00:41:25,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 311/ 1625], loss: 0.902, per_step_time: 1470ms, lr: 1.5746565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:25,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.44122 samples/s/p 0:32:11 } +2024-07-26 00:41:28,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 313/ 1625], loss: 1.126, per_step_time: 1470ms, lr: 1.5729202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:28,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.44158 samples/s/p 0:32:08 } +2024-07-26 00:41:31,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 315/ 1625], loss: 1.332, per_step_time: 1471ms, lr: 1.5711882e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:31,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% 
|█████████████████████████████████████████████ | 5.43500 samples/s/p 0:32:08 } +2024-07-26 00:41:34,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 317/ 1625], loss: 1.299, per_step_time: 1471ms, lr: 1.5694588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:34,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.43608 samples/s/p 0:32:04 } +2024-07-26 00:41:37,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 319/ 1625], loss: 0.963, per_step_time: 1471ms, lr: 1.5677294e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:37,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.43778 samples/s/p 0:32:01 } +2024-07-26 00:41:40,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 321/ 1625], loss: 0.991, per_step_time: 1472ms, lr: 1.5660053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:40,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.43428 samples/s/p 0:31:59 } +2024-07-26 00:41:42,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 323/ 1625], loss: 1.289, per_step_time: 1472ms, lr: 1.5642827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:42,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.43258 samples/s/p 0:31:57 } +2024-07-26 00:41:45,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 325/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 1.5625645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:45,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% 
|██████████████████████████████████████████████ | 5.43912 samples/s/p 0:31:52 } +2024-07-26 00:41:48,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 327/ 1625], loss: 1.026, per_step_time: 1473ms, lr: 1.5608464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:48,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.43074 samples/s/p 0:31:52 } +2024-07-26 00:41:51,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 329/ 1625], loss: 0.977, per_step_time: 1471ms, lr: 1.5591326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:51,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.43555 samples/s/p 0:31:47 } +2024-07-26 00:41:54,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 331/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 1.5574204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:54,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.43600 samples/s/p 0:31:44 } +2024-07-26 00:41:57,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 333/ 1625], loss: 0.999, per_step_time: 1471ms, lr: 1.55571e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:57,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.43710 samples/s/p 0:31:41 } +2024-07-26 00:42:00,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 335/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.554004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:00,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% 
|██████████████████████████████████████████████ | 5.43382 samples/s/p 0:31:39 } +2024-07-26 00:42:03,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 337/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.5523005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:03,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.43608 samples/s/p 0:31:35 } +2024-07-26 00:42:06,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 339/ 1625], loss: 0.954, per_step_time: 1474ms, lr: 1.5505988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:06,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.42733 samples/s/p 0:31:35 } +2024-07-26 00:42:09,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 341/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 1.5488988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:09,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.43807 samples/s/p 0:31:28 } +2024-07-26 00:42:12,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 343/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 1.547204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:12,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.44034 samples/s/p 0:31:25 } +2024-07-26 00:42:15,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 345/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 1.54551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:15,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% 
|██████████████████████████████████████████████ | 5.43276 samples/s/p 0:31:24 } +2024-07-26 00:42:18,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 347/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 1.5438169e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:18,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.43439 samples/s/p 0:31:21 } +2024-07-26 00:42:21,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 349/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.542129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:21,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.43232 samples/s/p 0:31:19 } +2024-07-26 00:42:24,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 351/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.5404419e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:24,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43207 samples/s/p 0:31:16 } +2024-07-26 00:42:27,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 353/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 1.5387584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:27,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43468 samples/s/p 0:31:12 } +2024-07-26 00:42:30,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 355/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 1.5370773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:30,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% 
|██████████████████████████████████████████████ | 5.43099 samples/s/p 0:31:10 } +2024-07-26 00:42:33,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 357/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 1.535399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:33,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.44125 samples/s/p 0:31:04 } +2024-07-26 00:42:36,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 359/ 1625], loss: 1.160, per_step_time: 1470ms, lr: 1.5337239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:36,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43890 samples/s/p 0:31:02 } +2024-07-26 00:42:39,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 361/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 1.5320508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:39,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43531 samples/s/p 0:31:00 } +2024-07-26 00:42:42,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 363/ 1625], loss: 1.280, per_step_time: 1471ms, lr: 1.5303801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:42,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43797 samples/s/p 0:30:56 } +2024-07-26 00:42:44,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 365/ 1625], loss: 1.150, per_step_time: 1474ms, lr: 1.5287121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:44,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% 
|██████████████████████████████████████████████ | 5.42623 samples/s/p 0:30:57 } +2024-07-26 00:42:47,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 367/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.5270457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:47,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43363 samples/s/p 0:30:52 } +2024-07-26 00:42:50,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 369/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 1.5253838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:50,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43556 samples/s/p 0:30:48 } +2024-07-26 00:42:53,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 371/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 1.5237226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:53,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43530 samples/s/p 0:30:45 } +2024-07-26 00:42:56,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 373/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.5220651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:56,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43402 samples/s/p 0:30:43 } +2024-07-26 00:42:59,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 375/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.5204091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:59,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% 
|██████████████████████████████████████████████ | 5.43343 samples/s/p 0:30:40 } +2024-07-26 00:43:02,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 377/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.5187566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:02,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43255 samples/s/p 0:30:37 } +2024-07-26 00:43:05,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 379/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 1.5171067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:05,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43782 samples/s/p 0:30:33 } +2024-07-26 00:43:08,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 381/ 1625], loss: 1.298, per_step_time: 1470ms, lr: 1.5154585e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:08,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.44057 samples/s/p 0:30:29 } +2024-07-26 00:43:11,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 383/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 1.5138147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:11,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.42942 samples/s/p 0:30:30 } +2024-07-26 00:43:14,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 385/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 1.5121725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:14,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% 
|██████████████████████████████████████████████ | 5.44057 samples/s/p 0:30:23 } +2024-07-26 00:43:17,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 387/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.5105331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:17,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.43290 samples/s/p 0:30:22 } +2024-07-26 00:43:20,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 389/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.5088945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:20,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.43232 samples/s/p 0:30:20 } +2024-07-26 00:43:23,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 391/ 1625], loss: 0.913, per_step_time: 1471ms, lr: 1.5072601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:23,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.43519 samples/s/p 0:30:16 } +2024-07-26 00:43:26,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 393/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 1.5056283e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:26,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.43694 samples/s/p 0:30:12 } +2024-07-26 00:43:29,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 395/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 1.5039984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:29,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% 
|██████████████████████████████████████████████ | 5.43768 samples/s/p 0:30:09 } +2024-07-26 00:43:32,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 397/ 1625], loss: 1.083, per_step_time: 1474ms, lr: 1.5023718e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:32,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.42406 samples/s/p 0:30:11 } +2024-07-26 00:43:35,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 399/ 1625], loss: 1.103, per_step_time: 1470ms, lr: 1.5007479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:35,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43875 samples/s/p 0:30:03 } +2024-07-26 00:43:38,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 401/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.4991265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:38,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43633 samples/s/p 0:30:01 } +2024-07-26 00:43:41,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 403/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 1.4975077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:41,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43665 samples/s/p 0:29:58 } +2024-07-26 00:43:43,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 405/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 1.4958907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:43,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% 
|██████████████████████████████████████████████ | 5.43544 samples/s/p 0:29:55 } +2024-07-26 00:43:46,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 407/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 1.4942771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:46,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43844 samples/s/p 0:29:51 } +2024-07-26 00:43:49,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 409/ 1625], loss: 1.046, per_step_time: 1470ms, lr: 1.4926661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:49,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43880 samples/s/p 0:29:48 } +2024-07-26 00:43:52,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 411/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 1.4910568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:52,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43723 samples/s/p 0:29:46 } +2024-07-26 00:43:55,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 413/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 1.489451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:55,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43874 samples/s/p 0:29:42 } +2024-07-26 00:43:58,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 415/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 1.4878469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:58,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% 
|██████████████████████████████████████████████ | 5.43178 samples/s/p 0:29:42 } +2024-07-26 00:44:01,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 417/ 1625], loss: 1.188, per_step_time: 1470ms, lr: 1.4862454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:01,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.44065 samples/s/p 0:29:36 } +2024-07-26 00:44:04,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 419/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 1.4846482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:04,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43611 samples/s/p 0:29:34 } +2024-07-26 00:44:07,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 421/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 1.4830528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:07,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43788 samples/s/p 0:29:31 } +2024-07-26 00:44:10,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 423/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.4814591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:10,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43509 samples/s/p 0:29:29 } +2024-07-26 00:44:13,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 425/ 1625], loss: 1.126, per_step_time: 1469ms, lr: 1.4798671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:13,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% 
|██████████████████████████████████████████████ | 5.44422 samples/s/p 0:29:23 } +2024-07-26 00:44:16,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 427/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 1.4782795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:16,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43538 samples/s/p 0:29:23 } +2024-07-26 00:44:19,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 429/ 1625], loss: 1.321, per_step_time: 1471ms, lr: 1.4766936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:19,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43565 samples/s/p 0:29:20 } +2024-07-26 00:44:22,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 431/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 1.475112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:22,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43337 samples/s/p 0:29:18 } +2024-07-26 00:44:25,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 433/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 1.4735303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:25,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43247 samples/s/p 0:29:15 } +2024-07-26 00:44:28,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 435/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 1.471953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:28,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% 
|██████████████████████████████████████████████ | 5.43422 samples/s/p 0:29:11 } +2024-07-26 00:44:31,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 437/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 1.4703784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:31,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43051 samples/s/p 0:29:10 } +2024-07-26 00:44:34,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 439/ 1625], loss: 1.077, per_step_time: 1473ms, lr: 1.4688054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:34,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.42937 samples/s/p 0:29:07 } +2024-07-26 00:44:37,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 441/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 1.4672358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:37,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43647 samples/s/p 0:29:02 } +2024-07-26 00:44:40,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 443/ 1625], loss: 1.231, per_step_time: 1473ms, lr: 1.4656689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:40,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43055 samples/s/p 0:29:01 } +2024-07-26 00:44:42,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 445/ 1625], loss: 1.142, per_step_time: 1473ms, lr: 1.4641038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:42,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% 
|██████████████████████████████████████████████ | 5.42995 samples/s/p 0:28:58 } +2024-07-26 00:44:45,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 447/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 1.4625411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:45,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43668 samples/s/p 0:28:53 } +2024-07-26 00:44:48,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 449/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.4609811e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:48,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43732 samples/s/p 0:28:50 } +2024-07-26 00:44:51,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 451/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 1.4594247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:51,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43326 samples/s/p 0:28:48 } +2024-07-26 00:44:54,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 453/ 1625], loss: 1.252, per_step_time: 1473ms, lr: 1.4578698e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:54,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43061 samples/s/p 0:28:46 } +2024-07-26 00:44:57,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 455/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 1.4563193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:57,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% 
|██████████████████████████████████████████████ | 5.43222 samples/s/p 0:28:43 } +2024-07-26 00:45:00,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 457/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.4547705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:00,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43607 samples/s/p 0:28:38 } +2024-07-26 00:45:03,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 459/ 1625], loss: 1.132, per_step_time: 1474ms, lr: 1.4532227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:03,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.42447 samples/s/p 0:28:39 } +2024-07-26 00:45:06,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 461/ 1625], loss: 1.230, per_step_time: 1470ms, lr: 1.451679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:06,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43849 samples/s/p 0:28:32 } +2024-07-26 00:45:09,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 463/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 1.4501372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:09,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43833 samples/s/p 0:28:29 } +2024-07-26 00:45:12,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 465/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 1.4485988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:12,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% 
|██████████████████████████████████████████████ | 5.43816 samples/s/p 0:28:26 } +2024-07-26 00:45:15,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 467/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.447063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:15,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.43587 samples/s/p 0:28:24 } +2024-07-26 00:45:18,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 469/ 1625], loss: 0.997, per_step_time: 1469ms, lr: 1.4455297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:18,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.44244 samples/s/p 0:28:19 } +2024-07-26 00:45:21,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 471/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.4439984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:21,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.43119 samples/s/p 0:28:19 } +2024-07-26 00:45:24,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 473/ 1625], loss: 1.298, per_step_time: 1469ms, lr: 1.4424686e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:24,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.44395 samples/s/p 0:28:12 } +2024-07-26 00:45:27,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 475/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 1.4409432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:27,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% 
|██████████████████████████████████████████████ | 5.43244 samples/s/p 0:28:13 } +2024-07-26 00:45:30,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 477/ 1625], loss: 1.009, per_step_time: 1472ms, lr: 1.4394203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:30,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.43441 samples/s/p 0:28:09 } +2024-07-26 00:45:33,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 479/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 1.4378983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:33,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.44068 samples/s/p 0:28:05 } +2024-07-26 00:45:36,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 481/ 1625], loss: 1.021, per_step_time: 1472ms, lr: 1.4363816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:36,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.43433 samples/s/p 0:28:04 } +2024-07-26 00:45:39,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 483/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 1.4348656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:39,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.43789 samples/s/p 0:28:00 } +2024-07-26 00:45:42,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 485/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 1.433354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:42,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% 
|██████████████████████████████████████████████ | 5.43100 samples/s/p 0:27:59 } +2024-07-26 00:45:44,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 487/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 1.4318424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:44,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.43971 samples/s/p 0:27:53 } +2024-07-26 00:45:47,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 489/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 1.4303342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:47,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.43737 samples/s/p 0:27:51 } +2024-07-26 00:45:50,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 491/ 1625], loss: 1.108, per_step_time: 1477ms, lr: 1.4288304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:50,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.41392 samples/s/p 0:27:55 } +2024-07-26 00:45:53,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 493/ 1625], loss: 1.139, per_step_time: 1473ms, lr: 1.4273274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:53,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.43089 samples/s/p 0:27:47 } +2024-07-26 00:45:56,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 495/ 1625], loss: 1.028, per_step_time: 1470ms, lr: 1.4258262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:56,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% 
|██████████████████████████████████████████████ | 5.44113 samples/s/p 0:27:41 } +2024-07-26 00:45:59,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 497/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 1.4243302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:59,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43751 samples/s/p 0:27:39 } +2024-07-26 00:46:02,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 499/ 1625], loss: 1.288, per_step_time: 1471ms, lr: 1.4228359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:02,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43531 samples/s/p 0:27:37 } +2024-07-26 00:46:05,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 501/ 1625], loss: 1.102, per_step_time: 1475ms, lr: 1.4213441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:05,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.42057 samples/s/p 0:27:38 } +2024-07-26 00:46:08,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 503/ 1625], loss: 1.304, per_step_time: 1471ms, lr: 1.4198541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:08,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43540 samples/s/p 0:27:31 } +2024-07-26 00:46:11,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 505/ 1625], loss: 0.921, per_step_time: 1471ms, lr: 1.4183668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:11,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% 
|██████████████████████████████████████████████ | 5.43753 samples/s/p 0:27:27 } +2024-07-26 00:46:14,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 507/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.4168819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:14,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43308 samples/s/p 0:27:26 } +2024-07-26 00:46:17,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 509/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 1.4154006e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:17,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43761 samples/s/p 0:27:21 } +2024-07-26 00:46:20,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 511/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.4139218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:20,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43624 samples/s/p 0:27:19 } +2024-07-26 00:46:23,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 513/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 1.4124456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:23,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.43343 samples/s/p 0:27:17 } +2024-07-26 00:46:26,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 515/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 1.4109712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:26,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% 
|██████████████████████████████████████████████ | 5.43718 samples/s/p 0:27:13 } +2024-07-26 00:46:29,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 517/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.4094985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:29,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.43127 samples/s/p 0:27:12 } +2024-07-26 00:46:32,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 519/ 1625], loss: 1.180, per_step_time: 1474ms, lr: 1.4080318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:32,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.42565 samples/s/p 0:27:10 } +2024-07-26 00:46:35,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 521/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 1.4065643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:35,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.43142 samples/s/p 0:27:06 } +2024-07-26 00:46:38,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 523/ 1625], loss: 1.083, per_step_time: 1474ms, lr: 1.405102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:38,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.42624 samples/s/p 0:27:04 } +2024-07-26 00:46:41,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 525/ 1625], loss: 1.080, per_step_time: 1472ms, lr: 1.4036414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:41,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% 
|██████████████████████████████████████████████ | 5.43452 samples/s/p 0:26:59 } +2024-07-26 00:46:43,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 527/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 1.4021816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:43,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.43760 samples/s/p 0:26:55 } +2024-07-26 00:46:46,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 529/ 1625], loss: 1.156, per_step_time: 1469ms, lr: 1.4007279e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:46,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.44224 samples/s/p 0:26:51 } +2024-07-26 00:46:49,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 531/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.3992742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:49,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43707 samples/s/p 0:26:49 } +2024-07-26 00:46:52,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 533/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 1.3978214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:52,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43241 samples/s/p 0:26:48 } +2024-07-26 00:46:55,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 535/ 1625], loss: 1.363, per_step_time: 1471ms, lr: 1.3963754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:55,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% 
|██████████████████████████████████████████████ | 5.43754 samples/s/p 0:26:43 } +2024-07-26 00:46:58,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 537/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 1.3949305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:58,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43803 samples/s/p 0:26:40 } +2024-07-26 00:47:01,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 539/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.3934862e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:01,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43128 samples/s/p 0:26:39 } +2024-07-26 00:47:04,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 541/ 1625], loss: 1.221, per_step_time: 1475ms, lr: 1.3920463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:04,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.42178 samples/s/p 0:26:39 } +2024-07-26 00:47:07,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 543/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 1.3906099e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:07,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43729 samples/s/p 0:26:31 } +2024-07-26 00:47:10,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 545/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 1.3891744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:10,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% 
|██████████████████████████████████████████████ | 5.43593 samples/s/p 0:26:29 } +2024-07-26 00:47:13,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 547/ 1625], loss: 0.980, per_step_time: 1469ms, lr: 1.3877423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:13,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.44249 samples/s/p 0:26:24 } +2024-07-26 00:47:16,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 549/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.3863128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:16,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43623 samples/s/p 0:26:23 } +2024-07-26 00:47:19,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 551/ 1625], loss: 1.289, per_step_time: 1471ms, lr: 1.3848859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:19,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43658 samples/s/p 0:26:20 } +2024-07-26 00:47:22,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 553/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.3834616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:22,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43752 samples/s/p 0:26:17 } +2024-07-26 00:47:25,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 555/ 1625], loss: 1.063, per_step_time: 1472ms, lr: 1.3820398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:25,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% 
|██████████████████████████████████████████████ | 5.43248 samples/s/p 0:26:15 } +2024-07-26 00:47:28,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 557/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.3806199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:28,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43687 samples/s/p 0:26:11 } +2024-07-26 00:47:31,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 559/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 1.3792041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:31,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43283 samples/s/p 0:26:09 } +2024-07-26 00:47:34,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 561/ 1625], loss: 1.045, per_step_time: 1469ms, lr: 1.3777885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:34,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.44550 samples/s/p 0:26:03 } +2024-07-26 00:47:37,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 563/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 1.3763797e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:37,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.43508 samples/s/p 0:26:03 } +2024-07-26 00:47:40,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 565/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 1.3749693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:40,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% 
|██████████████████████████████████████████████ | 5.43184 samples/s/p 0:26:01 } +2024-07-26 00:47:43,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 567/ 1625], loss: 1.047, per_step_time: 1472ms, lr: 1.3735623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:43,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.43201 samples/s/p 0:25:58 } +2024-07-26 00:47:45,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 569/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 1.3721605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:45,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.43648 samples/s/p 0:25:53 } +2024-07-26 00:47:48,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 571/ 1625], loss: 1.058, per_step_time: 1471ms, lr: 1.3707577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:48,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.43780 samples/s/p 0:25:50 } +2024-07-26 00:47:51,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 573/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 1.3693602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:51,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.44033 samples/s/p 0:25:46 } +2024-07-26 00:47:54,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 575/ 1625], loss: 1.280, per_step_time: 1473ms, lr: 1.3679644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:54,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% 
|██████████████████████████████████████████████ | 5.43009 samples/s/p 0:25:46 } +2024-07-26 00:47:57,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 577/ 1625], loss: 0.987, per_step_time: 1472ms, lr: 1.3665704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:57,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43437 samples/s/p 0:25:42 } +2024-07-26 00:48:00,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 579/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 1.3651814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:00,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.44053 samples/s/p 0:25:38 } +2024-07-26 00:48:03,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 581/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 1.3637925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:03,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43486 samples/s/p 0:25:36 } +2024-07-26 00:48:06,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 583/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.362408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:06,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43732 samples/s/p 0:25:33 } +2024-07-26 00:48:09,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 585/ 1625], loss: 0.924, per_step_time: 1469ms, lr: 1.3610252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:09,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% 
|██████████████████████████████████████████████ | 5.44382 samples/s/p 0:25:28 } +2024-07-26 00:48:12,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 587/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 1.3596441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:12,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43788 samples/s/p 0:25:27 } +2024-07-26 00:48:15,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 589/ 1625], loss: 1.097, per_step_time: 1473ms, lr: 1.3582674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:15,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.42829 samples/s/p 0:25:26 } +2024-07-26 00:48:18,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 591/ 1625], loss: 1.248, per_step_time: 1474ms, lr: 1.3568914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:18,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.42400 samples/s/p 0:25:25 } +2024-07-26 00:48:21,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 593/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.355519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:21,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43749 samples/s/p 0:25:18 } +2024-07-26 00:48:24,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 595/ 1625], loss: 1.040, per_step_time: 1473ms, lr: 1.35415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:24,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% 
|██████████████████████████████████████████████ | 5.42924 samples/s/p 0:25:17 } +2024-07-26 00:48:27,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 597/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 1.3527826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:27,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.43257 samples/s/p 0:25:13 } +2024-07-26 00:48:30,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 599/ 1625], loss: 1.216, per_step_time: 1474ms, lr: 1.3514189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:30,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.42724 samples/s/p 0:25:12 } +2024-07-26 00:48:33,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 601/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 1.3500568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:33,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.43548 samples/s/p 0:25:07 } +2024-07-26 00:48:36,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 603/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 1.3486964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:36,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.43491 samples/s/p 0:25:04 } +2024-07-26 00:48:39,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 605/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 1.3473405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:39,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% 
|██████████████████████████████████████████████ | 5.43499 samples/s/p 0:25:01 } +2024-07-26 00:48:42,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 607/ 1625], loss: 1.273, per_step_time: 1470ms, lr: 1.3459869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:42,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.44090 samples/s/p 0:24:56 } +2024-07-26 00:48:44,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 609/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 1.3446352e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:44,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.43612 samples/s/p 0:24:55 } +2024-07-26 00:48:47,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 611/ 1625], loss: 0.983, per_step_time: 1472ms, lr: 1.343287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:47,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43207 samples/s/p 0:24:53 } +2024-07-26 00:48:50,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 613/ 1625], loss: 1.014, per_step_time: 1469ms, lr: 1.3419404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:50,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.44234 samples/s/p 0:24:47 } +2024-07-26 00:48:53,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 615/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 1.3405966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:53,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% 
|██████████████████████████████████████████████ | 5.43782 samples/s/p 0:24:45 } +2024-07-26 00:48:56,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 617/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 1.3392552e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:56,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43713 samples/s/p 0:24:43 } +2024-07-26 00:48:59,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 619/ 1625], loss: 1.299, per_step_time: 1472ms, lr: 1.3379181e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:59,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43211 samples/s/p 0:24:41 } +2024-07-26 00:49:02,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 621/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 1.3365811e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:02,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43324 samples/s/p 0:24:38 } +2024-07-26 00:49:05,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 623/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 1.3352493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:05,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43503 samples/s/p 0:24:34 } +2024-07-26 00:49:08,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 625/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 1.3339184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:08,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% 
|██████████████████████████████████████████████ | 5.44137 samples/s/p 0:24:30 } +2024-07-26 00:49:11,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 627/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.3325899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:11,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43635 samples/s/p 0:24:28 } +2024-07-26 00:49:14,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 629/ 1625], loss: 1.174, per_step_time: 1469ms, lr: 1.331265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:14,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.44243 samples/s/p 0:24:24 } +2024-07-26 00:49:17,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 631/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 1.3299427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:17,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43506 samples/s/p 0:24:23 } +2024-07-26 00:49:20,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 633/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 1.3286221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:20,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43494 samples/s/p 0:24:20 } +2024-07-26 00:49:23,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 635/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 1.3273041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:23,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% 
|██████████████████████████████████████████████ | 5.43742 samples/s/p 0:24:16 } +2024-07-26 00:49:26,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 637/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 1.3259904e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:26,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43897 samples/s/p 0:24:13 } +2024-07-26 00:49:29,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 639/ 1625], loss: 1.079, per_step_time: 1470ms, lr: 1.3246776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:29,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.44021 samples/s/p 0:24:09 } +2024-07-26 00:49:32,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 641/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 1.3233682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:32,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43287 samples/s/p 0:24:08 } +2024-07-26 00:49:35,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 643/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 1.3220614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:35,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.44156 samples/s/p 0:24:03 } +2024-07-26 00:49:38,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 645/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.3207564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:38,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% 
|██████████████████████████████████████████████ | 5.43333 samples/s/p 0:24:02 } +2024-07-26 00:49:41,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 647/ 1625], loss: 1.140, per_step_time: 1482ms, lr: 1.319454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:41,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.39595 samples/s/p 0:24:09 } +2024-07-26 00:49:43,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 649/ 1625], loss: 1.101, per_step_time: 1472ms, lr: 1.3181567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:43,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.43279 samples/s/p 0:23:57 } +2024-07-26 00:49:46,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 651/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 1.3168603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:46,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.44146 samples/s/p 0:23:51 } +2024-07-26 00:49:49,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 653/ 1625], loss: 1.219, per_step_time: 1470ms, lr: 1.3155657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:49,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.43902 samples/s/p 0:23:49 } +2024-07-26 00:49:52,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 655/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 1.3142752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:52,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% 
|███████████████████████████████████████████████ | 5.43396 samples/s/p 0:23:48 } +2024-07-26 00:49:55,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 657/ 1625], loss: 1.220, per_step_time: 1473ms, lr: 1.3129866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:55,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.42863 samples/s/p 0:23:46 } +2024-07-26 00:49:58,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 659/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.3116988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:58,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43183 samples/s/p 0:23:42 } +2024-07-26 00:50:01,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 661/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 1.3104171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:01,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.44084 samples/s/p 0:23:37 } +2024-07-26 00:50:04,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 663/ 1625], loss: 1.039, per_step_time: 1471ms, lr: 1.3091354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:04,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43683 samples/s/p 0:23:35 } +2024-07-26 00:50:07,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 665/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 1.3078563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:07,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% 
|███████████████████████████████████████████████ | 5.43368 samples/s/p 0:23:33 } +2024-07-26 00:50:10,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 667/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 1.3065833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:10,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43195 samples/s/p 0:23:30 } +2024-07-26 00:50:13,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 669/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.3053102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:13,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43636 samples/s/p 0:23:26 } +2024-07-26 00:50:16,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 671/ 1625], loss: 1.032, per_step_time: 1471ms, lr: 1.3040398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:16,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43525 samples/s/p 0:23:24 } +2024-07-26 00:50:19,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 673/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 1.302771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:19,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43779 samples/s/p 0:23:20 } +2024-07-26 00:50:22,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 675/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 1.3015066e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:22,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% 
|███████████████████████████████████████████████ | 5.43226 samples/s/p 0:23:19 } +2024-07-26 00:50:25,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 677/ 1625], loss: 1.006, per_step_time: 1473ms, lr: 1.3002439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:25,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.42902 samples/s/p 0:23:16 } +2024-07-26 00:50:28,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 679/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.2989838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:28,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.43295 samples/s/p 0:23:12 } +2024-07-26 00:50:31,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 681/ 1625], loss: 1.322, per_step_time: 1471ms, lr: 1.2977271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:31,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.43705 samples/s/p 0:23:08 } +2024-07-26 00:50:34,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 683/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 1.2964713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:34,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.43519 samples/s/p 0:23:06 } +2024-07-26 00:50:37,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 685/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 1.295219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:37,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% 
|███████████████████████████████████████████████ | 5.43685 samples/s/p 0:23:03 } +2024-07-26 00:50:40,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 687/ 1625], loss: 1.003, per_step_time: 1473ms, lr: 1.2939702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:40,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.42910 samples/s/p 0:23:02 } +2024-07-26 00:50:43,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 689/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 1.2927239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:43,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.43343 samples/s/p 0:22:58 } +2024-07-26 00:50:45,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 691/ 1625], loss: 1.037, per_step_time: 1471ms, lr: 1.2914802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:45,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43620 samples/s/p 0:22:54 } +2024-07-26 00:50:48,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 693/ 1625], loss: 0.969, per_step_time: 1471ms, lr: 1.2902383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:48,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43774 samples/s/p 0:22:51 } +2024-07-26 00:50:51,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 695/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 1.2889989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:51,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% 
|███████████████████████████████████████████████ | 5.44033 samples/s/p 0:22:47 } +2024-07-26 00:50:54,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 697/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.2877638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:54,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43815 samples/s/p 0:22:45 } +2024-07-26 00:50:57,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 699/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 1.2865305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:57,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43371 samples/s/p 0:22:43 } +2024-07-26 00:51:00,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 701/ 1625], loss: 1.247, per_step_time: 1470ms, lr: 1.2852998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:00,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.44003 samples/s/p 0:22:38 } +2024-07-26 00:51:03,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 703/ 1625], loss: 1.164, per_step_time: 1470ms, lr: 1.2840708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:03,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43993 samples/s/p 0:22:35 } +2024-07-26 00:51:06,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 705/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 1.2828461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:06,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% 
|███████████████████████████████████████████████ | 5.43507 samples/s/p 0:22:34 } +2024-07-26 00:51:09,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 707/ 1625], loss: 1.046, per_step_time: 1469ms, lr: 1.2816215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:09,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.44258 samples/s/p 0:22:29 } +2024-07-26 00:51:12,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 709/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 1.2804003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:12,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43135 samples/s/p 0:22:29 } +2024-07-26 00:51:15,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 711/ 1625], loss: 1.059, per_step_time: 1472ms, lr: 1.2791834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:15,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43433 samples/s/p 0:22:25 } +2024-07-26 00:51:18,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 713/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 1.2779674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:18,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43345 samples/s/p 0:22:22 } +2024-07-26 00:51:21,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 715/ 1625], loss: 1.180, per_step_time: 1470ms, lr: 1.2767548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:21,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% 
|███████████████████████████████████████████████ | 5.44130 samples/s/p 0:22:17 } +2024-07-26 00:51:24,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 717/ 1625], loss: 1.056, per_step_time: 1472ms, lr: 1.2755448e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:24,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43327 samples/s/p 0:22:16 } +2024-07-26 00:51:27,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 719/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 1.2743375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:27,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43454 samples/s/p 0:22:13 } +2024-07-26 00:51:30,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 721/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 1.2731327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:30,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43669 samples/s/p 0:22:10 } +2024-07-26 00:51:33,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 723/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 1.2719313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:33,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43240 samples/s/p 0:22:08 } +2024-07-26 00:51:36,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 725/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 1.2707309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:36,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% 
|███████████████████████████████████████████████ | 5.43960 samples/s/p 0:22:03 } +2024-07-26 00:51:39,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 727/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 1.2695356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:39,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43859 samples/s/p 0:22:00 } +2024-07-26 00:51:42,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 729/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 1.2683403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:42,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43745 samples/s/p 0:21:58 } +2024-07-26 00:51:44,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 731/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 1.2671485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:44,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43252 samples/s/p 0:21:56 } +2024-07-26 00:51:47,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 733/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 1.2659592e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:47,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43372 samples/s/p 0:21:53 } +2024-07-26 00:51:50,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 735/ 1625], loss: 1.027, per_step_time: 1472ms, lr: 1.2647735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:50,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% 
|███████████████████████████████████████████████ | 5.43454 samples/s/p 0:21:50 } +2024-07-26 00:51:53,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 737/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.2635894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:53,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43451 samples/s/p 0:21:47 } +2024-07-26 00:51:56,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 739/ 1625], loss: 1.150, per_step_time: 1472ms, lr: 1.2624089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:56,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43314 samples/s/p 0:21:44 } +2024-07-26 00:51:59,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 741/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 1.26123e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:59,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.43341 samples/s/p 0:21:41 } +2024-07-26 00:52:02,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 743/ 1625], loss: 1.180, per_step_time: 1474ms, lr: 1.2600555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:02,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.42634 samples/s/p 0:21:40 } +2024-07-26 00:52:05,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 745/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.258881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:05,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% 
|███████████████████████████████████████████████ | 5.43753 samples/s/p 0:21:34 } +2024-07-26 00:52:08,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 747/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 1.2577107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:08,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.43463 samples/s/p 0:21:32 } +2024-07-26 00:52:11,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 749/ 1625], loss: 1.090, per_step_time: 1480ms, lr: 1.2565431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:11,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.40228 samples/s/p 0:21:37 } +2024-07-26 00:52:14,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 751/ 1625], loss: 1.059, per_step_time: 1471ms, lr: 1.255378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:14,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.43762 samples/s/p 0:21:25 } +2024-07-26 00:52:17,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 753/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 1.2542147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:17,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.43691 samples/s/p 0:21:23 } +2024-07-26 00:52:20,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 755/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 1.2530548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:20,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% 
|███████████████████████████████████████████████ | 5.43720 samples/s/p 0:21:20 } +2024-07-26 00:52:23,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 757/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 1.2518976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:23,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.44002 samples/s/p 0:21:16 } +2024-07-26 00:52:26,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 759/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 1.250743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:26,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43413 samples/s/p 0:21:14 } +2024-07-26 00:52:29,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 761/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.2495917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:29,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43124 samples/s/p 0:21:12 } +2024-07-26 00:52:32,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 763/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 1.2484405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:32,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43318 samples/s/p 0:21:09 } +2024-07-26 00:52:35,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 765/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 1.2472946e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:35,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% 
|███████████████████████████████████████████████ | 5.43892 samples/s/p 0:21:04 } +2024-07-26 00:52:38,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 767/ 1625], loss: 1.031, per_step_time: 1471ms, lr: 1.2461494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:38,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43821 samples/s/p 0:21:02 } +2024-07-26 00:52:41,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 769/ 1625], loss: 1.182, per_step_time: 1470ms, lr: 1.2450085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:41,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.44066 samples/s/p 0:20:58 } +2024-07-26 00:52:44,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 771/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 1.2438694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:44,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43447 samples/s/p 0:20:57 } +2024-07-26 00:52:46,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 773/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 1.2427329e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:46,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43454 samples/s/p 0:20:54 } +2024-07-26 00:52:49,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 775/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.2415982e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:49,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% 
|███████████████████████████████████████████████ | 5.44136 samples/s/p 0:20:49 } +2024-07-26 00:52:49,907 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-26 00:53:25,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 777/ 1625], loss: 1.305, per_step_time: 2533ms, lr: 1.2404677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:25,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 3.15761 samples/s/p 0:35:48 } +2024-07-26 00:53:28,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 779/ 1625], loss: 1.212, per_step_time: 1472ms, lr: 1.2393398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:28,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43407 samples/s/p 0:20:45 } +2024-07-26 00:53:31,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 781/ 1625], loss: 1.010, per_step_time: 1472ms, lr: 1.2382137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:31,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43263 samples/s/p 0:20:42 } +2024-07-26 00:53:34,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 783/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 1.2370901e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:34,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43651 samples/s/p 0:20:39 } +2024-07-26 00:53:37,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 785/ 1625], loss: 1.023, per_step_time: 1471ms, lr: 1.2359692e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:53:37,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43709 samples/s/p 0:20:35 } +2024-07-26 00:53:40,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 787/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 1.2348517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:40,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43458 samples/s/p 0:20:33 } +2024-07-26 00:53:43,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 789/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 1.2337359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:43,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.42970 samples/s/p 0:20:31 } +2024-07-26 00:53:46,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 791/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.2326236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:46,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43490 samples/s/p 0:20:27 } +2024-07-26 00:53:49,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 793/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 1.2315139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:49,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43738 samples/s/p 0:20:24 } +2024-07-26 00:53:52,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 795/ 1625], loss: 1.404, per_step_time: 1470ms, lr: 1.2304059e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:53:52,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43948 samples/s/p 0:20:20 } +2024-07-26 00:53:55,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 797/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 1.2293013e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:55,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43934 samples/s/p 0:20:17 } +2024-07-26 00:53:58,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 799/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 1.2281994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:58,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43903 samples/s/p 0:20:14 } +2024-07-26 00:54:01,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 801/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 1.2271009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:01,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43635 samples/s/p 0:20:12 } +2024-07-26 00:54:04,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 803/ 1625], loss: 1.184, per_step_time: 1474ms, lr: 1.2260016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:04,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.42379 samples/s/p 0:20:12 } +2024-07-26 00:54:07,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 805/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 1.2249092e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:54:07,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.44193 samples/s/p 0:20:05 } +2024-07-26 00:54:10,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 807/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 1.2238168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:10,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43364 samples/s/p 0:20:04 } +2024-07-26 00:54:13,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 809/ 1625], loss: 1.378, per_step_time: 1470ms, lr: 1.2227285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:13,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.44011 samples/s/p 0:19:59 } +2024-07-26 00:54:16,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 811/ 1625], loss: 1.224, per_step_time: 1471ms, lr: 1.2216414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:16,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43527 samples/s/p 0:19:58 } +2024-07-26 00:54:19,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 813/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.2205584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:19,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43589 samples/s/p 0:19:55 } +2024-07-26 00:54:21,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 815/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 1.2194764e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:54:21,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43728 samples/s/p 0:19:51 } +2024-07-26 00:54:24,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 817/ 1625], loss: 0.958, per_step_time: 1470ms, lr: 1.2183987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:24,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.44071 samples/s/p 0:19:48 } +2024-07-26 00:54:27,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 819/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.2173217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:27,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43604 samples/s/p 0:19:46 } +2024-07-26 00:54:30,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 821/ 1625], loss: 1.135, per_step_time: 1469ms, lr: 1.2162501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:30,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.44439 samples/s/p 0:19:41 } +2024-07-26 00:54:33,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 823/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 1.2151784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:33,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.42945 samples/s/p 0:19:41 } +2024-07-26 00:54:36,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 825/ 1625], loss: 1.055, per_step_time: 1473ms, lr: 1.214111e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:54:36,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.43087 samples/s/p 0:19:38 } +2024-07-26 00:54:39,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 827/ 1625], loss: 1.006, per_step_time: 1475ms, lr: 1.2130454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:39,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.42200 samples/s/p 0:19:37 } +2024-07-26 00:54:42,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 829/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 1.2119832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:42,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.43950 samples/s/p 0:19:30 } +2024-07-26 00:54:45,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 831/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 1.2109227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:45,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.43271 samples/s/p 0:19:29 } +2024-07-26 00:54:48,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 833/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 1.2098657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:48,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.43101 samples/s/p 0:19:26 } +2024-07-26 00:54:51,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 835/ 1625], loss: 0.949, per_step_time: 1475ms, lr: 1.2088104e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:54:51,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.42212 samples/s/p 0:19:25 } +2024-07-26 00:54:54,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 837/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 1.2077595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:54,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.42970 samples/s/p 0:19:21 } +2024-07-26 00:54:57,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 839/ 1625], loss: 1.307, per_step_time: 1472ms, lr: 1.2067094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:57,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43451 samples/s/p 0:19:17 } +2024-07-26 00:55:00,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 841/ 1625], loss: 1.252, per_step_time: 1470ms, lr: 1.2056628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:00,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43997 samples/s/p 0:19:12 } +2024-07-26 00:55:03,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 843/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.2046196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:03,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43593 samples/s/p 0:19:10 } +2024-07-26 00:55:06,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 845/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 1.2035764e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:55:06,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43206 samples/s/p 0:19:08 } +2024-07-26 00:55:09,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 847/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 1.2025375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:09,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43182 samples/s/p 0:19:05 } +2024-07-26 00:55:12,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 849/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 1.2015031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:12,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43394 samples/s/p 0:19:02 } +2024-07-26 00:55:15,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 851/ 1625], loss: 1.166, per_step_time: 1470ms, lr: 1.2004693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:15,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43934 samples/s/p 0:18:58 } +2024-07-26 00:55:18,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 853/ 1625], loss: 0.971, per_step_time: 1472ms, lr: 1.1994383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:18,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43392 samples/s/p 0:18:56 } +2024-07-26 00:55:20,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 855/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 1.198409e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:55:20,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.43844 samples/s/p 0:18:52 } +2024-07-26 00:55:23,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 857/ 1625], loss: 1.175, per_step_time: 1475ms, lr: 1.1973831e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:23,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.42263 samples/s/p 0:18:53 } +2024-07-26 00:55:26,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 859/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 1.1963607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:26,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.42994 samples/s/p 0:18:48 } +2024-07-26 00:55:29,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 861/ 1625], loss: 1.147, per_step_time: 1476ms, lr: 1.1953391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:29,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.41991 samples/s/p 0:18:47 } +2024-07-26 00:55:32,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 863/ 1625], loss: 1.289, per_step_time: 1470ms, lr: 1.1943227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:32,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.44046 samples/s/p 0:18:40 } +2024-07-26 00:55:35,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 865/ 1625], loss: 1.402, per_step_time: 1471ms, lr: 1.1933064e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:55:35,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.43560 samples/s/p 0:18:38 } +2024-07-26 00:55:38,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 867/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 1.1922943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:38,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.43496 samples/s/p 0:18:35 } +2024-07-26 00:55:41,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 869/ 1625], loss: 1.012, per_step_time: 1473ms, lr: 1.1912848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:41,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.43020 samples/s/p 0:18:33 } +2024-07-26 00:55:44,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 871/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 1.1902771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:44,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.42904 samples/s/p 0:18:31 } +2024-07-26 00:55:47,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 873/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.1892737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:47,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43465 samples/s/p 0:18:26 } +2024-07-26 00:55:50,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 875/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 1.188272e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:55:50,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43191 samples/s/p 0:18:24 } +2024-07-26 00:55:53,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 877/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 1.1872712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:53,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43121 samples/s/p 0:18:21 } +2024-07-26 00:55:56,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 879/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 1.1862755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:56,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43119 samples/s/p 0:18:18 } +2024-07-26 00:55:59,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 881/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 1.1852799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:59,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43339 samples/s/p 0:18:15 } +2024-07-26 00:56:02,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 883/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 1.1842894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:02,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43361 samples/s/p 0:18:12 } +2024-07-26 00:56:05,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 885/ 1625], loss: 1.040, per_step_time: 1472ms, lr: 1.1833007e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:56:05,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43317 samples/s/p 0:18:09 } +2024-07-26 00:56:08,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 887/ 1625], loss: 1.119, per_step_time: 1470ms, lr: 1.1823155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:08,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43951 samples/s/p 0:18:05 } +2024-07-26 00:56:11,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 889/ 1625], loss: 1.222, per_step_time: 1474ms, lr: 1.181332e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:11,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.42637 samples/s/p 0:18:05 } +2024-07-26 00:56:14,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 891/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 1.180351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:14,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43774 samples/s/p 0:17:59 } +2024-07-26 00:56:17,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 893/ 1625], loss: 1.015, per_step_time: 1472ms, lr: 1.1793726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:17,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43403 samples/s/p 0:17:57 } +2024-07-26 00:56:20,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 895/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 1.178396e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:56:20,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.42812 samples/s/p 0:17:55 } +2024-07-26 00:56:23,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 897/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 1.1774246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:23,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43578 samples/s/p 0:17:51 } +2024-07-26 00:56:25,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 899/ 1625], loss: 1.249, per_step_time: 1473ms, lr: 1.1764548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:25,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43067 samples/s/p 0:17:49 } +2024-07-26 00:56:28,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 901/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.1754878e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:28,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43777 samples/s/p 0:17:45 } +2024-07-26 00:56:31,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 903/ 1625], loss: 1.073, per_step_time: 1472ms, lr: 1.1745224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:31,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43326 samples/s/p 0:17:43 } +2024-07-26 00:56:34,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 905/ 1625], loss: 0.961, per_step_time: 1473ms, lr: 1.1735588e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:56:34,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.42791 samples/s/p 0:17:41 } +2024-07-26 00:56:37,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 907/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 1.1726003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:37,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43388 samples/s/p 0:17:37 } +2024-07-26 00:56:40,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 909/ 1625], loss: 0.983, per_step_time: 1473ms, lr: 1.1716427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:40,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.42809 samples/s/p 0:17:35 } +2024-07-26 00:56:43,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 911/ 1625], loss: 1.247, per_step_time: 1473ms, lr: 1.1706876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:43,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43019 samples/s/p 0:17:31 } +2024-07-26 00:56:46,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 913/ 1625], loss: 1.013, per_step_time: 1472ms, lr: 1.169736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:46,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43120 samples/s/p 0:17:28 } +2024-07-26 00:56:49,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 915/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 1.168788e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:56:49,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.44154 samples/s/p 0:17:23 } +2024-07-26 00:56:52,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 917/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 1.1678408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:52,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43579 samples/s/p 0:17:21 } +2024-07-26 00:56:55,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 919/ 1625], loss: 1.351, per_step_time: 1472ms, lr: 1.1668986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:55,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43192 samples/s/p 0:17:19 } +2024-07-26 00:56:58,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 921/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 1.1659566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:58,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43534 samples/s/p 0:17:16 } +2024-07-26 00:57:01,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 923/ 1625], loss: 1.024, per_step_time: 1470ms, lr: 1.1650188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:01,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.44000 samples/s/p 0:17:12 } +2024-07-26 00:57:04,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 925/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 1.1640828e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:57:04,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43254 samples/s/p 0:17:10 } +2024-07-26 00:57:07,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 927/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 1.1631478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:07,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43887 samples/s/p 0:17:06 } +2024-07-26 00:57:10,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 929/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 1.1622195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:10,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43209 samples/s/p 0:17:05 } +2024-07-26 00:57:13,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 931/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 1.1612905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:13,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43207 samples/s/p 0:17:02 } +2024-07-26 00:57:16,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 933/ 1625], loss: 0.981, per_step_time: 1473ms, lr: 1.1603656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:16,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43108 samples/s/p 0:16:59 } +2024-07-26 00:57:19,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 935/ 1625], loss: 1.391, per_step_time: 1475ms, lr: 1.1594426e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:57:19,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.42324 samples/s/p 0:16:57 } +2024-07-26 00:57:22,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 937/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 1.1585222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:22,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43574 samples/s/p 0:16:52 } +2024-07-26 00:57:24,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 939/ 1625], loss: 1.020, per_step_time: 1471ms, lr: 1.1576052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:24,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43607 samples/s/p 0:16:49 } +2024-07-26 00:57:27,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 941/ 1625], loss: 1.043, per_step_time: 1471ms, lr: 1.1566899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:27,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43485 samples/s/p 0:16:46 } +2024-07-26 00:57:30,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 943/ 1625], loss: 1.395, per_step_time: 1472ms, lr: 1.1557781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:30,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43269 samples/s/p 0:16:44 } +2024-07-26 00:57:33,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 945/ 1625], loss: 1.187, per_step_time: 1473ms, lr: 1.1548681e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:57:33,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.42986 samples/s/p 0:16:41 } +2024-07-26 00:57:36,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 947/ 1625], loss: 1.033, per_step_time: 1473ms, lr: 1.1539623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:36,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.42812 samples/s/p 0:16:39 } +2024-07-26 00:57:39,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 949/ 1625], loss: 1.067, per_step_time: 1470ms, lr: 1.1530583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:39,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43940 samples/s/p 0:16:34 } +2024-07-26 00:57:42,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 951/ 1625], loss: 1.334, per_step_time: 1473ms, lr: 1.1521586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:42,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.42800 samples/s/p 0:16:33 } +2024-07-26 00:57:45,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 953/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.1512581e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:45,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43325 samples/s/p 0:16:29 } +2024-07-26 00:57:48,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 955/ 1625], loss: 1.356, per_step_time: 1469ms, lr: 1.1503627e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:57:48,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.44245 samples/s/p 0:16:24 } +2024-07-26 00:57:51,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 957/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 1.1494699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:51,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43382 samples/s/p 0:16:23 } +2024-07-26 00:57:54,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 959/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 1.1485771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:54,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43624 samples/s/p 0:16:20 } +2024-07-26 00:57:57,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 961/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 1.1476903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:57,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43007 samples/s/p 0:16:18 } +2024-07-26 00:58:00,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 963/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.1468053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:00,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43735 samples/s/p 0:16:14 } +2024-07-26 00:58:03,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 965/ 1625], loss: 0.989, per_step_time: 1471ms, lr: 1.1459211e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:58:03,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43488 samples/s/p 0:16:11 } +2024-07-26 00:58:06,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 967/ 1625], loss: 1.185, per_step_time: 1473ms, lr: 1.1450413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:06,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.43025 samples/s/p 0:16:09 } +2024-07-26 00:58:09,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 969/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 1.1441632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:09,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.43849 samples/s/p 0:16:04 } +2024-07-26 00:58:12,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 971/ 1625], loss: 1.397, per_step_time: 1472ms, lr: 1.1432877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:12,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.43382 samples/s/p 0:16:02 } +2024-07-26 00:58:15,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 973/ 1625], loss: 1.293, per_step_time: 1472ms, lr: 1.1424165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:15,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.43464 samples/s/p 0:15:59 } +2024-07-26 00:58:18,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 975/ 1625], loss: 1.173, per_step_time: 1470ms, lr: 1.1415462e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:58:18,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.44027 samples/s/p 0:15:55 } +2024-07-26 00:58:21,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 977/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 1.1406785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:21,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.43284 samples/s/p 0:15:54 } +2024-07-26 00:58:24,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 979/ 1625], loss: 1.317, per_step_time: 1470ms, lr: 1.1398151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:24,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.44145 samples/s/p 0:15:49 } +2024-07-26 00:58:26,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 981/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 1.1389534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:26,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.43778 samples/s/p 0:15:47 } +2024-07-26 00:58:29,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 983/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.1380953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:29,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.43371 samples/s/p 0:15:45 } +2024-07-26 00:58:32,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 985/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 1.1372379e-06, overflow 
cond: False, loss_scale: 1.0 +2024-07-26 00:58:32,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43792 samples/s/p 0:15:41 } +2024-07-26 00:58:35,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 987/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 1.1363849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:35,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43381 samples/s/p 0:15:39 } +2024-07-26 00:58:38,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 989/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.1355327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:38,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43401 samples/s/p 0:15:36 } +2024-07-26 00:58:41,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 991/ 1625], loss: 1.498, per_step_time: 1470ms, lr: 1.1346857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:41,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43943 samples/s/p 0:15:32 } +2024-07-26 00:58:44,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 993/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 1.1338395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:44,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.44165 samples/s/p 0:15:29 } +2024-07-26 00:58:47,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 995/ 1625], loss: 1.396, per_step_time: 1470ms, lr: 1.1329969e-06, 
overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:47,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43863 samples/s/p 0:15:26 } +2024-07-26 00:58:50,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 997/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 1.1321551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:50,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43445 samples/s/p 0:15:24 } +2024-07-26 00:58:53,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 999/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 1.1313176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:53,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43847 samples/s/p 0:15:20 } +2024-07-26 00:58:56,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1001/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 1.1304828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:56,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.42749 samples/s/p 0:15:19 } +2024-07-26 00:58:59,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1003/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.1296487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:59,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43500 samples/s/p 0:15:15 } +2024-07-26 00:59:02,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1005/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 
1.1288207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:02,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43605 samples/s/p 0:15:12 } +2024-07-26 00:59:05,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1007/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.1279928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:05,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43490 samples/s/p 0:15:09 } +2024-07-26 00:59:08,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1009/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 1.1271692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:08,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43775 samples/s/p 0:15:06 } +2024-07-26 00:59:11,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1011/ 1625], loss: 1.373, per_step_time: 1474ms, lr: 1.1263472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:11,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.42516 samples/s/p 0:15:05 } +2024-07-26 00:59:14,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1013/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.1255271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:14,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43360 samples/s/p 0:15:01 } +2024-07-26 00:59:17,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1015/ 1625], loss: 1.164, per_step_time: 
1471ms, lr: 1.1247112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:17,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43484 samples/s/p 0:14:57 } +2024-07-26 00:59:20,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1017/ 1625], loss: 1.015, per_step_time: 1470ms, lr: 1.1238961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:20,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.44007 samples/s/p 0:14:54 } +2024-07-26 00:59:23,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1019/ 1625], loss: 0.968, per_step_time: 1470ms, lr: 1.1230854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:23,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.43898 samples/s/p 0:14:51 } +2024-07-26 00:59:25,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1021/ 1625], loss: 1.212, per_step_time: 1473ms, lr: 1.1222766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:25,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.42761 samples/s/p 0:14:50 } +2024-07-26 00:59:28,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1023/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 1.1214719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:28,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.42877 samples/s/p 0:14:47 } +2024-07-26 00:59:31,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1025/ 1625], loss: 1.134, 
per_step_time: 1470ms, lr: 1.1206673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:31,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.44031 samples/s/p 0:14:42 } +2024-07-26 00:59:34,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1027/ 1625], loss: 0.967, per_step_time: 1471ms, lr: 1.119867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:34,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.43556 samples/s/p 0:14:40 } +2024-07-26 00:59:37,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1029/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 1.1190692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:37,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.43480 samples/s/p 0:14:37 } +2024-07-26 00:59:40,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1031/ 1625], loss: 1.034, per_step_time: 1470ms, lr: 1.1182733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:40,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.44020 samples/s/p 0:14:33 } +2024-07-26 00:59:43,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1033/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 1.1174816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:43,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.43464 samples/s/p 0:14:31 } +2024-07-26 00:59:46,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1035/ 1625], 
loss: 1.089, per_step_time: 1469ms, lr: 1.1166908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:46,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.44534 samples/s/p 0:14:26 } +2024-07-26 00:59:49,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1037/ 1625], loss: 0.916, per_step_time: 1470ms, lr: 1.1159034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:49,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.44084 samples/s/p 0:14:24 } +2024-07-26 00:59:52,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1039/ 1625], loss: 0.982, per_step_time: 1469ms, lr: 1.1151195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:52,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.44285 samples/s/p 0:14:21 } +2024-07-26 00:59:55,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1041/ 1625], loss: 0.996, per_step_time: 1470ms, lr: 1.1143366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:55,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.44062 samples/s/p 0:14:18 } +2024-07-26 00:59:58,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1043/ 1625], loss: 1.281, per_step_time: 1473ms, lr: 1.1135578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:58,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.43058 samples/s/p 0:14:17 } +2024-07-26 01:00:01,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 
1045/ 1625], loss: 1.054, per_step_time: 1474ms, lr: 1.11278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:01,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.42582 samples/s/p 0:14:15 } +2024-07-26 01:00:04,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1047/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 1.1120056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:04,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.43422 samples/s/p 0:14:10 } +2024-07-26 01:00:07,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1049/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 1.1112346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:07,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.44043 samples/s/p 0:14:06 } +2024-07-26 01:00:10,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1051/ 1625], loss: 1.026, per_step_time: 1472ms, lr: 1.1104663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:10,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43262 samples/s/p 0:14:05 } +2024-07-26 01:00:13,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1053/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 1.1096997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:13,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43569 samples/s/p 0:14:01 } +2024-07-26 01:00:16,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 
10], step:[ 1055/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.1089375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:16,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43268 samples/s/p 0:13:59 } +2024-07-26 01:00:19,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1057/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.108176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:19,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43563 samples/s/p 0:13:55 } +2024-07-26 01:00:22,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1059/ 1625], loss: 1.398, per_step_time: 1474ms, lr: 1.1074172e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:22,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.42599 samples/s/p 0:13:54 } +2024-07-26 01:00:24,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1061/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.1066627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:24,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43594 samples/s/p 0:13:50 } +2024-07-26 01:00:27,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1063/ 1625], loss: 1.295, per_step_time: 1472ms, lr: 1.1059082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:27,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43350 samples/s/p 0:13:47 } +2024-07-26 01:00:30,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 10/ 10], step:[ 1065/ 1625], loss: 1.138, per_step_time: 1473ms, lr: 1.1051579e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:30,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.42954 samples/s/p 0:13:45 } +2024-07-26 01:00:33,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1067/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 1.1044121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:33,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.42942 samples/s/p 0:13:42 } +2024-07-26 01:00:36,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1069/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 1.1036655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:36,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.43548 samples/s/p 0:13:38 } +2024-07-26 01:00:39,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1071/ 1625], loss: 0.999, per_step_time: 1472ms, lr: 1.1029247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:39,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.43453 samples/s/p 0:13:35 } +2024-07-26 01:00:42,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1073/ 1625], loss: 1.262, per_step_time: 1473ms, lr: 1.1021832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:42,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.42853 samples/s/p 0:13:33 } +2024-07-26 01:00:45,661 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 10/ 10], step:[ 1075/ 1625], loss: 1.200, per_step_time: 1473ms, lr: 1.1014486e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:45,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.43052 samples/s/p 0:13:30 } +2024-07-26 01:00:48,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1077/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 1.1007139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:48,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.43426 samples/s/p 0:13:26 } +2024-07-26 01:00:51,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1079/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.0999811e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:51,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.43485 samples/s/p 0:13:23 } +2024-07-26 01:00:54,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1081/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.0992525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:54,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43743 samples/s/p 0:13:20 } +2024-07-26 01:00:57,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1083/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.0985265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:57,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43202 samples/s/p 0:13:18 } +2024-07-26 01:01:00,413 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1085/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.0978031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:00,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43847 samples/s/p 0:13:14 } +2024-07-26 01:01:03,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1087/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 1.0970814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:03,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43713 samples/s/p 0:13:11 } +2024-07-26 01:01:06,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1089/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.0963632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:06,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43306 samples/s/p 0:13:09 } +2024-07-26 01:01:09,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1091/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 1.0956476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:09,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43849 samples/s/p 0:13:05 } +2024-07-26 01:01:12,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1093/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 1.0949345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:12,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43353 samples/s/p 0:13:03 } +2024-07-26 
01:01:15,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1095/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 1.094225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:15,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43185 samples/s/p 0:13:00 } +2024-07-26 01:01:18,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1097/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 1.0935163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:18,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43353 samples/s/p 0:12:57 } +2024-07-26 01:01:21,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1099/ 1625], loss: 1.011, per_step_time: 1471ms, lr: 1.0928111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:21,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43587 samples/s/p 0:12:54 } +2024-07-26 01:01:24,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1101/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 1.0921093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:24,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43621 samples/s/p 0:12:51 } +2024-07-26 01:01:26,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1103/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 1.0914084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:26,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43805 samples/s/p 0:12:47 } 
+2024-07-26 01:01:29,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1105/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 1.0907135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:29,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43785 samples/s/p 0:12:45 } +2024-07-26 01:01:32,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1107/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 1.0900178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:32,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43996 samples/s/p 0:12:41 } +2024-07-26 01:01:35,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1109/ 1625], loss: 1.027, per_step_time: 1470ms, lr: 1.0893273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:35,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43986 samples/s/p 0:12:38 } +2024-07-26 01:01:38,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1111/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 1.0886375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:38,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43445 samples/s/p 0:12:36 } +2024-07-26 01:01:41,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1113/ 1625], loss: 1.007, per_step_time: 1470ms, lr: 1.0879496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:41,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.44153 samples/s/p 
0:12:32 } +2024-07-26 01:01:44,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1115/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 1.0872668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:44,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43806 samples/s/p 0:12:30 } +2024-07-26 01:01:47,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1117/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.0865875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:47,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43679 samples/s/p 0:12:27 } +2024-07-26 01:01:50,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1119/ 1625], loss: 1.302, per_step_time: 1472ms, lr: 1.0859081e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:50,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43183 samples/s/p 0:12:25 } +2024-07-26 01:01:53,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1121/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 1.0852315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:53,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.44157 samples/s/p 0:12:20 } +2024-07-26 01:01:56,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1123/ 1625], loss: 0.982, per_step_time: 1472ms, lr: 1.084559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:56,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43442 
samples/s/p 0:12:18 } +2024-07-26 01:01:59,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1125/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.0838884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:59,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43144 samples/s/p 0:12:16 } +2024-07-26 01:02:02,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1127/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.0832194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:02,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43620 samples/s/p 0:12:12 } +2024-07-26 01:02:05,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1129/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.0825556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:05,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43489 samples/s/p 0:12:10 } +2024-07-26 01:02:08,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1131/ 1625], loss: 1.022, per_step_time: 1471ms, lr: 1.0818919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:08,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43536 samples/s/p 0:12:07 } +2024-07-26 01:02:11,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1133/ 1625], loss: 1.336, per_step_time: 1472ms, lr: 1.0812325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:11,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ 
| 5.43375 samples/s/p 0:12:04 } +2024-07-26 01:02:14,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1135/ 1625], loss: 1.187, per_step_time: 1470ms, lr: 1.0805747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:14,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43994 samples/s/p 0:12:00 } +2024-07-26 01:02:17,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1137/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 1.0799223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:17,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43827 samples/s/p 0:11:57 } +2024-07-26 01:02:20,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1139/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 1.0792688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:20,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43418 samples/s/p 0:11:55 } +2024-07-26 01:02:23,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1141/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.0786198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:23,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43714 samples/s/p 0:11:52 } +2024-07-26 01:02:25,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1143/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 1.0779751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:25,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% 
|████████████████████████████████████████████████ | 5.43413 samples/s/p 0:11:49 } +2024-07-26 01:02:28,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1145/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 1.0773304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:28,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43814 samples/s/p 0:11:46 } +2024-07-26 01:02:31,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1147/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.076689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:31,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43722 samples/s/p 0:11:43 } +2024-07-26 01:02:34,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1149/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 1.0760511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:34,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43534 samples/s/p 0:11:40 } +2024-07-26 01:02:37,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1151/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 1.0754143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:37,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43349 samples/s/p 0:11:37 } +2024-07-26 01:02:40,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1153/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 1.0747824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:40,722 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 97.1% |████████████████████████████████████████████████ | 5.43982 samples/s/p 0:11:34 } +2024-07-26 01:02:43,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1155/ 1625], loss: 1.252, per_step_time: 1469ms, lr: 1.0741506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:43,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.44302 samples/s/p 0:11:30 } +2024-07-26 01:02:46,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1157/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 1.0735232e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:46,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43445 samples/s/p 0:11:28 } +2024-07-26 01:02:49,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1159/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.0728984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:49,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43564 samples/s/p 0:11:25 } +2024-07-26 01:02:52,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1161/ 1625], loss: 0.912, per_step_time: 1471ms, lr: 1.0722744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:52,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43578 samples/s/p 0:11:22 } +2024-07-26 01:02:55,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1163/ 1625], loss: 0.951, per_step_time: 1471ms, lr: 1.0716547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:55,471 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43617 samples/s/p 0:11:19 } +2024-07-26 01:02:58,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1165/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 1.0710376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:58,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.42897 samples/s/p 0:11:17 } +2024-07-26 01:03:01,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1167/ 1625], loss: 1.370, per_step_time: 1473ms, lr: 1.070424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:01,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.42982 samples/s/p 0:11:14 } +2024-07-26 01:03:04,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1169/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 1.0698112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:04,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43708 samples/s/p 0:11:10 } +2024-07-26 01:03:07,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1171/ 1625], loss: 1.173, per_step_time: 1470ms, lr: 1.0692028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:07,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43908 samples/s/p 0:11:07 } +2024-07-26 01:03:10,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1173/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 1.0685951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 
01:03:10,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43252 samples/s/p 0:11:05 } +2024-07-26 01:03:13,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1175/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.0679919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:13,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43600 samples/s/p 0:11:02 } +2024-07-26 01:03:16,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1177/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 1.0673913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:16,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43623 samples/s/p 0:10:59 } +2024-07-26 01:03:19,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1179/ 1625], loss: 1.011, per_step_time: 1473ms, lr: 1.0667932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:19,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43099 samples/s/p 0:10:56 } +2024-07-26 01:03:22,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1181/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 1.0661968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:22,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43532 samples/s/p 0:10:53 } +2024-07-26 01:03:24,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1183/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 1.0656022e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-26 01:03:24,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43983 samples/s/p 0:10:50 } +2024-07-26 01:03:27,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1185/ 1625], loss: 1.198, per_step_time: 1473ms, lr: 1.0650127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:27,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.42951 samples/s/p 0:10:48 } +2024-07-26 01:03:30,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1187/ 1625], loss: 1.247, per_step_time: 1473ms, lr: 1.0644251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:30,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43106 samples/s/p 0:10:45 } +2024-07-26 01:03:33,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1189/ 1625], loss: 1.031, per_step_time: 1474ms, lr: 1.0638399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:33,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.42667 samples/s/p 0:10:42 } +2024-07-26 01:03:36,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1191/ 1625], loss: 0.941, per_step_time: 1473ms, lr: 1.0632566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:36,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.42913 samples/s/p 0:10:39 } +2024-07-26 01:03:39,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1193/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 1.0626775e-06, overflow cond: False, 
loss_scale: 1.0 +2024-07-26 01:03:39,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43795 samples/s/p 0:10:35 } +2024-07-26 01:03:42,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1195/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 1.0621011e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:42,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43337 samples/s/p 0:10:33 } +2024-07-26 01:03:45,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1197/ 1625], loss: 1.254, per_step_time: 1470ms, lr: 1.0615246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:45,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.44022 samples/s/p 0:10:29 } +2024-07-26 01:03:48,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1199/ 1625], loss: 1.116, per_step_time: 1473ms, lr: 1.0609533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:48,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43034 samples/s/p 0:10:27 } +2024-07-26 01:03:51,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1201/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 1.0603829e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:51,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43147 samples/s/p 0:10:24 } +2024-07-26 01:03:54,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1203/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 1.0598177e-06, overflow 
cond: False, loss_scale: 1.0 +2024-07-26 01:03:54,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43436 samples/s/p 0:10:21 } +2024-07-26 01:03:57,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1205/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 1.0592541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:57,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43585 samples/s/p 0:10:18 } +2024-07-26 01:04:00,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1207/ 1625], loss: 0.954, per_step_time: 1471ms, lr: 1.0586924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:00,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43484 samples/s/p 0:10:15 } +2024-07-26 01:04:03,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1209/ 1625], loss: 0.949, per_step_time: 1471ms, lr: 1.0581332e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:03,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43796 samples/s/p 0:10:11 } +2024-07-26 01:04:06,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1211/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 1.0575784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:06,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.42998 samples/s/p 0:10:09 } +2024-07-26 01:04:09,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1213/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 
1.0570244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:09,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43352 samples/s/p 0:10:06 } +2024-07-26 01:04:12,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1215/ 1625], loss: 1.362, per_step_time: 1471ms, lr: 1.0564738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:12,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43768 samples/s/p 0:10:03 } +2024-07-26 01:04:15,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1217/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 1.0559268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:15,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.42998 samples/s/p 0:10:01 } +2024-07-26 01:04:18,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1219/ 1625], loss: 1.181, per_step_time: 1473ms, lr: 1.0553805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:18,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.42956 samples/s/p 0:09:58 } +2024-07-26 01:04:21,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1221/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 1.0548387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:21,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43210 samples/s/p 0:09:54 } +2024-07-26 01:04:24,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1223/ 1625], loss: 1.189, per_step_time: 
1470ms, lr: 1.0542967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:24,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.44103 samples/s/p 0:09:51 } +2024-07-26 01:04:26,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1225/ 1625], loss: 1.046, per_step_time: 1472ms, lr: 1.0537617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:26,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43407 samples/s/p 0:09:48 } +2024-07-26 01:04:29,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1227/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.0532268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:29,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43768 samples/s/p 0:09:45 } +2024-07-26 01:04:32,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1229/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 1.0526935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:32,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43676 samples/s/p 0:09:42 } +2024-07-26 01:04:35,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1231/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 1.0521646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:35,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43341 samples/s/p 0:09:40 } +2024-07-26 01:04:38,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1233/ 1625], loss: 1.109, 
per_step_time: 1472ms, lr: 1.0516374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:38,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43163 samples/s/p 0:09:37 } +2024-07-26 01:04:41,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1235/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 1.0511145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:41,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43295 samples/s/p 0:09:34 } +2024-07-26 01:04:44,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1237/ 1625], loss: 1.166, per_step_time: 1470ms, lr: 1.0505934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:44,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.44176 samples/s/p 0:09:30 } +2024-07-26 01:04:47,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1239/ 1625], loss: 1.200, per_step_time: 1475ms, lr: 1.0500747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:47,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.42170 samples/s/p 0:09:29 } +2024-07-26 01:04:50,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1241/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.0495597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:50,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43316 samples/s/p 0:09:25 } +2024-07-26 01:04:53,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1243/ 1625], 
loss: 1.115, per_step_time: 1471ms, lr: 1.0490463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:53,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43733 samples/s/p 0:09:22 } +2024-07-26 01:04:56,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1245/ 1625], loss: 1.024, per_step_time: 1470ms, lr: 1.0485355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:56,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.44127 samples/s/p 0:09:18 } +2024-07-26 01:04:59,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1247/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 1.0480273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:59,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43441 samples/s/p 0:09:16 } +2024-07-26 01:05:02,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1249/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 1.0475218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:02,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43255 samples/s/p 0:09:13 } +2024-07-26 01:05:05,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1251/ 1625], loss: 1.355, per_step_time: 1471ms, lr: 1.0470196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:05,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43484 samples/s/p 0:09:10 } +2024-07-26 01:05:08,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 
1253/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.0465192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:08,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43612 samples/s/p 0:09:07 } +2024-07-26 01:05:11,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1255/ 1625], loss: 1.096, per_step_time: 1474ms, lr: 1.0460213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:11,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.42652 samples/s/p 0:09:05 } +2024-07-26 01:05:14,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1257/ 1625], loss: 1.218, per_step_time: 1470ms, lr: 1.0455278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:14,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.44106 samples/s/p 0:09:01 } +2024-07-26 01:05:17,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1259/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.0450344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:17,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43759 samples/s/p 0:08:58 } +2024-07-26 01:05:20,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1261/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 1.044546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:20,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43730 samples/s/p 0:08:55 } +2024-07-26 01:05:23,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 
10], step:[ 1263/ 1625], loss: 1.073, per_step_time: 1472ms, lr: 1.0440604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:23,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43162 samples/s/p 0:08:53 } +2024-07-26 01:05:25,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1265/ 1625], loss: 0.953, per_step_time: 1471ms, lr: 1.0435755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:25,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43705 samples/s/p 0:08:49 } +2024-07-26 01:05:28,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1267/ 1625], loss: 1.072, per_step_time: 1470ms, lr: 1.0430958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:28,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.44022 samples/s/p 0:08:46 } +2024-07-26 01:05:31,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1269/ 1625], loss: 1.220, per_step_time: 1470ms, lr: 1.0426162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:31,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43863 samples/s/p 0:08:43 } +2024-07-26 01:05:34,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1271/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 1.042139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:34,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43724 samples/s/p 0:08:40 } +2024-07-26 01:05:37,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 10/ 10], step:[ 1273/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 1.0416654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:37,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43142 samples/s/p 0:08:38 } +2024-07-26 01:05:40,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1275/ 1625], loss: 0.948, per_step_time: 1470ms, lr: 1.0411961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:40,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43996 samples/s/p 0:08:34 } +2024-07-26 01:05:43,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1277/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 1.0407277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:43,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.44154 samples/s/p 0:08:31 } +2024-07-26 01:05:46,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1279/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 1.0402645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:46,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43073 samples/s/p 0:08:29 } +2024-07-26 01:05:49,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1281/ 1625], loss: 1.083, per_step_time: 1470ms, lr: 1.0398012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:49,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.44010 samples/s/p 0:08:25 } +2024-07-26 01:05:52,535 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 10/ 10], step:[ 1283/ 1625], loss: 1.330, per_step_time: 1472ms, lr: 1.0393405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:52,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43409 samples/s/p 0:08:23 } +2024-07-26 01:05:55,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1285/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 1.0388834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:55,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43262 samples/s/p 0:08:20 } +2024-07-26 01:05:58,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1287/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.0384288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:58,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43325 samples/s/p 0:08:17 } +2024-07-26 01:06:01,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1289/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.0379767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:01,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43329 samples/s/p 0:08:14 } +2024-07-26 01:06:04,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1291/ 1625], loss: 1.036, per_step_time: 1471ms, lr: 1.0375273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:04,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43530 samples/s/p 0:08:11 } +2024-07-26 01:06:07,296 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1293/ 1625], loss: 1.026, per_step_time: 1473ms, lr: 1.0370796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:07,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.42753 samples/s/p 0:08:09 } +2024-07-26 01:06:10,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1295/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.0366372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:10,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.43388 samples/s/p 0:08:05 } +2024-07-26 01:06:13,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1297/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 1.0361964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:13,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.43536 samples/s/p 0:08:02 } +2024-07-26 01:06:16,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1299/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.0357581e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:16,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.43783 samples/s/p 0:07:59 } +2024-07-26 01:06:19,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1301/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 1.0353217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:19,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.43758 samples/s/p 0:07:56 } +2024-07-26 
01:06:22,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1303/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 1.034887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:22,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.43650 samples/s/p 0:07:53 } +2024-07-26 01:06:24,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1305/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 1.0344575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:24,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.44021 samples/s/p 0:07:50 } +2024-07-26 01:06:27,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1307/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 1.0340297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:27,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.43345 samples/s/p 0:07:48 } +2024-07-26 01:06:30,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1309/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 1.0336053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:30,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43051 samples/s/p 0:07:45 } +2024-07-26 01:06:33,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1311/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 1.0331818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:33,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43431 samples/s/p 0:07:42 
} +2024-07-26 01:06:36,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1313/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 1.0327626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:36,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43070 samples/s/p 0:07:39 } +2024-07-26 01:06:39,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1315/ 1625], loss: 1.175, per_step_time: 1469ms, lr: 1.0323444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:39,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.44291 samples/s/p 0:07:35 } +2024-07-26 01:06:42,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1317/ 1625], loss: 1.289, per_step_time: 1470ms, lr: 1.0319303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:42,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.44204 samples/s/p 0:07:32 } +2024-07-26 01:06:45,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1319/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 1.0315181e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:45,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43463 samples/s/p 0:07:30 } +2024-07-26 01:06:48,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1321/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 1.0311085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:48,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.44204 
samples/s/p 0:07:26 } +2024-07-26 01:06:51,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1323/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 1.0307023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:51,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43580 samples/s/p 0:07:24 } +2024-07-26 01:06:54,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1325/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 1.0302995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:54,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43216 samples/s/p 0:07:21 } +2024-07-26 01:06:57,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1327/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.0298976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:57,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43624 samples/s/p 0:07:18 } +2024-07-26 01:07:00,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1329/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 1.0295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:00,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43842 samples/s/p 0:07:15 } +2024-07-26 01:07:03,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1331/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 1.0291034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:03,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% 
|█████████████████████████████████████████████████ | 5.43219 samples/s/p 0:07:12 } +2024-07-26 01:07:06,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1333/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 1.0287101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:06,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43325 samples/s/p 0:07:09 } +2024-07-26 01:07:09,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1335/ 1625], loss: 1.321, per_step_time: 1472ms, lr: 1.0283194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:09,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43227 samples/s/p 0:07:07 } +2024-07-26 01:07:12,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1337/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 1.0279323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:12,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43277 samples/s/p 0:07:04 } +2024-07-26 01:07:15,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1339/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 1.0275477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:15,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43708 samples/s/p 0:07:00 } +2024-07-26 01:07:18,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1341/ 1625], loss: 1.299, per_step_time: 1473ms, lr: 1.0271639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:18,114 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 98.3% |█████████████████████████████████████████████████ | 5.42749 samples/s/p 0:06:58 } +2024-07-26 01:07:21,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1343/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 1.0267854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:21,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.43160 samples/s/p 0:06:55 } +2024-07-26 01:07:24,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1345/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 1.0264085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:24,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.43249 samples/s/p 0:06:52 } +2024-07-26 01:07:26,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1347/ 1625], loss: 1.188, per_step_time: 1470ms, lr: 1.0260335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:26,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.44010 samples/s/p 0:06:48 } +2024-07-26 01:07:29,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1349/ 1625], loss: 1.021, per_step_time: 1473ms, lr: 1.0256618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:29,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.42890 samples/s/p 0:06:46 } +2024-07-26 01:07:32,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1351/ 1625], loss: 1.010, per_step_time: 1473ms, lr: 1.025291e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:32,874 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.43066 samples/s/p 0:06:43 } +2024-07-26 01:07:35,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1353/ 1625], loss: 1.098, per_step_time: 1479ms, lr: 1.0249263e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:35,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.40735 samples/s/p 0:06:42 } +2024-07-26 01:07:38,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1355/ 1625], loss: 1.032, per_step_time: 1474ms, lr: 1.0245616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:38,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.42733 samples/s/p 0:06:37 } +2024-07-26 01:07:41,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1357/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 1.0242012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:41,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43168 samples/s/p 0:06:34 } +2024-07-26 01:07:44,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1359/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 1.0238425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:44,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43475 samples/s/p 0:06:31 } +2024-07-26 01:07:47,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1361/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 1.0234857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 
01:07:47,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43977 samples/s/p 0:06:28 } +2024-07-26 01:07:50,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1363/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 1.023133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:50,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43256 samples/s/p 0:06:25 } +2024-07-26 01:07:53,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1365/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 1.022783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:53,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43763 samples/s/p 0:06:22 } +2024-07-26 01:07:56,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1367/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 1.0224346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:56,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43251 samples/s/p 0:06:19 } +2024-07-26 01:07:59,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1369/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.0220889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:59,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43343 samples/s/p 0:06:16 } +2024-07-26 01:08:02,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1371/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 1.0217484e-06, overflow cond: False, loss_scale: 
1.0 +2024-07-26 01:08:02,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43934 samples/s/p 0:06:13 } +2024-07-26 01:08:05,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1373/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 1.0214079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:05,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43350 samples/s/p 0:06:11 } +2024-07-26 01:08:08,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1375/ 1625], loss: 1.065, per_step_time: 1469ms, lr: 1.0210725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:08,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.44226 samples/s/p 0:06:07 } +2024-07-26 01:08:11,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1377/ 1625], loss: 0.925, per_step_time: 1469ms, lr: 1.0207364e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:11,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.44220 samples/s/p 0:06:04 } +2024-07-26 01:08:14,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1379/ 1625], loss: 1.088, per_step_time: 1472ms, lr: 1.0204053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:14,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.43467 samples/s/p 0:06:02 } +2024-07-26 01:08:17,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1381/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 1.0200761e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 01:08:17,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.42831 samples/s/p 0:05:59 } +2024-07-26 01:08:20,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1383/ 1625], loss: 1.464, per_step_time: 1473ms, lr: 1.0197493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:20,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.42769 samples/s/p 0:05:56 } +2024-07-26 01:08:23,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1385/ 1625], loss: 1.312, per_step_time: 1471ms, lr: 1.0194253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:23,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.43802 samples/s/p 0:05:53 } +2024-07-26 01:08:26,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1387/ 1625], loss: 1.335, per_step_time: 1472ms, lr: 1.0191037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:26,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.43205 samples/s/p 0:05:50 } +2024-07-26 01:08:28,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1389/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 1.0187874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:28,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.42954 samples/s/p 0:05:47 } +2024-07-26 01:08:31,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1391/ 1625], loss: 1.022, per_step_time: 1470ms, lr: 1.0184702e-06, 
overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:31,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.44161 samples/s/p 0:05:44 } +2024-07-26 01:08:34,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1393/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 1.0181583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:34,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.42981 samples/s/p 0:05:41 } +2024-07-26 01:08:37,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1395/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 1.017848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:37,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.44084 samples/s/p 0:05:38 } +2024-07-26 01:08:40,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1397/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.0175395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:40,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43568 samples/s/p 0:05:35 } +2024-07-26 01:08:43,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1399/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.0172334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:43,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43671 samples/s/p 0:05:32 } +2024-07-26 01:08:46,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1401/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 
1.0169335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:46,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43274 samples/s/p 0:05:29 } +2024-07-26 01:08:49,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1403/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 1.0166336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:49,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43503 samples/s/p 0:05:26 } +2024-07-26 01:08:52,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1405/ 1625], loss: 1.306, per_step_time: 1472ms, lr: 1.0163363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:52,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43460 samples/s/p 0:05:23 } +2024-07-26 01:08:55,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1407/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 1.0160417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:55,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43825 samples/s/p 0:05:20 } +2024-07-26 01:08:58,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1409/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 1.0157504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:58,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43814 samples/s/p 0:05:17 } +2024-07-26 01:09:01,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1411/ 1625], loss: 1.178, 
per_step_time: 1471ms, lr: 1.0154608e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:01,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43509 samples/s/p 0:05:14 } +2024-07-26 01:09:04,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1413/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 1.0151748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:04,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43137 samples/s/p 0:05:12 } +2024-07-26 01:09:07,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1415/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 1.0148922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:07,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43530 samples/s/p 0:05:09 } +2024-07-26 01:09:10,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1417/ 1625], loss: 1.266, per_step_time: 1474ms, lr: 1.0146105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:10,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.42499 samples/s/p 0:05:06 } +2024-07-26 01:09:13,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1419/ 1625], loss: 1.294, per_step_time: 1471ms, lr: 1.0143322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:13,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43620 samples/s/p 0:05:03 } +2024-07-26 01:09:16,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1421/ 
1625], loss: 1.016, per_step_time: 1470ms, lr: 1.0140565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:16,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.44044 samples/s/p 0:04:59 } +2024-07-26 01:09:19,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1423/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 1.0137842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:19,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.44106 samples/s/p 0:04:57 } +2024-07-26 01:09:22,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1425/ 1625], loss: 1.024, per_step_time: 1469ms, lr: 1.0135137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:22,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.44448 samples/s/p 0:04:53 } +2024-07-26 01:09:25,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1427/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 1.0132458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:25,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43538 samples/s/p 0:04:51 } +2024-07-26 01:09:27,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1429/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 1.0129821e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:27,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43558 samples/s/p 0:04:48 } +2024-07-26 01:09:30,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 
10], step:[ 1431/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 1.0127186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:30,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43031 samples/s/p 0:04:45 } +2024-07-26 01:09:33,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1433/ 1625], loss: 1.240, per_step_time: 1470ms, lr: 1.0124593e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:33,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.44129 samples/s/p 0:04:42 } +2024-07-26 01:09:36,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1435/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 1.0122026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43816 samples/s/p 0:04:39 } +2024-07-26 01:09:39,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1437/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 1.0119476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:39,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43641 samples/s/p 0:04:36 } +2024-07-26 01:09:42,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1439/ 1625], loss: 1.149, per_step_time: 1473ms, lr: 1.0116961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:42,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43026 samples/s/p 0:04:34 } +2024-07-26 01:09:45,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 10/ 10], step:[ 1441/ 1625], loss: 1.391, per_step_time: 1471ms, lr: 1.0114472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:45,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43702 samples/s/p 0:04:30 } +2024-07-26 01:09:48,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1443/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 1.0112018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:48,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43588 samples/s/p 0:04:27 } +2024-07-26 01:09:51,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1445/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 1.010958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:51,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43412 samples/s/p 0:04:24 } +2024-07-26 01:09:54,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1447/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 1.0107178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:54,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43639 samples/s/p 0:04:21 } +2024-07-26 01:09:57,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1449/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 1.0104792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:57,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43119 samples/s/p 0:04:19 } +2024-07-26 01:10:00,429 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1451/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 1.0102442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:00,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43178 samples/s/p 0:04:16 } +2024-07-26 01:10:03,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1453/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 1.0100108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:03,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43552 samples/s/p 0:04:13 } +2024-07-26 01:10:06,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1455/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 1.0097809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:06,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43944 samples/s/p 0:04:10 } +2024-07-26 01:10:09,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1457/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 1.0095536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:09,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43437 samples/s/p 0:04:07 } +2024-07-26 01:10:12,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1459/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 1.0093289e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:12,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43159 samples/s/p 0:04:04 } +2024-07-26 
01:10:15,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1461/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 1.0091077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:15,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43850 samples/s/p 0:04:01 } +2024-07-26 01:10:18,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1463/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 1.0088872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:18,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43405 samples/s/p 0:03:58 } +2024-07-26 01:10:21,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1465/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.008672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:21,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43533 samples/s/p 0:03:55 } +2024-07-26 01:10:24,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1467/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 1.008456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:24,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43259 samples/s/p 0:03:52 } +2024-07-26 01:10:26,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1469/ 1625], loss: 1.197, per_step_time: 1469ms, lr: 1.0082451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:26,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.44373 samples/s/p 0:03:49 
} +2024-07-26 01:10:29,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1471/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 1.0080369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:29,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43244 samples/s/p 0:03:46 } +2024-07-26 01:10:32,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1473/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 1.0078303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:32,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43485 samples/s/p 0:03:43 } +2024-07-26 01:10:35,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1475/ 1625], loss: 1.106, per_step_time: 1470ms, lr: 1.007628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:35,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.44025 samples/s/p 0:03:40 } +2024-07-26 01:10:38,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1477/ 1625], loss: 1.105, per_step_time: 1470ms, lr: 1.0074266e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:38,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43870 samples/s/p 0:03:37 } +2024-07-26 01:10:41,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1479/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.0072288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:41,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43138 
samples/s/p 0:03:35 } +2024-07-26 01:10:44,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1481/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.0070335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:44,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43137 samples/s/p 0:03:32 } +2024-07-26 01:10:47,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1483/ 1625], loss: 1.175, per_step_time: 1473ms, lr: 1.0068399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:47,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43095 samples/s/p 0:03:29 } +2024-07-26 01:10:50,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1485/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 1.0066514e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:50,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43279 samples/s/p 0:03:26 } +2024-07-26 01:10:53,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1487/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 1.0064639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:53,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43125 samples/s/p 0:03:23 } +2024-07-26 01:10:56,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1489/ 1625], loss: 1.146, per_step_time: 1470ms, lr: 1.0062789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:56,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% 
|█████████████████████████████████████████████████ | 5.44058 samples/s/p 0:03:19 } +2024-07-26 01:10:59,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1491/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 1.0060966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:59,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43774 samples/s/p 0:03:17 } +2024-07-26 01:11:02,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1493/ 1625], loss: 1.116, per_step_time: 1470ms, lr: 1.0059176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:02,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.44106 samples/s/p 0:03:14 } +2024-07-26 01:11:05,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1495/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 1.0057405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:05,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43144 samples/s/p 0:03:11 } +2024-07-26 01:11:08,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1497/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 1.0055668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:08,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43634 samples/s/p 0:03:08 } +2024-07-26 01:11:11,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1499/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 1.0053948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:11,244 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 99.2% |█████████████████████████████████████████████████ | 5.43420 samples/s/p 0:03:05 } +2024-07-26 01:11:14,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1501/ 1625], loss: 1.007, per_step_time: 1470ms, lr: 1.0052271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:14,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43889 samples/s/p 0:03:02 } +2024-07-26 01:11:17,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1503/ 1625], loss: 1.278, per_step_time: 1474ms, lr: 1.0050603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:17,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.42548 samples/s/p 0:02:59 } +2024-07-26 01:11:20,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1505/ 1625], loss: 1.297, per_step_time: 1474ms, lr: 1.0048986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:20,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.42709 samples/s/p 0:02:56 } +2024-07-26 01:11:23,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1507/ 1625], loss: 1.339, per_step_time: 1472ms, lr: 1.0047371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:23,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43442 samples/s/p 0:02:53 } +2024-07-26 01:11:26,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1509/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 1.0045788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:26,009 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.42878 samples/s/p 0:02:50 } +2024-07-26 01:11:28,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1511/ 1625], loss: 1.417, per_step_time: 1471ms, lr: 1.0044242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:28,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43564 samples/s/p 0:02:47 } +2024-07-26 01:11:31,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1513/ 1625], loss: 1.030, per_step_time: 1470ms, lr: 1.0042712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:31,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.44037 samples/s/p 0:02:44 } +2024-07-26 01:11:34,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1515/ 1625], loss: 1.305, per_step_time: 1471ms, lr: 1.00412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:34,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43734 samples/s/p 0:02:41 } +2024-07-26 01:11:37,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1517/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 1.0039756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:37,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43739 samples/s/p 0:02:38 } +2024-07-26 01:11:40,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1519/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.0038295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 
01:11:40,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43720 samples/s/p 0:02:35 } +2024-07-26 01:11:43,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1521/ 1625], loss: 1.154, per_step_time: 1470ms, lr: 1.0036896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:43,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43849 samples/s/p 0:02:32 } +2024-07-26 01:11:46,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1523/ 1625], loss: 1.315, per_step_time: 1470ms, lr: 1.0035478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:46,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.44037 samples/s/p 0:02:29 } +2024-07-26 01:11:49,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1525/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 1.0034121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:49,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43373 samples/s/p 0:02:27 } +2024-07-26 01:11:52,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1527/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.0032782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:52,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43352 samples/s/p 0:02:24 } +2024-07-26 01:11:55,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1529/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 1.0031486e-06, overflow cond: False, loss_scale: 
1.0 +2024-07-26 01:11:55,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43542 samples/s/p 0:02:21 } +2024-07-26 01:11:58,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1531/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 1.0030188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:58,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43716 samples/s/p 0:02:18 } +2024-07-26 01:12:01,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1533/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.0028936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:01,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43505 samples/s/p 0:02:15 } +2024-07-26 01:12:04,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1535/ 1625], loss: 1.300, per_step_time: 1472ms, lr: 1.0027709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:04,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43393 samples/s/p 0:02:12 } +2024-07-26 01:12:07,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1537/ 1625], loss: 1.136, per_step_time: 1475ms, lr: 1.0026498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:07,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.42329 samples/s/p 0:02:09 } +2024-07-26 01:12:10,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1539/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 1.0025315e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 01:12:10,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43796 samples/s/p 0:02:06 } +2024-07-26 01:12:13,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1541/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 1.0024182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:13,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43718 samples/s/p 0:02:03 } +2024-07-26 01:12:16,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1543/ 1625], loss: 1.210, per_step_time: 1475ms, lr: 1.0023033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:16,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.42182 samples/s/p 0:02:00 } +2024-07-26 01:12:19,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1545/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.0021944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:19,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43536 samples/s/p 0:01:57 } +2024-07-26 01:12:22,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1547/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 1.0020872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:22,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43276 samples/s/p 0:01:54 } +2024-07-26 01:12:25,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1549/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 1.0019844e-06, 
overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:25,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43377 samples/s/p 0:01:51 } +2024-07-26 01:12:27,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1551/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 1.0018815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:27,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43420 samples/s/p 0:01:48 } +2024-07-26 01:12:30,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1553/ 1625], loss: 1.234, per_step_time: 1470ms, lr: 1.0017839e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:30,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43948 samples/s/p 0:01:45 } +2024-07-26 01:12:33,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1555/ 1625], loss: 1.012, per_step_time: 1470ms, lr: 1.0016853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:33,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43979 samples/s/p 0:01:42 } +2024-07-26 01:12:36,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1557/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.0015929e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:36,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43248 samples/s/p 0:01:40 } +2024-07-26 01:12:39,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1559/ 1625], loss: 1.304, per_step_time: 1472ms, lr: 
1.0015021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:39,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43180 samples/s/p 0:01:37 } +2024-07-26 01:12:42,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1561/ 1625], loss: 1.253, per_step_time: 1469ms, lr: 1.0014131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:42,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.44219 samples/s/p 0:01:34 } +2024-07-26 01:12:45,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1563/ 1625], loss: 1.060, per_step_time: 1471ms, lr: 1.0013284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:45,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43517 samples/s/p 0:01:31 } +2024-07-26 01:12:48,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1565/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 1.0012462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:48,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43540 samples/s/p 0:01:28 } +2024-07-26 01:12:51,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1567/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 1.0011634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:51,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43761 samples/s/p 0:01:25 } +2024-07-26 01:12:54,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1569/ 1625], loss: 1.271, 
per_step_time: 1472ms, lr: 1.0010881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:54,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43434 samples/s/p 0:01:22 } +2024-07-26 01:12:57,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1571/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.001012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:57,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43569 samples/s/p 0:01:19 } +2024-07-26 01:13:00,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1573/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 1.0009412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:00,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43911 samples/s/p 0:01:16 } +2024-07-26 01:13:03,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1575/ 1625], loss: 1.268, per_step_time: 1472ms, lr: 1.0008712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:03,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43189 samples/s/p 0:01:13 } +2024-07-26 01:13:06,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1577/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 1.0008029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:06,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43646 samples/s/p 0:01:10 } +2024-07-26 01:13:09,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1579/ 
1625], loss: 1.054, per_step_time: 1472ms, lr: 1.000738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:09,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43437 samples/s/p 0:01:07 } +2024-07-26 01:13:12,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1581/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 1.0006768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:12,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43465 samples/s/p 0:01:04 } +2024-07-26 01:13:15,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1583/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.000618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:15,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43353 samples/s/p 0:01:01 } +2024-07-26 01:13:18,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1585/ 1625], loss: 1.182, per_step_time: 1470ms, lr: 1.0005626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:18,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43998 samples/s/p 0:00:58 } +2024-07-26 01:13:21,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1587/ 1625], loss: 1.129, per_step_time: 1473ms, lr: 1.0005091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:21,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43076 samples/s/p 0:00:55 } +2024-07-26 01:13:24,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], 
step:[ 1589/ 1625], loss: 1.180, per_step_time: 1470ms, lr: 1.000458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:24,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.44138 samples/s/p 0:00:52 } +2024-07-26 01:13:26,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1591/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 1.0004088e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:26,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43572 samples/s/p 0:00:50 } +2024-07-26 01:13:29,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1593/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 1.0003639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:29,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43569 samples/s/p 0:00:47 } +2024-07-26 01:13:32,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1595/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 1.0003206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:32,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43385 samples/s/p 0:00:44 } +2024-07-26 01:13:35,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1597/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 1.0002809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:35,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43456 samples/s/p 0:00:41 } +2024-07-26 01:13:38,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 10/ 10], step:[ 1599/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.0002437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:38,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43543 samples/s/p 0:00:38 } +2024-07-26 01:13:41,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1601/ 1625], loss: 1.187, per_step_time: 1473ms, lr: 1.0002083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:41,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43068 samples/s/p 0:00:35 } +2024-07-26 01:13:44,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1603/ 1625], loss: 1.037, per_step_time: 1471ms, lr: 1.0001771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:44,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43717 samples/s/p 0:00:32 } +2024-07-26 01:13:47,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1605/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 1.0001469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:47,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43543 samples/s/p 0:00:29 } +2024-07-26 01:13:50,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1607/ 1625], loss: 1.071, per_step_time: 1473ms, lr: 1.0001202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:50,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43063 samples/s/p 0:00:26 } +2024-07-26 01:13:53,545 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1609/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.0000967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:53,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43582 samples/s/p 0:00:23 } +2024-07-26 01:13:56,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1611/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.0000743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:56,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43546 samples/s/p 0:00:20 } +2024-07-26 01:13:59,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1613/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.0000579e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:59,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43390 samples/s/p 0:00:17 } +2024-07-26 01:14:02,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1615/ 1625], loss: 1.140, per_step_time: 1474ms, lr: 1.0000398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:02,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.42619 samples/s/p 0:00:14 } +2024-07-26 01:14:05,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1617/ 1625], loss: 0.922, per_step_time: 1471ms, lr: 1.0000276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:05,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.43799 samples/s/p 0:00:11 } 
+2024-07-26 01:14:08,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1619/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 1.0000164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:08,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.43389 samples/s/p 0:00:08 } +2024-07-26 01:14:11,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1621/ 1625], loss: 1.082, per_step_time: 1473ms, lr: 1.0000086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:11,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.42897 samples/s/p 0:00:05 } +2024-07-26 01:14:14,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1623/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.0000026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:14,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.43337 samples/s/p 0:00:02 } +2024-07-26 01:14:17,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1625/ 1625], loss: 1.078, per_step_time: 1473ms, lr: 1.0000009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:17,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |██████████████████████████████████████████████████| 5.43070 samples/s/p 0:00:00 } +2024-07-26 01:14:17,194 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-26 01:14:47,801 - mindformers[mindformers/trainer/base_trainer.py:779] - INFO - .........Training Over!............. 
diff --git "a/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\346\227\245\345\277\227\346\226\207\344\273\266/worker_3.log" "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\346\227\245\345\277\227\346\226\207\344\273\266/worker_3.log" new file mode 100644 index 00000000..f122b704 --- /dev/null +++ "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\346\227\245\345\277\227\346\226\207\344\273\266/worker_3.log" @@ -0,0 +1,16898 @@ +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. + return self._float_to_str(self.smallest_subnormal) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:499: UserWarning: The value of the smallest subnormal for type is zero. + setattr(self, word, getattr(machar, word).flat[0]) +/home/ma-user/anaconda3/envs/MindSpore/lib/python3.9/site-packages/numpy/core/getlimits.py:89: UserWarning: The value of the smallest subnormal for type is zero. 
+ return self._float_to_str(self.smallest_subnormal) +[WARNING] DISTRIBUTED(62203,ffffae230010,python):2024-07-25-18:09:19.560.619 [mindspore/ccsrc/distributed/rpc/tcp/tcp_comm.cc:464] Connect] Waiting for the state of the connection to 127.0.0.1:8118 to be connected...Retry number: 1 +[WARNING] DISTRIBUTED(62203,ffffae230010,python):2024-07-25-18:09:20.561.269 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:194] BuildCluster] Topology build timed out., retry(1/200). +[WARNING] DISTRIBUTED(62203,ffffae230010,python):2024-07-25-18:09:23.561.447 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:194] BuildCluster] Topology build timed out., retry(2/200). +[WARNING] DISTRIBUTED(62203,ffffae230010,python):2024-07-25-18:09:26.561.633 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:196] BuildCluster] Cluster is successfully initialized. +[WARNING] DISTRIBUTED(62203,ffffae230010,python):2024-07-25-18:09:26.562.015 [mindspore/ccsrc/distributed/cluster/cluster_context.cc:260] PostProcess] This node 3 rank id: 3 +[WARNING] DISTRIBUTED(62203,ffffae230010,python):2024-07-25-18:09:51.922.576 [mindspore/ccsrc/distributed/collective/collective_manager.cc:259] CreateCommunicationGroup] Start to create communication group: hccl_world_group [const vector]{0, 1, 2, 3} +[WARNING] DISTRIBUTED(62203,ffffae230010,python):2024-07-25-18:09:51.923.167 [mindspore/ccsrc/distributed/collective/collective_manager.cc:335] CreateCommunicationGroup] Begin initialize communication group on the device side: hccl_world_group +[WARNING] DISTRIBUTED(62203,ffffae230010,python):2024-07-25-18:09:53.204.933 [mindspore/ccsrc/distributed/collective/collective_manager.cc:345] CreateCommunicationGroup] End initialize communication group on the device side: hccl_world_group +2024-07-25 18:09:53,208 - mindformers[mindformers/tools/utils.py:168] - INFO - set strategy path to './output/strategy/ckpt_strategy_rank_3.ckpt' +2024-07-25 18:09:53,244 - 
mindformers[mindformers/trainer/trainer.py:919] - INFO - Load configs in /home/ma-user/work/MindFormers/mindformers/configs/gpt2/run_gpt2.yaml to build trainer. +2024-07-25 18:09:53,244 - mindformers[mindformers/trainer/trainer.py:949] - INFO - ..........Init Config.......... +2024-07-25 18:09:53,244 - mindformers[mindformers/core/parallel_config.py:45] - INFO - initial recompute_config from dict: {'recompute': True, 'select_recompute': False, 'parallel_optimizer_comm_recompute': False, 'mp_comm_recompute': True, 'recompute_slice_activation': True} +2024-07-25 18:09:53,245 - mindformers[mindformers/core/parallel_config.py:51] - INFO - initial parallel_config from dict: {'data_parallel': 1, 'model_parallel': 4, 'pipeline_stage': 1, 'use_seq_parallel': False, 'micro_batch_num': 1, 'vocab_emb_dp': True, 'gradient_aggregation_group': 4} +2024-07-25 18:09:53,246 - mindformers[mindformers/tools/utils.py:153] - INFO - set output path to '/home/ma-user/work/MindFormers/mindformers/research/output' +2024-07-25 18:09:53,246 - mindformers[mindformers/trainer/base_trainer.py:85] - INFO - Now Running Task is: text_generation, Model is: llama3_8b +2024-07-25 18:09:53,246 - mindformers[mindformers/trainer/base_trainer.py:111] - WARNING - Input model name is not in the supported list or unspecified. 
+2024-07-25 18:09:53,247 - mindformers[mindformers/trainer/base_trainer.py:112] - WARNING - See the list of supported task and model name: ['baichuan2_13b', 'baichuan2_7b', 'baichuan_7b', 'bloom_176b', 'bloom_560m', 'bloom_65b', 'bloom_7.1b', 'codegeex2_6b', 'codellama_34b', 'common', 'deepseek_33b', 'glm2_6b', 'glm2_6b_lora', 'glm2_6b_ptuning2', 'glm3_6b', 'glm_6b', 'glm_6b_chat', 'glm_6b_lora', 'glm_6b_lora_chat', 'gpt2', 'gpt2_13b', 'gpt2_52b', 'gpt2_lora', 'gpt2_xl', 'gpt2_xl_lora', 'internlm_7b', 'internlm_7b_lora', 'llama2_13b', 'llama2_70b', 'llama2_7b', 'llama_13b', 'llama_65b', 'llama_7b', 'llama_7b_lora', 'pangualpha_13b', 'pangualpha_2_6b', 'qwen_7b', 'qwen_7b_lora', 'skywork_13b', 'yi_34b', 'yi_6b', 'ziya_13b'] +2024-07-25 18:09:53,247 - mindformers[mindformers/trainer/base_trainer.py:113] - WARNING - The default model config: /home/ma-user/work/MindFormers/mindformers/configs/gpt2/run_gpt2.yaml will now be used for the text_generation task +2024-07-25 18:09:53,247 - mindformers[mindformers/trainer/trainer.py:1004] - INFO - ..........Init Model.......... +2024-07-25 18:09:53,247 - mindformers[mindformers/trainer/trainer.py:1027] - INFO - ..........Init Train Dataset.......... +2024-07-25 18:09:53,248 - mindformers[mindformers/trainer/trainer.py:335] - INFO - ==========Trainer Init Success!========== +2024-07-25 18:09:53,248 - mindformers[mindformers/trainer/trainer.py:476] - WARNING - The `finetune_checkpoint` will be deprecated. Please use `resume_from_checkpoint` instead. +2024-07-25 18:09:53,248 - mindformers[mindformers/trainer/trainer.py:1004] - INFO - ..........Init Model.......... 
+2024-07-25 18:09:53,248 - mindformers[mindformers/trainer/base_trainer.py:176] - INFO - The current parallel mode is semi_auto_parallel, full batch is True,so global batch size will be changed: global_batch_size = batch_size * data_parallel * micro_batch_interleave_num * gradient_accumulation_steps = 32 = 32 * 1 * 1 * 1 +2024-07-25 18:09:53,249 - mindformers[mindformers/trainer/base_trainer.py:624] - INFO - .........Build Dataset For Train.......... +2024-07-25 18:09:53,249 - mindformers[mindformers/trainer/base_trainer.py:353] - INFO - .........Build Dataset From Config.......... +2024-07-25 18:09:53,249 - mindformers[mindformers/dataset/causal_language_model_dataset.py:166] - INFO - Now Create Causal Language Model Dataset. +2024-07-25 18:09:53,261 - mindformers[mindformers/trainer/base_trainer.py:626] - INFO - Create train dataset finish, dataset size:1625 +2024-07-25 18:09:53,261 - mindformers[mindformers/trainer/utils.py:171] - INFO - Will be Training epochs:10, sink_size:2 +2024-07-25 18:09:53,262 - mindformers[mindformers/trainer/utils.py:173] - INFO - Create training dataset finish, dataset size:1625 +2024-07-25 18:09:53,262 - mindformers[mindformers/trainer/base_trainer.py:656] - INFO - .........Build Net For Train.......... +2024-07-25 18:09:53,262 - mindformers[mindformers/trainer/base_trainer.py:387] - INFO - .........Build Network From Config.......... +2024-07-25 18:09:53,263 - mindformers[mindformers/version_control.py:61] - INFO - The Cell Reuse compilation acceleration feature is not supported when the environment variable ENABLE_CELL_REUSE is 0 or MindSpore version is earlier than 2.1.0 or stand_alone mode or pipeline_stages <= 1 +2024-07-25 18:09:53,263 - mindformers[mindformers/version_control.py:65] - INFO - +The current ENABLE_CELL_REUSE=0, please set the environment variable as follows: +export ENABLE_CELL_REUSE=1 to enable the Cell Reuse compilation acceleration feature. 
+2024-07-25 18:09:53,264 - mindformers[mindformers/version_control.py:74] - INFO - The Cell Reuse compilation acceleration feature only works in pipeline parallel mode(pipeline_stage>1).Current pipeline stage=1, the feature is disabled by default. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:09:53.265.930 [/home/ma-user/work/MindFormers/mindformers/mindformers/modules/transformer/op_parallel_config.py:244] The optimizer shard True in auto_parallel_context is not equal to the optimizer_shard None in the OpParallelConfig. Please check the optimizer_shard to make them consistent. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:09:53.268.644 [/home/ma-user/work/MindFormers/mindformers/mindformers/modules/transformer/op_parallel_config.py:244] The optimizer shard True in auto_parallel_context is not equal to the optimizer_shard None in the OpParallelConfig. Please check the optimizer_shard to make them consistent. +2024-07-25 18:09:53,375 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:09:53.376.819 [mindspore/common/_decorator.py:40] 'Parameter' is deprecated from version 2.3 and will be removed in a future version, use 'add_pipeline_stage' instead. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:09:53.376.951 [mindspore/common/parameter.py:806] This interface may be deleted in the future. 
+2024-07-25 18:09:53,399 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,421 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,443 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,465 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,486 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,508 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,530 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,552 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:53,574 - mindformers[mindformers/models/llama/llama_transformer.py:468] - INFO - MoE config is None, use normal FFN +2024-07-25 18:09:54,074 - mindformers[mindformers/models/modeling_utils.py:1438] - INFO - model built, but weights is unloaded, since the config has no checkpoint_name_or_path attribute or checkpoint_name_or_path is None. +2024-07-25 18:09:54,282 - mindformers[mindformers/models/modeling_utils.py:1438] - INFO - model built, but weights is unloaded, since the config has no checkpoint_name_or_path attribute or checkpoint_name_or_path is None. +2024-07-25 18:09:54,306 - mindformers[mindformers/trainer/base_trainer.py:543] - INFO - Network Parameters: 3407872. +2024-07-25 18:09:54,306 - mindformers[mindformers/trainer/base_trainer.py:678] - INFO - .........Build Optimizer For Train.......... 
+2024-07-25 18:09:54,306 - mindformers[mindformers/trainer/base_trainer.py:426] - INFO - .........Build Optimizer From Config.......... +2024-07-25 18:09:54,307 - mindformers[mindformers/trainer/base_trainer.py:459] - INFO - .........Build LR Schedule From Config.......... +2024-07-25 18:09:54,312 - mindformers[mindformers/trainer/optimizer_grouped_parameters.py:74] - WARNING - dynamic_lr_schedule will be reset and invalid when layer_scale is False. +2024-07-25 18:09:54,316 - mindformers[mindformers/trainer/optimizer_grouped_parameters.py:113] - INFO - Param groups = { + "decay": { + "weight_decay": 0.0, + "params": [ + "model.layers.0.attention.wq.mindpet_delta_lora_a", + "model.layers.0.attention.wq.mindpet_delta_lora_b", + "model.layers.0.attention.wv.mindpet_delta_lora_a", + "model.layers.0.attention.wv.mindpet_delta_lora_b", + "model.layers.1.attention.wq.mindpet_delta_lora_a", + "model.layers.1.attention.wq.mindpet_delta_lora_b", + "model.layers.1.attention.wv.mindpet_delta_lora_a", + "model.layers.1.attention.wv.mindpet_delta_lora_b", + "model.layers.2.attention.wq.mindpet_delta_lora_a", + "model.layers.2.attention.wq.mindpet_delta_lora_b", + "model.layers.2.attention.wv.mindpet_delta_lora_a", + "model.layers.2.attention.wv.mindpet_delta_lora_b", + "model.layers.3.attention.wq.mindpet_delta_lora_a", + "model.layers.3.attention.wq.mindpet_delta_lora_b", + "model.layers.3.attention.wv.mindpet_delta_lora_a", + "model.layers.3.attention.wv.mindpet_delta_lora_b", + "model.layers.4.attention.wq.mindpet_delta_lora_a", + "model.layers.4.attention.wq.mindpet_delta_lora_b", + "model.layers.4.attention.wv.mindpet_delta_lora_a", + "model.layers.4.attention.wv.mindpet_delta_lora_b", + "model.layers.5.attention.wq.mindpet_delta_lora_a", + "model.layers.5.attention.wq.mindpet_delta_lora_b", + "model.layers.5.attention.wv.mindpet_delta_lora_a", + "model.layers.5.attention.wv.mindpet_delta_lora_b", + "model.layers.6.attention.wq.mindpet_delta_lora_a", + 
"model.layers.6.attention.wq.mindpet_delta_lora_b", + "model.layers.6.attention.wv.mindpet_delta_lora_a", + "model.layers.6.attention.wv.mindpet_delta_lora_b", + "model.layers.7.attention.wq.mindpet_delta_lora_a", + "model.layers.7.attention.wq.mindpet_delta_lora_b", + "model.layers.7.attention.wv.mindpet_delta_lora_a", + "model.layers.7.attention.wv.mindpet_delta_lora_b", + "model.layers.8.attention.wq.mindpet_delta_lora_a", + "model.layers.8.attention.wq.mindpet_delta_lora_b", + "model.layers.8.attention.wv.mindpet_delta_lora_a", + "model.layers.8.attention.wv.mindpet_delta_lora_b", + "model.layers.9.attention.wq.mindpet_delta_lora_a", + "model.layers.9.attention.wq.mindpet_delta_lora_b", + "model.layers.9.attention.wv.mindpet_delta_lora_a", + "model.layers.9.attention.wv.mindpet_delta_lora_b", + "model.layers.10.attention.wq.mindpet_delta_lora_a", + "model.layers.10.attention.wq.mindpet_delta_lora_b", + "model.layers.10.attention.wv.mindpet_delta_lora_a", + "model.layers.10.attention.wv.mindpet_delta_lora_b", + "model.layers.11.attention.wq.mindpet_delta_lora_a", + "model.layers.11.attention.wq.mindpet_delta_lora_b", + "model.layers.11.attention.wv.mindpet_delta_lora_a", + "model.layers.11.attention.wv.mindpet_delta_lora_b", + "model.layers.12.attention.wq.mindpet_delta_lora_a", + "model.layers.12.attention.wq.mindpet_delta_lora_b", + "model.layers.12.attention.wv.mindpet_delta_lora_a", + "model.layers.12.attention.wv.mindpet_delta_lora_b", + "model.layers.13.attention.wq.mindpet_delta_lora_a", + "model.layers.13.attention.wq.mindpet_delta_lora_b", + "model.layers.13.attention.wv.mindpet_delta_lora_a", + "model.layers.13.attention.wv.mindpet_delta_lora_b", + "model.layers.14.attention.wq.mindpet_delta_lora_a", + "model.layers.14.attention.wq.mindpet_delta_lora_b", + "model.layers.14.attention.wv.mindpet_delta_lora_a", + "model.layers.14.attention.wv.mindpet_delta_lora_b", + "model.layers.15.attention.wq.mindpet_delta_lora_a", + 
"model.layers.15.attention.wq.mindpet_delta_lora_b", + "model.layers.15.attention.wv.mindpet_delta_lora_a", + "model.layers.15.attention.wv.mindpet_delta_lora_b", + "model.layers.16.attention.wq.mindpet_delta_lora_a", + "model.layers.16.attention.wq.mindpet_delta_lora_b", + "model.layers.16.attention.wv.mindpet_delta_lora_a", + "model.layers.16.attention.wv.mindpet_delta_lora_b", + "model.layers.17.attention.wq.mindpet_delta_lora_a", + "model.layers.17.attention.wq.mindpet_delta_lora_b", + "model.layers.17.attention.wv.mindpet_delta_lora_a", + "model.layers.17.attention.wv.mindpet_delta_lora_b", + "model.layers.18.attention.wq.mindpet_delta_lora_a", + "model.layers.18.attention.wq.mindpet_delta_lora_b", + "model.layers.18.attention.wv.mindpet_delta_lora_a", + "model.layers.18.attention.wv.mindpet_delta_lora_b", + "model.layers.19.attention.wq.mindpet_delta_lora_a", + "model.layers.19.attention.wq.mindpet_delta_lora_b", + "model.layers.19.attention.wv.mindpet_delta_lora_a", + "model.layers.19.attention.wv.mindpet_delta_lora_b", + "model.layers.20.attention.wq.mindpet_delta_lora_a", + "model.layers.20.attention.wq.mindpet_delta_lora_b", + "model.layers.20.attention.wv.mindpet_delta_lora_a", + "model.layers.20.attention.wv.mindpet_delta_lora_b", + "model.layers.21.attention.wq.mindpet_delta_lora_a", + "model.layers.21.attention.wq.mindpet_delta_lora_b", + "model.layers.21.attention.wv.mindpet_delta_lora_a", + "model.layers.21.attention.wv.mindpet_delta_lora_b", + "model.layers.22.attention.wq.mindpet_delta_lora_a", + "model.layers.22.attention.wq.mindpet_delta_lora_b", + "model.layers.22.attention.wv.mindpet_delta_lora_a", + "model.layers.22.attention.wv.mindpet_delta_lora_b", + "model.layers.23.attention.wq.mindpet_delta_lora_a", + "model.layers.23.attention.wq.mindpet_delta_lora_b", + "model.layers.23.attention.wv.mindpet_delta_lora_a", + "model.layers.23.attention.wv.mindpet_delta_lora_b", + "model.layers.24.attention.wq.mindpet_delta_lora_a", + 
"model.layers.24.attention.wq.mindpet_delta_lora_b", + "model.layers.24.attention.wv.mindpet_delta_lora_a", + "model.layers.24.attention.wv.mindpet_delta_lora_b", + "model.layers.25.attention.wq.mindpet_delta_lora_a", + "model.layers.25.attention.wq.mindpet_delta_lora_b", + "model.layers.25.attention.wv.mindpet_delta_lora_a", + "model.layers.25.attention.wv.mindpet_delta_lora_b", + "model.layers.26.attention.wq.mindpet_delta_lora_a", + "model.layers.26.attention.wq.mindpet_delta_lora_b", + "model.layers.26.attention.wv.mindpet_delta_lora_a", + "model.layers.26.attention.wv.mindpet_delta_lora_b", + "model.layers.27.attention.wq.mindpet_delta_lora_a", + "model.layers.27.attention.wq.mindpet_delta_lora_b", + "model.layers.27.attention.wv.mindpet_delta_lora_a", + "model.layers.27.attention.wv.mindpet_delta_lora_b", + "model.layers.28.attention.wq.mindpet_delta_lora_a", + "model.layers.28.attention.wq.mindpet_delta_lora_b", + "model.layers.28.attention.wv.mindpet_delta_lora_a", + "model.layers.28.attention.wv.mindpet_delta_lora_b", + "model.layers.29.attention.wq.mindpet_delta_lora_a", + "model.layers.29.attention.wq.mindpet_delta_lora_b", + "model.layers.29.attention.wv.mindpet_delta_lora_a", + "model.layers.29.attention.wv.mindpet_delta_lora_b", + "model.layers.30.attention.wq.mindpet_delta_lora_a", + "model.layers.30.attention.wq.mindpet_delta_lora_b", + "model.layers.30.attention.wv.mindpet_delta_lora_a", + "model.layers.30.attention.wv.mindpet_delta_lora_b", + "model.layers.31.attention.wq.mindpet_delta_lora_a", + "model.layers.31.attention.wq.mindpet_delta_lora_b", + "model.layers.31.attention.wv.mindpet_delta_lora_a", + "model.layers.31.attention.wv.mindpet_delta_lora_b" + ] + } +} +2024-07-25 18:09:54,419 - mindformers[mindformers/trainer/base_trainer.py:683] - INFO - .........Build Running Wrapper From Config For Train.......... 
+2024-07-25 18:09:54,420 - mindformers[mindformers/trainer/base_trainer.py:496] - INFO - .........Build Model Wrapper for Train From Config.......... +2024-07-25 18:09:54,426 - mindformers[mindformers/trainer/base_trainer.py:687] - INFO - .........Build Callbacks For Train.......... +2024-07-25 18:09:54,428 - mindformers[mindformers/core/callback/callback.py:533] - INFO - Integrated_save is changed to False when using auto_parallel. +2024-07-25 18:09:54,429 - mindformers[mindformers/trainer/base_trainer.py:721] - INFO - .........Starting Init Train Model.......... +2024-07-25 18:09:54,430 - mindformers[mindformers/trainer/utils.py:736] - INFO - ............Start load checkpoint from checkpoint............ +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:35.516.012 [mindspore/train/serialization.py:1369] model.tok_embeddings.embedding_weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:40.662.814 [mindspore/train/serialization.py:1369] model.layers.0.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:40.663.778 [mindspore/train/serialization.py:1369] model.layers.0.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:40.664.251 [mindspore/train/serialization.py:1369] model.layers.0.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:40.822.304 [mindspore/train/serialization.py:1369] model.layers.0.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:40.864.282 [mindspore/train/serialization.py:1369] model.layers.0.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:40.906.250 [mindspore/train/serialization.py:1369] model.layers.0.attention.wo.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:41.525.54 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:41.640.013 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:42.234.194 [mindspore/train/serialization.py:1369] model.layers.0.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:42.820.663 [mindspore/train/serialization.py:1369] model.layers.1.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:42.821.633 [mindspore/train/serialization.py:1369] model.layers.1.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:42.822.073 [mindspore/train/serialization.py:1369] model.layers.1.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:42.967.366 [mindspore/train/serialization.py:1369] model.layers.1.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:43.768.0 [mindspore/train/serialization.py:1369] model.layers.1.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:43.476.66 [mindspore/train/serialization.py:1369] model.layers.1.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:43.195.117 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:43.792.864 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w2.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:44.384.007 [mindspore/train/serialization.py:1369] model.layers.1.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:44.974.988 [mindspore/train/serialization.py:1369] model.layers.2.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:44.975.915 [mindspore/train/serialization.py:1369] model.layers.2.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:44.976.365 [mindspore/train/serialization.py:1369] model.layers.2.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:45.116.656 [mindspore/train/serialization.py:1369] model.layers.2.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:45.174.122 [mindspore/train/serialization.py:1369] model.layers.2.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:45.214.167 [mindspore/train/serialization.py:1369] model.layers.2.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:45.356.038 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:45.942.240 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:46.520.844 [mindspore/train/serialization.py:1369] model.layers.2.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:47.160.719 [mindspore/train/serialization.py:1369] model.layers.3.ffn_norm.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:47.161.577 [mindspore/train/serialization.py:1369] model.layers.3.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:47.162.026 [mindspore/train/serialization.py:1369] model.layers.3.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:47.340.235 [mindspore/train/serialization.py:1369] model.layers.3.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:47.383.554 [mindspore/train/serialization.py:1369] model.layers.3.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:47.425.372 [mindspore/train/serialization.py:1369] model.layers.3.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:47.609.915 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:48.196.983 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:48.790.877 [mindspore/train/serialization.py:1369] model.layers.3.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:49.426.855 [mindspore/train/serialization.py:1369] model.layers.4.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:49.427.792 [mindspore/train/serialization.py:1369] model.layers.4.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:49.428.230 [mindspore/train/serialization.py:1369] model.layers.4.attention.wq.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:49.588.969 [mindspore/train/serialization.py:1369] model.layers.4.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:49.633.580 [mindspore/train/serialization.py:1369] model.layers.4.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:49.672.232 [mindspore/train/serialization.py:1369] model.layers.4.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:49.851.033 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:50.438.218 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:51.147.02 [mindspore/train/serialization.py:1369] model.layers.4.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:51.636.229 [mindspore/train/serialization.py:1369] model.layers.5.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:51.637.079 [mindspore/train/serialization.py:1369] model.layers.5.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:51.637.561 [mindspore/train/serialization.py:1369] model.layers.5.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:51.808.815 [mindspore/train/serialization.py:1369] model.layers.5.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:51.847.677 [mindspore/train/serialization.py:1369] model.layers.5.attention.wv.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:51.884.984 [mindspore/train/serialization.py:1369] model.layers.5.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:52.670.46 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:52.693.181 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:53.306.846 [mindspore/train/serialization.py:1369] model.layers.5.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:53.927.948 [mindspore/train/serialization.py:1369] model.layers.6.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:53.928.674 [mindspore/train/serialization.py:1369] model.layers.6.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:53.929.101 [mindspore/train/serialization.py:1369] model.layers.6.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:54.118.489 [mindspore/train/serialization.py:1369] model.layers.6.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:54.156.645 [mindspore/train/serialization.py:1369] model.layers.6.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:54.194.065 [mindspore/train/serialization.py:1369] model.layers.6.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:54.371.156 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w1.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:54.940.913 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:55.519.090 [mindspore/train/serialization.py:1369] model.layers.6.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:56.979.85 [mindspore/train/serialization.py:1369] model.layers.7.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:56.988.91 [mindspore/train/serialization.py:1369] model.layers.7.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:56.993.40 [mindspore/train/serialization.py:1369] model.layers.7.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:56.277.255 [mindspore/train/serialization.py:1369] model.layers.7.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:56.321.934 [mindspore/train/serialization.py:1369] model.layers.7.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:56.369.263 [mindspore/train/serialization.py:1369] model.layers.7.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:56.539.759 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:57.116.068 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w2.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:57.703.545 [mindspore/train/serialization.py:1369] model.layers.7.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:58.258.340 [mindspore/train/serialization.py:1369] model.layers.8.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:58.259.183 [mindspore/train/serialization.py:1369] model.layers.8.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:58.259.615 [mindspore/train/serialization.py:1369] model.layers.8.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:58.446.268 [mindspore/train/serialization.py:1369] model.layers.8.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:58.499.885 [mindspore/train/serialization.py:1369] model.layers.8.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:58.543.261 [mindspore/train/serialization.py:1369] model.layers.8.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:58.728.814 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:59.319.149 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:11:59.915.905 [mindspore/train/serialization.py:1369] model.layers.8.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:00.522.373 [mindspore/train/serialization.py:1369] model.layers.9.ffn_norm.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:00.523.234 [mindspore/train/serialization.py:1369] model.layers.9.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:00.523.670 [mindspore/train/serialization.py:1369] model.layers.9.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:00.706.366 [mindspore/train/serialization.py:1369] model.layers.9.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:00.756.063 [mindspore/train/serialization.py:1369] model.layers.9.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:00.816.698 [mindspore/train/serialization.py:1369] model.layers.9.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:01.518.74 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:01.678.494 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:02.272.031 [mindspore/train/serialization.py:1369] model.layers.9.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:02.859.950 [mindspore/train/serialization.py:1369] model.layers.10.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:02.860.886 [mindspore/train/serialization.py:1369] model.layers.10.attention_norm.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:02.861.355 [mindspore/train/serialization.py:1369] model.layers.10.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:03.289.63 [mindspore/train/serialization.py:1369] model.layers.10.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:03.807.80 [mindspore/train/serialization.py:1369] model.layers.10.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:03.131.168 [mindspore/train/serialization.py:1369] model.layers.10.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:03.304.238 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:03.882.949 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:04.483.250 [mindspore/train/serialization.py:1369] model.layers.10.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:05.667.33 [mindspore/train/serialization.py:1369] model.layers.11.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:05.675.95 [mindspore/train/serialization.py:1369] model.layers.11.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:05.680.38 [mindspore/train/serialization.py:1369] model.layers.11.attention.wq.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:05.239.683 [mindspore/train/serialization.py:1369] model.layers.11.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:05.295.174 [mindspore/train/serialization.py:1369] model.layers.11.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:05.369.572 [mindspore/train/serialization.py:1369] model.layers.11.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:05.539.566 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:06.112.957 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:06.673.423 [mindspore/train/serialization.py:1369] model.layers.11.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:07.269.081 [mindspore/train/serialization.py:1369] model.layers.12.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:07.269.925 [mindspore/train/serialization.py:1369] model.layers.12.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:07.270.354 [mindspore/train/serialization.py:1369] model.layers.12.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:07.442.306 [mindspore/train/serialization.py:1369] model.layers.12.attention.wk.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:07.522.771 [mindspore/train/serialization.py:1369] model.layers.12.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:07.574.749 [mindspore/train/serialization.py:1369] model.layers.12.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:07.763.591 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:08.381.752 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:08.963.816 [mindspore/train/serialization.py:1369] model.layers.12.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:09.567.954 [mindspore/train/serialization.py:1369] model.layers.13.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:09.568.807 [mindspore/train/serialization.py:1369] model.layers.13.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:09.569.234 [mindspore/train/serialization.py:1369] model.layers.13.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:09.768.029 [mindspore/train/serialization.py:1369] model.layers.13.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:09.844.815 [mindspore/train/serialization.py:1369] model.layers.13.attention.wv.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:09.896.086 [mindspore/train/serialization.py:1369] model.layers.13.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:10.682.01 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:10.662.744 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:11.233.488 [mindspore/train/serialization.py:1369] model.layers.13.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:11.825.104 [mindspore/train/serialization.py:1369] model.layers.14.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:11.826.085 [mindspore/train/serialization.py:1369] model.layers.14.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:11.826.546 [mindspore/train/serialization.py:1369] model.layers.14.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:12.505.5 [mindspore/train/serialization.py:1369] model.layers.14.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:12.570.25 [mindspore/train/serialization.py:1369] model.layers.14.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:12.111.611 [mindspore/train/serialization.py:1369] model.layers.14.attention.wo.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:12.286.976 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:12.871.176 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:13.462.045 [mindspore/train/serialization.py:1369] model.layers.14.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:14.600.19 [mindspore/train/serialization.py:1369] model.layers.15.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:14.608.98 [mindspore/train/serialization.py:1369] model.layers.15.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:14.613.70 [mindspore/train/serialization.py:1369] model.layers.15.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:14.230.031 [mindspore/train/serialization.py:1369] model.layers.15.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:14.282.187 [mindspore/train/serialization.py:1369] model.layers.15.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:14.328.174 [mindspore/train/serialization.py:1369] model.layers.15.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:14.497.874 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w1.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:15.577.85 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:15.642.953 [mindspore/train/serialization.py:1369] model.layers.15.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:16.210.999 [mindspore/train/serialization.py:1369] model.layers.16.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:16.211.801 [mindspore/train/serialization.py:1369] model.layers.16.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:16.212.228 [mindspore/train/serialization.py:1369] model.layers.16.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:16.408.787 [mindspore/train/serialization.py:1369] model.layers.16.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:16.475.955 [mindspore/train/serialization.py:1369] model.layers.16.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:16.534.443 [mindspore/train/serialization.py:1369] model.layers.16.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:16.742.991 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:17.301.035 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w2.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:17.905.900 [mindspore/train/serialization.py:1369] model.layers.16.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:18.498.327 [mindspore/train/serialization.py:1369] model.layers.17.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:18.499.510 [mindspore/train/serialization.py:1369] model.layers.17.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:18.500.048 [mindspore/train/serialization.py:1369] model.layers.17.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:18.665.986 [mindspore/train/serialization.py:1369] model.layers.17.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:18.766.530 [mindspore/train/serialization.py:1369] model.layers.17.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:18.820.343 [mindspore/train/serialization.py:1369] model.layers.17.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:18.997.550 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:19.569.795 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:20.145.788 [mindspore/train/serialization.py:1369] model.layers.17.feed_forward.w3.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:20.740.212 [mindspore/train/serialization.py:1369] model.layers.18.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:20.741.089 [mindspore/train/serialization.py:1369] model.layers.18.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:20.741.549 [mindspore/train/serialization.py:1369] model.layers.18.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:20.908.902 [mindspore/train/serialization.py:1369] model.layers.18.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:20.962.647 [mindspore/train/serialization.py:1369] model.layers.18.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:21.352.37 [mindspore/train/serialization.py:1369] model.layers.18.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:21.212.265 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:21.806.084 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:22.386.469 [mindspore/train/serialization.py:1369] model.layers.18.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:22.969.296 [mindspore/train/serialization.py:1369] model.layers.19.ffn_norm.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:22.970.151 [mindspore/train/serialization.py:1369] model.layers.19.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:22.970.589 [mindspore/train/serialization.py:1369] model.layers.19.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:23.139.662 [mindspore/train/serialization.py:1369] model.layers.19.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:23.187.835 [mindspore/train/serialization.py:1369] model.layers.19.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:23.230.129 [mindspore/train/serialization.py:1369] model.layers.19.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:23.423.689 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:24.372.9 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:24.575.417 [mindspore/train/serialization.py:1369] model.layers.19.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:25.171.430 [mindspore/train/serialization.py:1369] model.layers.20.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:25.172.278 [mindspore/train/serialization.py:1369] model.layers.20.attention_norm.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:25.172.731 [mindspore/train/serialization.py:1369] model.layers.20.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:25.346.844 [mindspore/train/serialization.py:1369] model.layers.20.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:25.410.585 [mindspore/train/serialization.py:1369] model.layers.20.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:25.461.535 [mindspore/train/serialization.py:1369] model.layers.20.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:25.626.137 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:26.236.925 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:26.804.948 [mindspore/train/serialization.py:1369] model.layers.20.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:27.417.374 [mindspore/train/serialization.py:1369] model.layers.21.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:27.418.248 [mindspore/train/serialization.py:1369] model.layers.21.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:27.419.088 [mindspore/train/serialization.py:1369] model.layers.21.attention.wq.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:27.643.167 [mindspore/train/serialization.py:1369] model.layers.21.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:27.708.392 [mindspore/train/serialization.py:1369] model.layers.21.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:27.753.688 [mindspore/train/serialization.py:1369] model.layers.21.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:27.940.711 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:28.498.998 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:29.678.43 [mindspore/train/serialization.py:1369] model.layers.21.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:29.641.046 [mindspore/train/serialization.py:1369] model.layers.22.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:29.642.022 [mindspore/train/serialization.py:1369] model.layers.22.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:29.642.469 [mindspore/train/serialization.py:1369] model.layers.22.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:29.813.417 [mindspore/train/serialization.py:1369] model.layers.22.attention.wk.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:29.864.597 [mindspore/train/serialization.py:1369] model.layers.22.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:29.917.121 [mindspore/train/serialization.py:1369] model.layers.22.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:30.913.43 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:30.668.619 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:31.232.223 [mindspore/train/serialization.py:1369] model.layers.22.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:31.816.458 [mindspore/train/serialization.py:1369] model.layers.23.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:31.817.386 [mindspore/train/serialization.py:1369] model.layers.23.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:31.817.843 [mindspore/train/serialization.py:1369] model.layers.23.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:31.994.895 [mindspore/train/serialization.py:1369] model.layers.23.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:32.445.82 [mindspore/train/serialization.py:1369] model.layers.23.attention.wv.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:32.970.47 [mindspore/train/serialization.py:1369] model.layers.23.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:32.273.576 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:32.859.503 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:33.442.544 [mindspore/train/serialization.py:1369] model.layers.23.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:34.146.33 [mindspore/train/serialization.py:1369] model.layers.24.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:34.154.49 [mindspore/train/serialization.py:1369] model.layers.24.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:34.158.69 [mindspore/train/serialization.py:1369] model.layers.24.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:34.189.651 [mindspore/train/serialization.py:1369] model.layers.24.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:34.250.526 [mindspore/train/serialization.py:1369] model.layers.24.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:34.306.361 [mindspore/train/serialization.py:1369] model.layers.24.attention.wo.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:34.487.787 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:35.669.32 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:35.639.633 [mindspore/train/serialization.py:1369] model.layers.24.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:36.251.025 [mindspore/train/serialization.py:1369] model.layers.25.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:36.251.853 [mindspore/train/serialization.py:1369] model.layers.25.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:36.252.277 [mindspore/train/serialization.py:1369] model.layers.25.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:36.421.809 [mindspore/train/serialization.py:1369] model.layers.25.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:36.471.574 [mindspore/train/serialization.py:1369] model.layers.25.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:36.532.086 [mindspore/train/serialization.py:1369] model.layers.25.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:36.707.647 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w1.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:37.271.762 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:37.865.969 [mindspore/train/serialization.py:1369] model.layers.25.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:38.434.652 [mindspore/train/serialization.py:1369] model.layers.26.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:38.435.520 [mindspore/train/serialization.py:1369] model.layers.26.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:38.435.951 [mindspore/train/serialization.py:1369] model.layers.26.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:38.629.355 [mindspore/train/serialization.py:1369] model.layers.26.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:38.701.682 [mindspore/train/serialization.py:1369] model.layers.26.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:38.757.844 [mindspore/train/serialization.py:1369] model.layers.26.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:38.942.972 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:39.561.625 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w2.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:40.121.306 [mindspore/train/serialization.py:1369] model.layers.26.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:40.726.142 [mindspore/train/serialization.py:1369] model.layers.27.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:40.726.982 [mindspore/train/serialization.py:1369] model.layers.27.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:40.727.416 [mindspore/train/serialization.py:1369] model.layers.27.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:40.892.003 [mindspore/train/serialization.py:1369] model.layers.27.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:40.942.550 [mindspore/train/serialization.py:1369] model.layers.27.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:40.990.631 [mindspore/train/serialization.py:1369] model.layers.27.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:41.158.321 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:41.726.937 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:42.299.662 [mindspore/train/serialization.py:1369] model.layers.27.feed_forward.w3.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:42.867.970 [mindspore/train/serialization.py:1369] model.layers.28.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:42.868.887 [mindspore/train/serialization.py:1369] model.layers.28.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:42.869.345 [mindspore/train/serialization.py:1369] model.layers.28.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:43.373.58 [mindspore/train/serialization.py:1369] model.layers.28.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:43.885.83 [mindspore/train/serialization.py:1369] model.layers.28.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:43.136.904 [mindspore/train/serialization.py:1369] model.layers.28.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:43.314.345 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:43.878.316 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:44.450.119 [mindspore/train/serialization.py:1369] model.layers.28.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:45.453.64 [mindspore/train/serialization.py:1369] model.layers.29.ffn_norm.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:45.463.14 [mindspore/train/serialization.py:1369] model.layers.29.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:45.468.07 [mindspore/train/serialization.py:1369] model.layers.29.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:45.235.343 [mindspore/train/serialization.py:1369] model.layers.29.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:45.291.113 [mindspore/train/serialization.py:1369] model.layers.29.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:45.351.787 [mindspore/train/serialization.py:1369] model.layers.29.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:45.531.343 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:46.109.547 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:46.679.575 [mindspore/train/serialization.py:1369] model.layers.29.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:47.263.481 [mindspore/train/serialization.py:1369] model.layers.30.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:47.264.338 [mindspore/train/serialization.py:1369] model.layers.30.attention_norm.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:47.264.766 [mindspore/train/serialization.py:1369] model.layers.30.attention.wq.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:47.433.588 [mindspore/train/serialization.py:1369] model.layers.30.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:47.481.871 [mindspore/train/serialization.py:1369] model.layers.30.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:47.530.982 [mindspore/train/serialization.py:1369] model.layers.30.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:47.719.519 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:48.312.795 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:48.882.895 [mindspore/train/serialization.py:1369] model.layers.30.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:49.460.008 [mindspore/train/serialization.py:1369] model.layers.31.ffn_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:49.460.866 [mindspore/train/serialization.py:1369] model.layers.31.attention_norm.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:49.461.310 [mindspore/train/serialization.py:1369] model.layers.31.attention.wq.weight is not init while load ckpt. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:49.629.225 [mindspore/train/serialization.py:1369] model.layers.31.attention.wk.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:49.680.114 [mindspore/train/serialization.py:1369] model.layers.31.attention.wv.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:49.727.719 [mindspore/train/serialization.py:1369] model.layers.31.attention.wo.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:49.921.453 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w1.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:50.488.100 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w2.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:51.821.49 [mindspore/train/serialization.py:1369] model.layers.31.feed_forward.w3.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:51.672.435 [mindspore/train/serialization.py:1369] model.norm_out.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:12:51.673.333 [mindspore/train/serialization.py:1369] lm_head.weight is not init while load ckpt. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:13:16.856.926 [mindspore/train/serialization.py:195] The type of model.layers.0.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:13:16.861.049 [mindspore/train/serialization.py:195] The type of model.layers.0.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:13:23.983.135 [mindspore/train/serialization.py:195] The type of model.layers.1.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:13:23.986.914 [mindspore/train/serialization.py:195] The type of model.layers.1.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:13:31.942.97 [mindspore/train/serialization.py:195] The type of model.layers.2.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:13:31.981.08 [mindspore/train/serialization.py:195] The type of model.layers.2.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:13:38.152.242 [mindspore/train/serialization.py:195] The type of model.layers.3.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:13:38.156.072 [mindspore/train/serialization.py:195] The type of model.layers.3.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:13:45.158.779 [mindspore/train/serialization.py:195] The type of model.layers.4.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:13:45.162.737 [mindspore/train/serialization.py:195] The type of model.layers.4.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:13:52.194.597 [mindspore/train/serialization.py:195] The type of model.layers.5.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:13:52.198.435 [mindspore/train/serialization.py:195] The type of model.layers.5.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:13:59.162.811 [mindspore/train/serialization.py:195] The type of model.layers.6.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:13:59.166.685 [mindspore/train/serialization.py:195] The type of model.layers.6.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:14:06.144.887 [mindspore/train/serialization.py:195] The type of model.layers.7.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:14:06.148.758 [mindspore/train/serialization.py:195] The type of model.layers.7.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:14:13.126.093 [mindspore/train/serialization.py:195] The type of model.layers.8.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:14:13.130.100 [mindspore/train/serialization.py:195] The type of model.layers.8.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:14:20.204.534 [mindspore/train/serialization.py:195] The type of model.layers.9.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:14:20.208.366 [mindspore/train/serialization.py:195] The type of model.layers.9.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:14:27.175.399 [mindspore/train/serialization.py:195] The type of model.layers.10.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:14:27.179.268 [mindspore/train/serialization.py:195] The type of model.layers.10.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:14:34.162.319 [mindspore/train/serialization.py:195] The type of model.layers.11.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:14:34.166.173 [mindspore/train/serialization.py:195] The type of model.layers.11.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:14:41.119.527 [mindspore/train/serialization.py:195] The type of model.layers.12.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:14:41.123.520 [mindspore/train/serialization.py:195] The type of model.layers.12.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:14:48.178.286 [mindspore/train/serialization.py:195] The type of model.layers.13.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:14:48.182.127 [mindspore/train/serialization.py:195] The type of model.layers.13.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:14:55.214.564 [mindspore/train/serialization.py:195] The type of model.layers.14.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:14:55.218.425 [mindspore/train/serialization.py:195] The type of model.layers.14.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:15:02.204.354 [mindspore/train/serialization.py:195] The type of model.layers.15.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:15:02.208.250 [mindspore/train/serialization.py:195] The type of model.layers.15.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:15:09.199.736 [mindspore/train/serialization.py:195] The type of model.layers.16.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:15:09.203.739 [mindspore/train/serialization.py:195] The type of model.layers.16.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:15:16.156.680 [mindspore/train/serialization.py:195] The type of model.layers.17.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:15:16.160.454 [mindspore/train/serialization.py:195] The type of model.layers.17.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:15:23.161.086 [mindspore/train/serialization.py:195] The type of model.layers.18.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:15:23.164.952 [mindspore/train/serialization.py:195] The type of model.layers.18.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:15:30.119.814 [mindspore/train/serialization.py:195] The type of model.layers.19.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:15:30.123.787 [mindspore/train/serialization.py:195] The type of model.layers.19.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:15:37.161.516 [mindspore/train/serialization.py:195] The type of model.layers.20.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:15:37.165.424 [mindspore/train/serialization.py:195] The type of model.layers.20.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:15:44.130.204 [mindspore/train/serialization.py:195] The type of model.layers.21.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:15:44.134.028 [mindspore/train/serialization.py:195] The type of model.layers.21.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:15:51.924.43 [mindspore/train/serialization.py:195] The type of model.layers.22.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:15:51.963.54 [mindspore/train/serialization.py:195] The type of model.layers.22.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:15:58.629.12 [mindspore/train/serialization.py:195] The type of model.layers.23.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:15:58.669.20 [mindspore/train/serialization.py:195] The type of model.layers.23.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:16:05.784.19 [mindspore/train/serialization.py:195] The type of model.layers.24.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:16:05.823.38 [mindspore/train/serialization.py:195] The type of model.layers.24.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:16:12.600.31 [mindspore/train/serialization.py:195] The type of model.layers.25.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:16:12.638.59 [mindspore/train/serialization.py:195] The type of model.layers.25.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:16:19.339.17 [mindspore/train/serialization.py:195] The type of model.layers.26.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:16:19.377.84 [mindspore/train/serialization.py:195] The type of model.layers.26.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:16:25.979.084 [mindspore/train/serialization.py:195] The type of model.layers.27.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:16:25.983.098 [mindspore/train/serialization.py:195] The type of model.layers.27.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:16:33.813.03 [mindspore/train/serialization.py:195] The type of model.layers.28.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:16:33.852.56 [mindspore/train/serialization.py:195] The type of model.layers.28.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:16:40.129.888 [mindspore/train/serialization.py:195] The type of model.layers.29.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:16:40.133.921 [mindspore/train/serialization.py:195] The type of model.layers.29.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:16:47.177.628 [mindspore/train/serialization.py:195] The type of model.layers.30.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:16:47.181.564 [mindspore/train/serialization.py:195] The type of model.layers.30.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:16:54.207.383 [mindspore/train/serialization.py:195] The type of model.layers.31.ffn_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:16:54.211.409 [mindspore/train/serialization.py:195] The type of model.layers.31.attention_norm.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:17:01.280.427 [mindspore/train/serialization.py:195] The type of model.norm_out.weight:BFloat16 in 'parameter_dict' is different from the type of it in 'net':Float32, then the type convert from BFloat16 to Float32 in the network. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:17:18.500.561 [mindspore/train/serialization.py:1456] For 'load_param_into_net', 128 parameters in the 'net' are not loaded, because they are not in the 'parameter_dict', please check whether the network structure is consistent when training and loading checkpoint. 
+[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:17:18.500.980 [mindspore/train/serialization.py:1460] ['model.layers.0.attention.wq.mindpet_delta_lora_a', 'model.layers.0.attention.wq.mindpet_delta_lora_b', 'model.layers.0.attention.wv.mindpet_delta_lora_a', 'model.layers.0.attention.wv.mindpet_delta_lora_b', 'model.layers.1.attention.wq.mindpet_delta_lora_a', 'model.layers.1.attention.wq.mindpet_delta_lora_b', 'model.layers.1.attention.wv.mindpet_delta_lora_a', 'model.layers.1.attention.wv.mindpet_delta_lora_b', 'model.layers.2.attention.wq.mindpet_delta_lora_a', 'model.layers.2.attention.wq.mindpet_delta_lora_b', 'model.layers.2.attention.wv.mindpet_delta_lora_a', 'model.layers.2.attention.wv.mindpet_delta_lora_b', 'model.layers.3.attention.wq.mindpet_delta_lora_a', 'model.layers.3.attention.wq.mindpet_delta_lora_b', 'model.layers.3.attention.wv.mindpet_delta_lora_a', 'model.layers.3.attention.wv.mindpet_delta_lora_b', 'model.layers.4.attention.wq.mindpet_delta_lora_a', 'model.layers.4.attention.wq.mindpet_delta_lora_b', 'model.layers.4.attention.wv.mindpet_delta_lora_a', 'model.layers.4.attention.wv.mindpet_delta_lora_b', 'model.layers.5.attention.wq.mindpet_delta_lora_a', 'model.layers.5.attention.wq.mindpet_delta_lora_b', 'model.layers.5.attention.wv.mindpet_delta_lora_a', 'model.layers.5.attention.wv.mindpet_delta_lora_b', 'model.layers.6.attention.wq.mindpet_delta_lora_a', 'model.layers.6.attention.wq.mindpet_delta_lora_b', 'model.layers.6.attention.wv.mindpet_delta_lora_a', 'model.layers.6.attention.wv.mindpet_delta_lora_b', 'model.layers.7.attention.wq.mindpet_delta_lora_a', 'model.layers.7.attention.wq.mindpet_delta_lora_b', 'model.layers.7.attention.wv.mindpet_delta_lora_a', 'model.layers.7.attention.wv.mindpet_delta_lora_b', 'model.layers.8.attention.wq.mindpet_delta_lora_a', 'model.layers.8.attention.wq.mindpet_delta_lora_b', 'model.layers.8.attention.wv.mindpet_delta_lora_a', 'model.layers.8.attention.wv.mindpet_delta_lora_b', 
'model.layers.9.attention.wq.mindpet_delta_lora_a', 'model.layers.9.attention.wq.mindpet_delta_lora_b', 'model.layers.9.attention.wv.mindpet_delta_lora_a', 'model.layers.9.attention.wv.mindpet_delta_lora_b', 'model.layers.10.attention.wq.mindpet_delta_lora_a', 'model.layers.10.attention.wq.mindpet_delta_lora_b', 'model.layers.10.attention.wv.mindpet_delta_lora_a', 'model.layers.10.attention.wv.mindpet_delta_lora_b', 'model.layers.11.attention.wq.mindpet_delta_lora_a', 'model.layers.11.attention.wq.mindpet_delta_lora_b', 'model.layers.11.attention.wv.mindpet_delta_lora_a', 'model.layers.11.attention.wv.mindpet_delta_lora_b', 'model.layers.12.attention.wq.mindpet_delta_lora_a', 'model.layers.12.attention.wq.mindpet_delta_lora_b', 'model.layers.12.attention.wv.mindpet_delta_lora_a', 'model.layers.12.attention.wv.mindpet_delta_lora_b', 'model.layers.13.attention.wq.mindpet_delta_lora_a', 'model.layers.13.attention.wq.mindpet_delta_lora_b', 'model.layers.13.attention.wv.mindpet_delta_lora_a', 'model.layers.13.attention.wv.mindpet_delta_lora_b', 'model.layers.14.attention.wq.mindpet_delta_lora_a', 'model.layers.14.attention.wq.mindpet_delta_lora_b', 'model.layers.14.attention.wv.mindpet_delta_lora_a', 'model.layers.14.attention.wv.mindpet_delta_lora_b', 'model.layers.15.attention.wq.mindpet_delta_lora_a', 'model.layers.15.attention.wq.mindpet_delta_lora_b', 'model.layers.15.attention.wv.mindpet_delta_lora_a', 'model.layers.15.attention.wv.mindpet_delta_lora_b', 'model.layers.16.attention.wq.mindpet_delta_lora_a', 'model.layers.16.attention.wq.mindpet_delta_lora_b', 'model.layers.16.attention.wv.mindpet_delta_lora_a', 'model.layers.16.attention.wv.mindpet_delta_lora_b', 'model.layers.17.attention.wq.mindpet_delta_lora_a', 'model.layers.17.attention.wq.mindpet_delta_lora_b', 'model.layers.17.attention.wv.mindpet_delta_lora_a', 'model.layers.17.attention.wv.mindpet_delta_lora_b', 'model.layers.18.attention.wq.mindpet_delta_lora_a', 
'model.layers.18.attention.wq.mindpet_delta_lora_b', 'model.layers.18.attention.wv.mindpet_delta_lora_a', 'model.layers.18.attention.wv.mindpet_delta_lora_b', 'model.layers.19.attention.wq.mindpet_delta_lora_a', 'model.layers.19.attention.wq.mindpet_delta_lora_b', 'model.layers.19.attention.wv.mindpet_delta_lora_a', 'model.layers.19.attention.wv.mindpet_delta_lora_b', 'model.layers.20.attention.wq.mindpet_delta_lora_a', 'model.layers.20.attention.wq.mindpet_delta_lora_b', 'model.layers.20.attention.wv.mindpet_delta_lora_a', 'model.layers.20.attention.wv.mindpet_delta_lora_b', 'model.layers.21.attention.wq.mindpet_delta_lora_a', 'model.layers.21.attention.wq.mindpet_delta_lora_b', 'model.layers.21.attention.wv.mindpet_delta_lora_a', 'model.layers.21.attention.wv.mindpet_delta_lora_b', 'model.layers.22.attention.wq.mindpet_delta_lora_a', 'model.layers.22.attention.wq.mindpet_delta_lora_b', 'model.layers.22.attention.wv.mindpet_delta_lora_a', 'model.layers.22.attention.wv.mindpet_delta_lora_b', 'model.layers.23.attention.wq.mindpet_delta_lora_a', 'model.layers.23.attention.wq.mindpet_delta_lora_b', 'model.layers.23.attention.wv.mindpet_delta_lora_a', 'model.layers.23.attention.wv.mindpet_delta_lora_b', 'model.layers.24.attention.wq.mindpet_delta_lora_a', 'model.layers.24.attention.wq.mindpet_delta_lora_b', 'model.layers.24.attention.wv.mindpet_delta_lora_a', 'model.layers.24.attention.wv.mindpet_delta_lora_b', 'model.layers.25.attention.wq.mindpet_delta_lora_a', 'model.layers.25.attention.wq.mindpet_delta_lora_b', 'model.layers.25.attention.wv.mindpet_delta_lora_a', 'model.layers.25.attention.wv.mindpet_delta_lora_b', 'model.layers.26.attention.wq.mindpet_delta_lora_a', 'model.layers.26.attention.wq.mindpet_delta_lora_b', 'model.layers.26.attention.wv.mindpet_delta_lora_a', 'model.layers.26.attention.wv.mindpet_delta_lora_b', 'model.layers.27.attention.wq.mindpet_delta_lora_a', 'model.layers.27.attention.wq.mindpet_delta_lora_b', 
'model.layers.27.attention.wv.mindpet_delta_lora_a', 'model.layers.27.attention.wv.mindpet_delta_lora_b', 'model.layers.28.attention.wq.mindpet_delta_lora_a', 'model.layers.28.attention.wq.mindpet_delta_lora_b', 'model.layers.28.attention.wv.mindpet_delta_lora_a', 'model.layers.28.attention.wv.mindpet_delta_lora_b', 'model.layers.29.attention.wq.mindpet_delta_lora_a', 'model.layers.29.attention.wq.mindpet_delta_lora_b', 'model.layers.29.attention.wv.mindpet_delta_lora_a', 'model.layers.29.attention.wv.mindpet_delta_lora_b', 'model.layers.30.attention.wq.mindpet_delta_lora_a', 'model.layers.30.attention.wq.mindpet_delta_lora_b', 'model.layers.30.attention.wv.mindpet_delta_lora_a', 'model.layers.30.attention.wv.mindpet_delta_lora_b', 'model.layers.31.attention.wq.mindpet_delta_lora_a', 'model.layers.31.attention.wq.mindpet_delta_lora_b', 'model.layers.31.attention.wv.mindpet_delta_lora_a', 'model.layers.31.attention.wv.mindpet_delta_lora_b'] are not loaded. +2024-07-25 18:17:18,501 - mindformers[mindformers/trainer/utils.py:767] - INFO - Network parameters are not loaded: (['model.layers.0.attention.wq.mindpet_delta_lora_a', 'model.layers.0.attention.wq.mindpet_delta_lora_b', 'model.layers.0.attention.wv.mindpet_delta_lora_a', 'model.layers.0.attention.wv.mindpet_delta_lora_b', 'model.layers.1.attention.wq.mindpet_delta_lora_a', 'model.layers.1.attention.wq.mindpet_delta_lora_b', 'model.layers.1.attention.wv.mindpet_delta_lora_a', 'model.layers.1.attention.wv.mindpet_delta_lora_b', 'model.layers.2.attention.wq.mindpet_delta_lora_a', 'model.layers.2.attention.wq.mindpet_delta_lora_b', 'model.layers.2.attention.wv.mindpet_delta_lora_a', 'model.layers.2.attention.wv.mindpet_delta_lora_b', 'model.layers.3.attention.wq.mindpet_delta_lora_a', 'model.layers.3.attention.wq.mindpet_delta_lora_b', 'model.layers.3.attention.wv.mindpet_delta_lora_a', 'model.layers.3.attention.wv.mindpet_delta_lora_b', 'model.layers.4.attention.wq.mindpet_delta_lora_a', 
'model.layers.4.attention.wq.mindpet_delta_lora_b', 'model.layers.4.attention.wv.mindpet_delta_lora_a', 'model.layers.4.attention.wv.mindpet_delta_lora_b', 'model.layers.5.attention.wq.mindpet_delta_lora_a', 'model.layers.5.attention.wq.mindpet_delta_lora_b', 'model.layers.5.attention.wv.mindpet_delta_lora_a', 'model.layers.5.attention.wv.mindpet_delta_lora_b', 'model.layers.6.attention.wq.mindpet_delta_lora_a', 'model.layers.6.attention.wq.mindpet_delta_lora_b', 'model.layers.6.attention.wv.mindpet_delta_lora_a', 'model.layers.6.attention.wv.mindpet_delta_lora_b', 'model.layers.7.attention.wq.mindpet_delta_lora_a', 'model.layers.7.attention.wq.mindpet_delta_lora_b', 'model.layers.7.attention.wv.mindpet_delta_lora_a', 'model.layers.7.attention.wv.mindpet_delta_lora_b', 'model.layers.8.attention.wq.mindpet_delta_lora_a', 'model.layers.8.attention.wq.mindpet_delta_lora_b', 'model.layers.8.attention.wv.mindpet_delta_lora_a', 'model.layers.8.attention.wv.mindpet_delta_lora_b', 'model.layers.9.attention.wq.mindpet_delta_lora_a', 'model.layers.9.attention.wq.mindpet_delta_lora_b', 'model.layers.9.attention.wv.mindpet_delta_lora_a', 'model.layers.9.attention.wv.mindpet_delta_lora_b', 'model.layers.10.attention.wq.mindpet_delta_lora_a', 'model.layers.10.attention.wq.mindpet_delta_lora_b', 'model.layers.10.attention.wv.mindpet_delta_lora_a', 'model.layers.10.attention.wv.mindpet_delta_lora_b', 'model.layers.11.attention.wq.mindpet_delta_lora_a', 'model.layers.11.attention.wq.mindpet_delta_lora_b', 'model.layers.11.attention.wv.mindpet_delta_lora_a', 'model.layers.11.attention.wv.mindpet_delta_lora_b', 'model.layers.12.attention.wq.mindpet_delta_lora_a', 'model.layers.12.attention.wq.mindpet_delta_lora_b', 'model.layers.12.attention.wv.mindpet_delta_lora_a', 'model.layers.12.attention.wv.mindpet_delta_lora_b', 'model.layers.13.attention.wq.mindpet_delta_lora_a', 'model.layers.13.attention.wq.mindpet_delta_lora_b', 'model.layers.13.attention.wv.mindpet_delta_lora_a', 
'model.layers.13.attention.wv.mindpet_delta_lora_b', 'model.layers.14.attention.wq.mindpet_delta_lora_a', 'model.layers.14.attention.wq.mindpet_delta_lora_b', 'model.layers.14.attention.wv.mindpet_delta_lora_a', 'model.layers.14.attention.wv.mindpet_delta_lora_b', 'model.layers.15.attention.wq.mindpet_delta_lora_a', 'model.layers.15.attention.wq.mindpet_delta_lora_b', 'model.layers.15.attention.wv.mindpet_delta_lora_a', 'model.layers.15.attention.wv.mindpet_delta_lora_b', 'model.layers.16.attention.wq.mindpet_delta_lora_a', 'model.layers.16.attention.wq.mindpet_delta_lora_b', 'model.layers.16.attention.wv.mindpet_delta_lora_a', 'model.layers.16.attention.wv.mindpet_delta_lora_b', 'model.layers.17.attention.wq.mindpet_delta_lora_a', 'model.layers.17.attention.wq.mindpet_delta_lora_b', 'model.layers.17.attention.wv.mindpet_delta_lora_a', 'model.layers.17.attention.wv.mindpet_delta_lora_b', 'model.layers.18.attention.wq.mindpet_delta_lora_a', 'model.layers.18.attention.wq.mindpet_delta_lora_b', 'model.layers.18.attention.wv.mindpet_delta_lora_a', 'model.layers.18.attention.wv.mindpet_delta_lora_b', 'model.layers.19.attention.wq.mindpet_delta_lora_a', 'model.layers.19.attention.wq.mindpet_delta_lora_b', 'model.layers.19.attention.wv.mindpet_delta_lora_a', 'model.layers.19.attention.wv.mindpet_delta_lora_b', 'model.layers.20.attention.wq.mindpet_delta_lora_a', 'model.layers.20.attention.wq.mindpet_delta_lora_b', 'model.layers.20.attention.wv.mindpet_delta_lora_a', 'model.layers.20.attention.wv.mindpet_delta_lora_b', 'model.layers.21.attention.wq.mindpet_delta_lora_a', 'model.layers.21.attention.wq.mindpet_delta_lora_b', 'model.layers.21.attention.wv.mindpet_delta_lora_a', 'model.layers.21.attention.wv.mindpet_delta_lora_b', 'model.layers.22.attention.wq.mindpet_delta_lora_a', 'model.layers.22.attention.wq.mindpet_delta_lora_b', 'model.layers.22.attention.wv.mindpet_delta_lora_a', 'model.layers.22.attention.wv.mindpet_delta_lora_b', 
'model.layers.23.attention.wq.mindpet_delta_lora_a', 'model.layers.23.attention.wq.mindpet_delta_lora_b', 'model.layers.23.attention.wv.mindpet_delta_lora_a', 'model.layers.23.attention.wv.mindpet_delta_lora_b', 'model.layers.24.attention.wq.mindpet_delta_lora_a', 'model.layers.24.attention.wq.mindpet_delta_lora_b', 'model.layers.24.attention.wv.mindpet_delta_lora_a', 'model.layers.24.attention.wv.mindpet_delta_lora_b', 'model.layers.25.attention.wq.mindpet_delta_lora_a', 'model.layers.25.attention.wq.mindpet_delta_lora_b', 'model.layers.25.attention.wv.mindpet_delta_lora_a', 'model.layers.25.attention.wv.mindpet_delta_lora_b', 'model.layers.26.attention.wq.mindpet_delta_lora_a', 'model.layers.26.attention.wq.mindpet_delta_lora_b', 'model.layers.26.attention.wv.mindpet_delta_lora_a', 'model.layers.26.attention.wv.mindpet_delta_lora_b', 'model.layers.27.attention.wq.mindpet_delta_lora_a', 'model.layers.27.attention.wq.mindpet_delta_lora_b', 'model.layers.27.attention.wv.mindpet_delta_lora_a', 'model.layers.27.attention.wv.mindpet_delta_lora_b', 'model.layers.28.attention.wq.mindpet_delta_lora_a', 'model.layers.28.attention.wq.mindpet_delta_lora_b', 'model.layers.28.attention.wv.mindpet_delta_lora_a', 'model.layers.28.attention.wv.mindpet_delta_lora_b', 'model.layers.29.attention.wq.mindpet_delta_lora_a', 'model.layers.29.attention.wq.mindpet_delta_lora_b', 'model.layers.29.attention.wv.mindpet_delta_lora_a', 'model.layers.29.attention.wv.mindpet_delta_lora_b', 'model.layers.30.attention.wq.mindpet_delta_lora_a', 'model.layers.30.attention.wq.mindpet_delta_lora_b', 'model.layers.30.attention.wv.mindpet_delta_lora_a', 'model.layers.30.attention.wv.mindpet_delta_lora_b', 'model.layers.31.attention.wq.mindpet_delta_lora_a', 'model.layers.31.attention.wq.mindpet_delta_lora_b', 'model.layers.31.attention.wv.mindpet_delta_lora_a', 'model.layers.31.attention.wv.mindpet_delta_lora_b'], []) +2024-07-25 18:17:18,502 - mindformers[mindformers/trainer/base_trainer.py:770] - INFO 
- .........Starting Training Model.......... +2024-07-25 18:17:18,502 - mindformers[mindformers/trainer/base_trainer.py:773] - INFO - .........Model Compiling, Please Wait a Moment........... +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:17:18.503.536 [mindspore/train/model.py:1120] For MFLossMonitor callback, {'step_end', 'epoch_end', 'step_begin', 'epoch_begin'} methods may not be supported in later version, Use methods prefixed with 'on_train' or 'on_eval' instead when using customized callbacks. +[WARNING] ME(62203:281473603272720,MainProcess):2024-07-25-18:17:18.503.670 [mindspore/train/model.py:1120] For Local2ObsMonitor callback, {'step_end', 'epoch_end'} methods may not be supported in later version, Use methods prefixed with 'on_train' or 'on_eval' instead when using customized callbacks. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.973.700 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/31-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.974.438 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/30-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.975.112 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/29-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.975.777 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/28-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.976.435 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/27-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.977.095 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/26-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.977.815 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/25-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.978.483 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/24-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.979.139 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/23-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.979.787 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/22-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.980.442 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/21-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.981.088 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/20-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.981.760 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/19-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.982.411 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/18-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.983.075 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/17-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.983.724 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/16-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.984.367 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/15-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.985.015 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/14-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.985.683 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/13-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.986.328 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/12-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.986.975 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/11-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.987.620 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/10-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.988.285 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/9-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.988.940 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/8-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.989.620 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/7-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.990.269 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/6-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.990.912 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/5-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.991.552 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/4-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.992.191 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/3-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.992.824 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/2-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.993.505 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/1-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.994.142 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/0-LLamaDecodeLayer/attention-LLamaAttention/wq-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.994.594 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/0-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.995.308 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/1-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.996.035 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/2-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.996.753 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/3-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.997.506 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/4-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.998.241 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/5-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.998.972 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/6-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:45.999.688 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/7-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.000.411 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/8-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.001.146 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/9-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.001.896 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/10-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.002.622 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/11-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.003.331 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/12-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.004.040 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/13-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.004.751 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/14-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.005.473 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/15-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.006.172 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/16-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.006.885 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/17-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.007.566 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/18-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.008.244 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/19-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.008.928 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/20-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.009.632 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/21-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.010.328 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/22-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.011.004 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/23-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.011.651 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/24-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.012.271 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/25-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. 
+[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.012.890 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/26-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.013.526 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/27-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.014.140 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/28-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.014.749 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/29-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. 
If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.015.382 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/30-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:46.015.991 [mindspore/ccsrc/frontend/parallel/step_parallel.cc:1929] ReshapeInit] FindNextLayout for recompute_Default/network-MFTrainOneStepCell/network-_VirtualDatasetCell/_backbone-PetModel/pet_model-LoraModel/lora_model-LlamaForCausalLM/model-LlamaModel/layers-CellList/31-LLamaDecodeLayer/attention-LLamaAttention/wv-LoRADense/Reshape-op0 return nullptr, and is_next_reshape is 1. If reshape is not the last primitive, there must be some error. +[WARNING] PARALLEL(62203,ffffae230010,python):2024-07-25-18:17:48.535.992 [mindspore/ccsrc/frontend/parallel/graph_util/graph_utils.cc:68] GetTensorRedistributionFromCNode] Default/network-MFTrainOneStepCell/clip_grad_norm-ClipGradNorm/Sqrt-op0 has no OperatorInfo. 
+- \ | / - \ 2024-07-25 18:28:34,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 2/ 1625], loss: 1.518, per_step_time: 337404ms, lr: 1.8461538e-08, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:34,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 0.02371 samples/s/p 63 days, 10:49:01 } +2024-07-25 18:28:38,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 4/ 1625], loss: 1.444, per_step_time: 1479ms, lr: 5.538461e-08, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:38,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 5.40697 samples/s/p 6:40:37 } +2024-07-25 18:28:41,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 6/ 1625], loss: 1.332, per_step_time: 1473ms, lr: 9.230769e-08, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:41,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 5.42950 samples/s/p 6:38:54 } +2024-07-25 18:28:44,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 8/ 1625], loss: 1.351, per_step_time: 1479ms, lr: 1.2923077e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:44,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.0% | | 5.40764 samples/s/p 6:40:28 } +2024-07-25 18:28:47,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 10/ 1625], loss: 1.390, per_step_time: 1470ms, lr: 1.6615384e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:47,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.44183 samples/s/p 6:37:54 } +2024-07-25 18:28:50,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 12/ 1625], loss: 1.383, per_step_time: 1472ms, lr: 2.0307691e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 
18:28:50,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43294 samples/s/p 6:38:30 } +2024-07-25 18:28:52,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 14/ 1625], loss: 1.447, per_step_time: 1470ms, lr: 2.4e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:52,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43865 samples/s/p 6:38:02 } +2024-07-25 18:28:55,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 16/ 1625], loss: 1.293, per_step_time: 1473ms, lr: 2.7692306e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:55,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43014 samples/s/p 6:38:36 } +2024-07-25 18:28:58,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 18/ 1625], loss: 1.406, per_step_time: 1474ms, lr: 3.1384613e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:28:58,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.42710 samples/s/p 6:38:47 } +2024-07-25 18:29:01,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 20/ 1625], loss: 1.348, per_step_time: 1472ms, lr: 3.5076923e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:01,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43308 samples/s/p 6:38:18 } +2024-07-25 18:29:04,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 22/ 1625], loss: 1.420, per_step_time: 1473ms, lr: 3.876923e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:04,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.42818 samples/s/p 6:38:36 } +2024-07-25 18:29:07,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 24/ 1625], loss: 
1.562, per_step_time: 1471ms, lr: 4.2461537e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:07,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.1% | | 5.43559 samples/s/p 6:38:01 } +2024-07-25 18:29:10,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 26/ 1625], loss: 1.360, per_step_time: 1471ms, lr: 4.6153846e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:10,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43680 samples/s/p 6:37:52 } +2024-07-25 18:29:13,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 28/ 1625], loss: 1.523, per_step_time: 1471ms, lr: 4.9846153e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:13,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43556 samples/s/p 6:37:55 } +2024-07-25 18:29:16,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 30/ 1625], loss: 1.471, per_step_time: 1473ms, lr: 5.3538463e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:16,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.42893 samples/s/p 6:38:21 } +2024-07-25 18:29:19,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 32/ 1625], loss: 1.504, per_step_time: 1471ms, lr: 5.7230767e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:19,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43600 samples/s/p 6:37:47 } +2024-07-25 18:29:22,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 34/ 1625], loss: 1.483, per_step_time: 1471ms, lr: 6.092307e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:22,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43514 samples/s/p 6:37:48 } +2024-07-25 18:29:25,452 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 36/ 1625], loss: 1.478, per_step_time: 1471ms, lr: 6.461538e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:25,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.43549 samples/s/p 6:37:43 } +2024-07-25 18:29:28,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 38/ 1625], loss: 1.330, per_step_time: 1473ms, lr: 6.8307685e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:28,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.42815 samples/s/p 6:38:13 } +2024-07-25 18:29:31,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 40/ 1625], loss: 1.169, per_step_time: 1474ms, lr: 7.2e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:31,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.2% | | 5.42552 samples/s/p 6:38:21 } +2024-07-25 18:29:34,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 42/ 1625], loss: 1.627, per_step_time: 1472ms, lr: 7.5692304e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:34,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.43145 samples/s/p 6:37:52 } +2024-07-25 18:29:37,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 44/ 1625], loss: 1.519, per_step_time: 1471ms, lr: 7.9384614e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:37,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.43729 samples/s/p 6:37:24 } +2024-07-25 18:29:40,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 46/ 1625], loss: 1.278, per_step_time: 1473ms, lr: 8.307692e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:40,220 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.43027 samples/s/p 6:37:52 } +2024-07-25 18:29:43,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 48/ 1625], loss: 1.576, per_step_time: 1471ms, lr: 8.676922e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:43,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.43505 samples/s/p 6:37:28 } +2024-07-25 18:29:46,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 50/ 1625], loss: 1.361, per_step_time: 1473ms, lr: 9.046154e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:46,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.42805 samples/s/p 6:37:55 } +2024-07-25 18:29:49,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 52/ 1625], loss: 1.520, per_step_time: 1472ms, lr: 9.4153836e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:49,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.43148 samples/s/p 6:37:37 } +2024-07-25 18:29:52,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 54/ 1625], loss: 1.476, per_step_time: 1473ms, lr: 9.784615e-07, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:52,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.42950 samples/s/p 6:37:43 } +2024-07-25 18:29:54,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 56/ 1625], loss: 1.118, per_step_time: 1473ms, lr: 1.0153847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:54,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.3% | | 5.42948 samples/s/p 6:37:40 } +2024-07-25 18:29:57,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 58/ 1625], loss: 1.420, 
per_step_time: 1473ms, lr: 1.0523077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:29:57,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.42763 samples/s/p 6:37:46 } +2024-07-25 18:30:00,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 60/ 1625], loss: 1.523, per_step_time: 1474ms, lr: 1.0892308e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:00,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.42702 samples/s/p 6:37:45 } +2024-07-25 18:30:03,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 62/ 1625], loss: 1.416, per_step_time: 1473ms, lr: 1.1261538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:03,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43053 samples/s/p 6:37:27 } +2024-07-25 18:30:06,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 64/ 1625], loss: 1.257, per_step_time: 1473ms, lr: 1.1630768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:06,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43068 samples/s/p 6:37:23 } +2024-07-25 18:30:09,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 66/ 1625], loss: 1.349, per_step_time: 1472ms, lr: 1.1999999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:09,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43434 samples/s/p 6:37:04 } +2024-07-25 18:30:12,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 68/ 1625], loss: 1.436, per_step_time: 1471ms, lr: 1.236923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:12,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43563 samples/s/p 6:36:56 } +2024-07-25 18:30:15,654 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 70/ 1625], loss: 1.423, per_step_time: 1471ms, lr: 1.2738461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:15,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43827 samples/s/p 6:36:41 } +2024-07-25 18:30:18,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 72/ 1625], loss: 1.402, per_step_time: 1471ms, lr: 1.3107691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:18,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.4% | | 5.43602 samples/s/p 6:36:48 } +2024-07-25 18:30:21,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 74/ 1625], loss: 1.433, per_step_time: 1475ms, lr: 1.3476922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:21,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.42246 samples/s/p 6:37:45 } +2024-07-25 18:30:24,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 76/ 1625], loss: 1.482, per_step_time: 1472ms, lr: 1.3846154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:24,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.43200 samples/s/p 6:37:00 } +2024-07-25 18:30:27,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 78/ 1625], loss: 1.335, per_step_time: 1473ms, lr: 1.4215384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:27,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.42856 samples/s/p 6:37:12 } +2024-07-25 18:30:30,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 80/ 1625], loss: 1.323, per_step_time: 1473ms, lr: 1.4584615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:30,424 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.42973 samples/s/p 6:37:04 } +2024-07-25 18:30:33,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 82/ 1625], loss: 1.471, per_step_time: 1474ms, lr: 1.4953846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:33,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.42510 samples/s/p 6:37:21 } +2024-07-25 18:30:36,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 84/ 1625], loss: 1.493, per_step_time: 1472ms, lr: 1.5323077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:36,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.43349 samples/s/p 6:36:42 } +2024-07-25 18:30:39,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 86/ 1625], loss: 1.431, per_step_time: 1473ms, lr: 1.5692307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:39,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.42852 samples/s/p 6:37:00 } +2024-07-25 18:30:42,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 88/ 1625], loss: 1.613, per_step_time: 1471ms, lr: 1.6061538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:42,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.5% | | 5.43832 samples/s/p 6:36:14 } +2024-07-25 18:30:45,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 90/ 1625], loss: 1.673, per_step_time: 1483ms, lr: 1.6430769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:45,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.39375 samples/s/p 6:39:28 } +2024-07-25 18:30:48,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 92/ 1625], loss: 1.348, 
per_step_time: 1471ms, lr: 1.6799999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:48,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43631 samples/s/p 6:36:17 } +2024-07-25 18:30:51,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 94/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 1.716923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:51,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43567 samples/s/p 6:36:17 } +2024-07-25 18:30:54,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 96/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 1.753846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:54,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43612 samples/s/p 6:36:12 } +2024-07-25 18:30:57,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 98/ 1625], loss: 1.372, per_step_time: 1470ms, lr: 1.7907691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:57,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.44061 samples/s/p 6:35:50 } +2024-07-25 18:30:59,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 100/ 1625], loss: 1.329, per_step_time: 1471ms, lr: 1.8276922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:30:59,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43797 samples/s/p 6:35:58 } +2024-07-25 18:31:02,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 102/ 1625], loss: 1.413, per_step_time: 1472ms, lr: 1.8646153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:02,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43335 samples/s/p 6:36:16 } +2024-07-25 18:31:05,861 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 104/ 1625], loss: 1.332, per_step_time: 1472ms, lr: 1.9015384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:05,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.6% | | 5.43180 samples/s/p 6:36:19 } +2024-07-25 18:31:08,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 106/ 1625], loss: 1.178, per_step_time: 1474ms, lr: 1.9384615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:08,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.42707 samples/s/p 6:36:37 } +2024-07-25 18:31:11,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 108/ 1625], loss: 1.504, per_step_time: 1472ms, lr: 1.9753845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:11,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43449 samples/s/p 6:36:02 } +2024-07-25 18:31:14,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 110/ 1625], loss: 1.302, per_step_time: 1471ms, lr: 2.0123075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:14,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43685 samples/s/p 6:35:49 } +2024-07-25 18:31:17,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 112/ 1625], loss: 1.379, per_step_time: 1471ms, lr: 2.0492307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:17,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43751 samples/s/p 6:35:43 } +2024-07-25 18:31:20,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 114/ 1625], loss: 1.391, per_step_time: 1470ms, lr: 2.0861537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:20,616 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43941 samples/s/p 6:35:31 } +2024-07-25 18:31:23,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 116/ 1625], loss: 1.443, per_step_time: 1471ms, lr: 2.1230767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:23,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43693 samples/s/p 6:35:39 } +2024-07-25 18:31:26,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 118/ 1625], loss: 1.047, per_step_time: 1471ms, lr: 2.16e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:26,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.43684 samples/s/p 6:35:37 } +2024-07-25 18:31:29,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 120/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 2.1969229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:29,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.7% | | 5.42987 samples/s/p 6:36:04 } +2024-07-25 18:31:32,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 122/ 1625], loss: 1.398, per_step_time: 1471ms, lr: 2.233846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:32,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43528 samples/s/p 6:35:38 } +2024-07-25 18:31:35,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 124/ 1625], loss: 1.370, per_step_time: 1472ms, lr: 2.270769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:35,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43355 samples/s/p 6:35:42 } +2024-07-25 18:31:38,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 126/ 1625], loss: 1.199, 
per_step_time: 1475ms, lr: 2.307692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:38,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.42295 samples/s/p 6:36:26 } +2024-07-25 18:31:41,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 128/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.3446153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:41,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43649 samples/s/p 6:35:24 } +2024-07-25 18:31:44,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 130/ 1625], loss: 1.262, per_step_time: 1474ms, lr: 2.3815385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:44,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.42495 samples/s/p 6:36:11 } +2024-07-25 18:31:47,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 132/ 1625], loss: 1.332, per_step_time: 1472ms, lr: 2.4184615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:47,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43394 samples/s/p 6:35:29 } +2024-07-25 18:31:50,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 134/ 1625], loss: 1.484, per_step_time: 1472ms, lr: 2.4553847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:50,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43446 samples/s/p 6:35:24 } +2024-07-25 18:31:53,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 136/ 1625], loss: 1.322, per_step_time: 1473ms, lr: 2.4923077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:53,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.42784 samples/s/p 6:35:50 } +2024-07-25 18:31:56,044 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 138/ 1625], loss: 1.332, per_step_time: 1472ms, lr: 2.5292306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:56,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.8% | | 5.43473 samples/s/p 6:35:17 } +2024-07-25 18:31:58,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 140/ 1625], loss: 1.388, per_step_time: 1472ms, lr: 2.5661539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:31:58,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43322 samples/s/p 6:35:20 } +2024-07-25 18:32:01,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 142/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 2.6030768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:01,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43232 samples/s/p 6:35:21 } +2024-07-25 18:32:04,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 144/ 1625], loss: 1.342, per_step_time: 1472ms, lr: 2.6399998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:04,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43245 samples/s/p 6:35:18 } +2024-07-25 18:32:07,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 146/ 1625], loss: 1.334, per_step_time: 1472ms, lr: 2.676923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:07,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43360 samples/s/p 6:35:10 } +2024-07-25 18:32:10,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 148/ 1625], loss: 1.377, per_step_time: 1472ms, lr: 2.713846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:10,805 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43112 samples/s/p 6:35:18 } +2024-07-25 18:32:13,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 150/ 1625], loss: 1.384, per_step_time: 1470ms, lr: 2.7507692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:13,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.44032 samples/s/p 6:34:35 } +2024-07-25 18:32:16,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 152/ 1625], loss: 1.442, per_step_time: 1471ms, lr: 2.7876922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:16,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43572 samples/s/p 6:34:52 } +2024-07-25 18:32:19,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 154/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 2.8246152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:19,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 0.9% | | 5.43308 samples/s/p 6:35:00 } +2024-07-25 18:32:22,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 156/ 1625], loss: 1.473, per_step_time: 1471ms, lr: 2.8615384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:22,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43740 samples/s/p 6:34:38 } +2024-07-25 18:32:25,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 158/ 1625], loss: 1.352, per_step_time: 1471ms, lr: 2.8984614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:25,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43509 samples/s/p 6:34:46 } +2024-07-25 18:32:28,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 160/ 1625], loss: 1.335, 
per_step_time: 1473ms, lr: 2.9353844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:28,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.42992 samples/s/p 6:35:05 } +2024-07-25 18:32:31,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 162/ 1625], loss: 1.487, per_step_time: 1472ms, lr: 2.9723076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:31,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43331 samples/s/p 6:34:47 } +2024-07-25 18:32:34,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 164/ 1625], loss: 1.285, per_step_time: 1470ms, lr: 3.0092306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:34,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43855 samples/s/p 6:34:22 } +2024-07-25 18:32:37,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 166/ 1625], loss: 1.387, per_step_time: 1472ms, lr: 3.0461536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:37,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43270 samples/s/p 6:34:44 } +2024-07-25 18:32:40,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 168/ 1625], loss: 1.343, per_step_time: 1471ms, lr: 3.0830768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:40,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43665 samples/s/p 6:34:24 } +2024-07-25 18:32:43,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 170/ 1625], loss: 1.357, per_step_time: 1473ms, lr: 3.1199997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:43,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.0% | | 5.43084 samples/s/p 6:34:46 } +2024-07-25 18:32:46,217 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 172/ 1625], loss: 1.297, per_step_time: 1472ms, lr: 3.156923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:46,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43368 samples/s/p 6:34:31 } +2024-07-25 18:32:49,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 174/ 1625], loss: 1.353, per_step_time: 1472ms, lr: 3.1938462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:49,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43219 samples/s/p 6:34:35 } +2024-07-25 18:32:52,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 176/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 3.2307692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:52,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43197 samples/s/p 6:34:33 } +2024-07-25 18:32:55,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 178/ 1625], loss: 1.353, per_step_time: 1471ms, lr: 3.2676921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:55,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43544 samples/s/p 6:34:15 } +2024-07-25 18:32:58,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 180/ 1625], loss: 1.463, per_step_time: 1472ms, lr: 3.3046153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:32:58,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43338 samples/s/p 6:34:21 } +2024-07-25 18:33:00,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 182/ 1625], loss: 1.410, per_step_time: 1473ms, lr: 3.3415383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:00,978 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.42969 samples/s/p 6:34:34 } +2024-07-25 18:33:03,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 184/ 1625], loss: 1.516, per_step_time: 1471ms, lr: 3.3784615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:03,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.43793 samples/s/p 6:33:55 } +2024-07-25 18:33:06,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 186/ 1625], loss: 1.353, per_step_time: 1473ms, lr: 3.4153845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:06,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.1% | | 5.42922 samples/s/p 6:34:30 } +2024-07-25 18:33:09,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 188/ 1625], loss: 1.366, per_step_time: 1472ms, lr: 3.4523075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:09,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43398 samples/s/p 6:34:06 } +2024-07-25 18:33:12,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 190/ 1625], loss: 1.327, per_step_time: 1473ms, lr: 3.4892307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:12,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43094 samples/s/p 6:34:17 } +2024-07-25 18:33:15,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 192/ 1625], loss: 1.355, per_step_time: 1473ms, lr: 3.5261537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:15,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.42758 samples/s/p 6:34:28 } +2024-07-25 18:33:18,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 194/ 1625], loss: 1.304, 
per_step_time: 1472ms, lr: 3.5630767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:18,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43271 samples/s/p 6:34:03 } +2024-07-25 18:33:21,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 196/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 3.6e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:21,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43463 samples/s/p 6:33:52 } +2024-07-25 18:33:24,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 198/ 1625], loss: 1.411, per_step_time: 1473ms, lr: 3.6369229e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:24,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43065 samples/s/p 6:34:06 } +2024-07-25 18:33:27,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 200/ 1625], loss: 1.502, per_step_time: 1472ms, lr: 3.6738459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:27,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43423 samples/s/p 6:33:48 } +2024-07-25 18:33:30,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 202/ 1625], loss: 1.411, per_step_time: 1471ms, lr: 3.710769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:30,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.2% | | 5.43747 samples/s/p 6:33:30 } +2024-07-25 18:33:33,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 204/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 3.747692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:33,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.43251 samples/s/p 6:33:49 } +2024-07-25 18:33:36,403 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 206/ 1625], loss: 1.352, per_step_time: 1473ms, lr: 3.784615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:36,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.42881 samples/s/p 6:34:02 } +2024-07-25 18:33:39,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 208/ 1625], loss: 1.262, per_step_time: 1472ms, lr: 3.8215385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:39,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.43305 samples/s/p 6:33:41 } +2024-07-25 18:33:42,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 210/ 1625], loss: 1.391, per_step_time: 1473ms, lr: 3.8584612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:42,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.42954 samples/s/p 6:33:53 } +2024-07-25 18:33:45,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 212/ 1625], loss: 1.315, per_step_time: 1470ms, lr: 3.8953845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:45,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.43972 samples/s/p 6:33:06 } +2024-07-25 18:33:48,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 214/ 1625], loss: 1.257, per_step_time: 1474ms, lr: 3.932307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:48,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.42567 samples/s/p 6:34:04 } +2024-07-25 18:33:51,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 216/ 1625], loss: 1.471, per_step_time: 1470ms, lr: 3.969231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:51,161 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.44107 samples/s/p 6:32:54 } +2024-07-25 18:33:54,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 218/ 1625], loss: 1.347, per_step_time: 1473ms, lr: 4.0061536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:54,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.3% | | 5.42921 samples/s/p 6:33:43 } +2024-07-25 18:33:57,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 220/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 4.043077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:33:57,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43673 samples/s/p 6:33:07 } +2024-07-25 18:34:00,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 222/ 1625], loss: 1.240, per_step_time: 1474ms, lr: 4.0799996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:00,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.42667 samples/s/p 6:33:48 } +2024-07-25 18:34:02,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 224/ 1625], loss: 1.427, per_step_time: 1471ms, lr: 4.116923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:02,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43616 samples/s/p 6:33:04 } +2024-07-25 18:34:05,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 226/ 1625], loss: 1.358, per_step_time: 1471ms, lr: 4.153846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:05,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43745 samples/s/p 6:32:55 } +2024-07-25 18:34:08,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 228/ 1625], loss: 1.477, 
per_step_time: 1472ms, lr: 4.1907692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:08,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43417 samples/s/p 6:33:07 } +2024-07-25 18:34:11,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 230/ 1625], loss: 1.229, per_step_time: 1474ms, lr: 4.227692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:11,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.42657 samples/s/p 6:33:37 } +2024-07-25 18:34:14,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 232/ 1625], loss: 1.269, per_step_time: 1473ms, lr: 4.264615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:14,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43054 samples/s/p 6:33:16 } +2024-07-25 18:34:17,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 234/ 1625], loss: 1.391, per_step_time: 1472ms, lr: 4.301538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:17,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.4% | | 5.43293 samples/s/p 6:33:03 } +2024-07-25 18:34:20,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 236/ 1625], loss: 1.328, per_step_time: 1475ms, lr: 4.338461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:20,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.42242 samples/s/p 6:33:46 } +2024-07-25 18:34:23,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 238/ 1625], loss: 1.468, per_step_time: 1472ms, lr: 4.375385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:23,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43466 samples/s/p 6:32:50 } +2024-07-25 18:34:26,592 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 240/ 1625], loss: 1.321, per_step_time: 1472ms, lr: 4.4123076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:26,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43378 samples/s/p 6:32:51 } +2024-07-25 18:34:29,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 242/ 1625], loss: 1.520, per_step_time: 1475ms, lr: 4.449231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:29,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.42181 samples/s/p 6:33:40 } +2024-07-25 18:34:32,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 244/ 1625], loss: 1.365, per_step_time: 1473ms, lr: 4.4861536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:32,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.42886 samples/s/p 6:33:06 } +2024-07-25 18:34:35,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 246/ 1625], loss: 1.449, per_step_time: 1473ms, lr: 4.5230768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:35,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43056 samples/s/p 6:32:56 } +2024-07-25 18:34:38,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 248/ 1625], loss: 1.269, per_step_time: 1471ms, lr: 4.5599995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:38,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43803 samples/s/p 6:32:20 } +2024-07-25 18:34:41,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 250/ 1625], loss: 1.362, per_step_time: 1473ms, lr: 4.596923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:41,360 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.5% | | 5.43036 samples/s/p 6:32:51 } +2024-07-25 18:34:44,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 252/ 1625], loss: 1.268, per_step_time: 1472ms, lr: 4.633846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:44,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43477 samples/s/p 6:32:29 } +2024-07-25 18:34:47,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 254/ 1625], loss: 1.380, per_step_time: 1472ms, lr: 4.670769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:47,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43215 samples/s/p 6:32:37 } +2024-07-25 18:34:50,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 256/ 1625], loss: 1.206, per_step_time: 1469ms, lr: 4.707692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:50,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.44257 samples/s/p 6:31:49 } +2024-07-25 18:34:53,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 258/ 1625], loss: 1.435, per_step_time: 1471ms, lr: 4.744615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:53,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43479 samples/s/p 6:32:20 } +2024-07-25 18:34:56,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 260/ 1625], loss: 1.525, per_step_time: 1471ms, lr: 4.7815383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:56,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43687 samples/s/p 6:32:08 } +2024-07-25 18:34:59,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 262/ 1625], loss: 1.477, 
per_step_time: 1472ms, lr: 4.8184615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:34:59,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43366 samples/s/p 6:32:19 } +2024-07-25 18:35:02,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 264/ 1625], loss: 1.081, per_step_time: 1473ms, lr: 4.8553843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:02,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43094 samples/s/p 6:32:28 } +2024-07-25 18:35:04,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 266/ 1625], loss: 1.357, per_step_time: 1472ms, lr: 4.8923075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:04,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43241 samples/s/p 6:32:18 } +2024-07-25 18:35:07,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 268/ 1625], loss: 1.425, per_step_time: 1472ms, lr: 4.9292303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:07,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.6% | | 5.43191 samples/s/p 6:32:17 } +2024-07-25 18:35:10,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 270/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 4.9661535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:10,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43530 samples/s/p 6:32:00 } +2024-07-25 18:35:13,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 272/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 5.0030767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:13,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43460 samples/s/p 6:32:00 } +2024-07-25 18:35:16,776 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 274/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 5.04e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:16,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43173 samples/s/p 6:32:09 } +2024-07-25 18:35:19,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 276/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 5.0769227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:19,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43442 samples/s/p 6:31:55 } +2024-07-25 18:35:22,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 278/ 1625], loss: 1.270, per_step_time: 1475ms, lr: 5.113846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:22,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.42350 samples/s/p 6:32:39 } +2024-07-25 18:35:25,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 280/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 5.150769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:25,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43494 samples/s/p 6:31:47 } +2024-07-25 18:35:28,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 282/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 5.187692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:28,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43516 samples/s/p 6:31:43 } +2024-07-25 18:35:31,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 284/ 1625], loss: 1.393, per_step_time: 1472ms, lr: 5.2246155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:31,538 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.7% | | 5.43391 samples/s/p 6:31:45 } +2024-07-25 18:35:34,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 286/ 1625], loss: 1.344, per_step_time: 1471ms, lr: 5.2615383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:34,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43706 samples/s/p 6:31:29 } +2024-07-25 18:35:37,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 288/ 1625], loss: 1.358, per_step_time: 1472ms, lr: 5.2984615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:37,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43478 samples/s/p 6:31:36 } +2024-07-25 18:35:40,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 290/ 1625], loss: 1.326, per_step_time: 1471ms, lr: 5.3353842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:40,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43628 samples/s/p 6:31:26 } +2024-07-25 18:35:43,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 292/ 1625], loss: 1.333, per_step_time: 1474ms, lr: 5.3723074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:43,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.42721 samples/s/p 6:32:02 } +2024-07-25 18:35:46,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 294/ 1625], loss: 1.196, per_step_time: 1474ms, lr: 5.4092307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:46,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.42709 samples/s/p 6:32:00 } +2024-07-25 18:35:49,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 296/ 1625], loss: 1.371, 
per_step_time: 1472ms, lr: 5.446154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:49,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43311 samples/s/p 6:31:31 } +2024-07-25 18:35:52,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 298/ 1625], loss: 1.318, per_step_time: 1472ms, lr: 5.4830766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:52,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.43311 samples/s/p 6:31:28 } +2024-07-25 18:35:55,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 300/ 1625], loss: 1.461, per_step_time: 1473ms, lr: 5.52e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:55,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.8% | | 5.42872 samples/s/p 6:31:44 } +2024-07-25 18:35:58,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 302/ 1625], loss: 1.233, per_step_time: 1470ms, lr: 5.5569226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:35:58,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43856 samples/s/p 6:30:59 } +2024-07-25 18:36:01,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 304/ 1625], loss: 1.507, per_step_time: 1472ms, lr: 5.593846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:01,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43322 samples/s/p 6:31:19 } +2024-07-25 18:36:04,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 306/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 5.630769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:04,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43720 samples/s/p 6:30:59 } +2024-07-25 18:36:06,956 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 308/ 1625], loss: 1.269, per_step_time: 1471ms, lr: 5.667692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:06,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43644 samples/s/p 6:30:59 } +2024-07-25 18:36:09,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 310/ 1625], loss: 1.369, per_step_time: 1471ms, lr: 5.704615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:09,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43677 samples/s/p 6:30:55 } +2024-07-25 18:36:12,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 312/ 1625], loss: 1.359, per_step_time: 1473ms, lr: 5.741538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:12,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43085 samples/s/p 6:31:17 } +2024-07-25 18:36:15,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 314/ 1625], loss: 1.310, per_step_time: 1471ms, lr: 5.778461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:15,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43733 samples/s/p 6:30:46 } +2024-07-25 18:36:18,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 316/ 1625], loss: 1.264, per_step_time: 1470ms, lr: 5.8153846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:18,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 1.9% | | 5.43879 samples/s/p 6:30:37 } +2024-07-25 18:36:21,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 318/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 5.8523074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:21,709 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.43717 samples/s/p 6:30:41 } +2024-07-25 18:36:24,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 320/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 5.8892306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:24,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.43226 samples/s/p 6:30:59 } +2024-07-25 18:36:27,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 322/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 5.926154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:27,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.43188 samples/s/p 6:30:58 } +2024-07-25 18:36:30,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 324/ 1625], loss: 1.425, per_step_time: 1470ms, lr: 5.9630765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:30,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% | | 5.43928 samples/s/p 6:30:23 } +2024-07-25 18:36:33,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 326/ 1625], loss: 1.305, per_step_time: 1470ms, lr: 5.9999998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:33,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.43902 samples/s/p 6:30:21 } +2024-07-25 18:36:36,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 328/ 1625], loss: 1.466, per_step_time: 1472ms, lr: 6.036923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:36,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.43299 samples/s/p 6:30:44 } +2024-07-25 18:36:39,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 330/ 1625], loss: 1.211, 
per_step_time: 1471ms, lr: 6.073846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:39,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.43704 samples/s/p 6:30:24 } +2024-07-25 18:36:42,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 332/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 6.110769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:42,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.0% |█ | 5.43147 samples/s/p 6:30:45 } +2024-07-25 18:36:45,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 334/ 1625], loss: 1.356, per_step_time: 1472ms, lr: 6.147692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:45,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43390 samples/s/p 6:30:32 } +2024-07-25 18:36:48,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 336/ 1625], loss: 1.280, per_step_time: 1473ms, lr: 6.184615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:48,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43074 samples/s/p 6:30:42 } +2024-07-25 18:36:51,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 338/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 6.221538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:51,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43612 samples/s/p 6:30:16 } +2024-07-25 18:36:54,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 340/ 1625], loss: 1.328, per_step_time: 1473ms, lr: 6.2584613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:54,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.42781 samples/s/p 6:30:49 } +2024-07-25 18:36:57,123 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 342/ 1625], loss: 1.366, per_step_time: 1470ms, lr: 6.2953845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:36:57,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43890 samples/s/p 6:29:58 } +2024-07-25 18:37:00,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 344/ 1625], loss: 1.173, per_step_time: 1473ms, lr: 6.3323073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:00,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43066 samples/s/p 6:30:31 } +2024-07-25 18:37:03,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 346/ 1625], loss: 1.202, per_step_time: 1473ms, lr: 6.3692305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:03,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43097 samples/s/p 6:30:27 } +2024-07-25 18:37:05,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 348/ 1625], loss: 1.302, per_step_time: 1472ms, lr: 6.4061533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:05,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.1% |█ | 5.43181 samples/s/p 6:30:20 } +2024-07-25 18:37:08,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 350/ 1625], loss: 1.340, per_step_time: 1471ms, lr: 6.443077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:08,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43737 samples/s/p 6:29:53 } +2024-07-25 18:37:11,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 352/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 6.4799997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:11,883 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43299 samples/s/p 6:30:09 } +2024-07-25 18:37:14,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 354/ 1625], loss: 1.081, per_step_time: 1473ms, lr: 6.516923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:14,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.42775 samples/s/p 6:30:29 } +2024-07-25 18:37:17,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 356/ 1625], loss: 1.244, per_step_time: 1471ms, lr: 6.5538457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:17,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43838 samples/s/p 6:29:40 } +2024-07-25 18:37:20,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 358/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 6.590769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:20,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43403 samples/s/p 6:29:56 } +2024-07-25 18:37:23,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 360/ 1625], loss: 1.308, per_step_time: 1474ms, lr: 6.6276916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:23,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.42568 samples/s/p 6:30:29 } +2024-07-25 18:37:26,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 362/ 1625], loss: 1.228, per_step_time: 1472ms, lr: 6.6646153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:26,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.43450 samples/s/p 6:29:48 } +2024-07-25 18:37:29,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 364/ 1625], loss: 
1.370, per_step_time: 1474ms, lr: 6.7015385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:29,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.2% |█ | 5.42637 samples/s/p 6:30:20 } +2024-07-25 18:37:32,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 366/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 6.7384613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:32,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43816 samples/s/p 6:29:26 } +2024-07-25 18:37:35,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 368/ 1625], loss: 1.162, per_step_time: 1474ms, lr: 6.7753845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:35,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.42720 samples/s/p 6:30:10 } +2024-07-25 18:37:38,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 370/ 1625], loss: 1.162, per_step_time: 1470ms, lr: 6.812307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:38,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43895 samples/s/p 6:29:17 } +2024-07-25 18:37:41,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 372/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 6.8492304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:41,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43627 samples/s/p 6:29:26 } +2024-07-25 18:37:44,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 374/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 6.8861536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:44,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43633 samples/s/p 6:29:22 } +2024-07-25 
18:37:47,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 376/ 1625], loss: 1.060, per_step_time: 1471ms, lr: 6.923077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:47,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43762 samples/s/p 6:29:14 } +2024-07-25 18:37:50,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 378/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 6.9599996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:50,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43455 samples/s/p 6:29:24 } +2024-07-25 18:37:53,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 380/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 6.996923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:53,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.3% |█ | 5.43775 samples/s/p 6:29:07 } +2024-07-25 18:37:56,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 382/ 1625], loss: 1.285, per_step_time: 1473ms, lr: 7.0338456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:56,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.42971 samples/s/p 6:29:39 } +2024-07-25 18:37:59,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 384/ 1625], loss: 1.384, per_step_time: 1473ms, lr: 7.0707692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:37:59,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.42845 samples/s/p 6:29:41 } +2024-07-25 18:38:02,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 386/ 1625], loss: 1.272, per_step_time: 1475ms, lr: 7.107692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:02,069 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.42367 samples/s/p 6:29:59 } +2024-07-25 18:38:05,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 388/ 1625], loss: 1.170, per_step_time: 1483ms, lr: 7.144615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:05,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.39268 samples/s/p 6:32:11 } +2024-07-25 18:38:07,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 390/ 1625], loss: 1.440, per_step_time: 1471ms, lr: 7.181538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:07,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.43632 samples/s/p 6:28:59 } +2024-07-25 18:38:10,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 392/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 7.218461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:10,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.43729 samples/s/p 6:28:52 } +2024-07-25 18:38:13,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 394/ 1625], loss: 1.288, per_step_time: 1473ms, lr: 7.255384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:13,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.43065 samples/s/p 6:29:17 } +2024-07-25 18:38:16,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 396/ 1625], loss: 1.116, per_step_time: 1473ms, lr: 7.2923076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:16,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.42836 samples/s/p 6:29:24 } +2024-07-25 18:38:19,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 398/ 1625], loss: 
1.331, per_step_time: 1470ms, lr: 7.3292304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:19,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.4% |█ | 5.44083 samples/s/p 6:28:28 } +2024-07-25 18:38:22,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 400/ 1625], loss: 1.191, per_step_time: 1473ms, lr: 7.3661536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:22,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.42923 samples/s/p 6:29:15 } +2024-07-25 18:38:25,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 402/ 1625], loss: 1.334, per_step_time: 1474ms, lr: 7.4030763e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:25,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.42501 samples/s/p 6:29:30 } +2024-07-25 18:38:28,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 404/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 7.4399995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:28,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43539 samples/s/p 6:28:42 } +2024-07-25 18:38:31,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 406/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 7.4769227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:31,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43994 samples/s/p 6:28:20 } +2024-07-25 18:38:34,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 408/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 7.5138464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:34,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43264 samples/s/p 6:28:48 } +2024-07-25 
18:38:37,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 410/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 7.5507687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:37,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43432 samples/s/p 6:28:38 } +2024-07-25 18:38:40,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 412/ 1625], loss: 1.337, per_step_time: 1471ms, lr: 7.587692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:40,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43567 samples/s/p 6:28:29 } +2024-07-25 18:38:43,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 414/ 1625], loss: 1.223, per_step_time: 1470ms, lr: 7.624615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:43,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.5% |█ | 5.43913 samples/s/p 6:28:11 } +2024-07-25 18:38:46,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 416/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 7.661539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:46,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.43938 samples/s/p 6:28:07 } +2024-07-25 18:38:49,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 418/ 1625], loss: 1.314, per_step_time: 1470ms, lr: 7.698461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:49,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.44165 samples/s/p 6:27:55 } +2024-07-25 18:38:52,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 420/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 7.735384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:52,256 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.43611 samples/s/p 6:28:16 } +2024-07-25 18:38:55,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 422/ 1625], loss: 1.208, per_step_time: 1470ms, lr: 7.772307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:55,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.43972 samples/s/p 6:27:57 } +2024-07-25 18:38:58,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 424/ 1625], loss: 1.187, per_step_time: 1474ms, lr: 7.809231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:38:58,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.42439 samples/s/p 6:29:00 } +2024-07-25 18:39:01,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 426/ 1625], loss: 1.136, per_step_time: 1477ms, lr: 7.8461535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:01,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.41425 samples/s/p 6:29:41 } +2024-07-25 18:39:04,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 428/ 1625], loss: 1.281, per_step_time: 1473ms, lr: 7.883076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:04,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.42982 samples/s/p 6:28:31 } +2024-07-25 18:39:07,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 430/ 1625], loss: 1.191, per_step_time: 1469ms, lr: 7.92e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:07,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.6% |█ | 5.44310 samples/s/p 6:27:31 } +2024-07-25 18:39:09,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 432/ 1625], loss: 1.374, 
per_step_time: 1473ms, lr: 7.956923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:09,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43043 samples/s/p 6:28:22 } +2024-07-25 18:39:12,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 434/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 7.993845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:12,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43911 samples/s/p 6:27:42 } +2024-07-25 18:39:15,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 436/ 1625], loss: 1.290, per_step_time: 1470ms, lr: 8.030769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:15,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.44124 samples/s/p 6:27:30 } +2024-07-25 18:39:18,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 438/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 8.067692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:18,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43463 samples/s/p 6:27:55 } +2024-07-25 18:39:21,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 440/ 1625], loss: 1.366, per_step_time: 1471ms, lr: 8.1046155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:21,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43589 samples/s/p 6:27:47 } +2024-07-25 18:39:24,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 442/ 1625], loss: 1.638, per_step_time: 1472ms, lr: 8.141537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:24,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43458 samples/s/p 6:27:50 } +2024-07-25 18:39:27,675 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 444/ 1625], loss: 1.360, per_step_time: 1471ms, lr: 8.178461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:27,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43740 samples/s/p 6:27:35 } +2024-07-25 18:39:30,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 446/ 1625], loss: 1.360, per_step_time: 1471ms, lr: 8.215385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:30,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.7% |█ | 5.43697 samples/s/p 6:27:34 } +2024-07-25 18:39:33,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 448/ 1625], loss: 1.467, per_step_time: 1472ms, lr: 8.252307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:33,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.43150 samples/s/p 6:27:54 } +2024-07-25 18:39:36,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 450/ 1625], loss: 1.318, per_step_time: 1473ms, lr: 8.289231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:36,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.42901 samples/s/p 6:28:02 } +2024-07-25 18:39:39,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 452/ 1625], loss: 1.272, per_step_time: 1470ms, lr: 8.326153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:39,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.44038 samples/s/p 6:27:10 } +2024-07-25 18:39:42,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 454/ 1625], loss: 1.189, per_step_time: 1482ms, lr: 8.363077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:42,451 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.39796 samples/s/p 6:30:10 } +2024-07-25 18:39:45,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 456/ 1625], loss: 1.150, per_step_time: 1472ms, lr: 8.399999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:45,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.43277 samples/s/p 6:27:37 } +2024-07-25 18:39:48,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 458/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 8.436923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:48,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.42818 samples/s/p 6:27:54 } +2024-07-25 18:39:51,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 460/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 8.473846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:51,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.43466 samples/s/p 6:27:23 } +2024-07-25 18:39:54,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 462/ 1625], loss: 1.141, per_step_time: 1473ms, lr: 8.510769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:54,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.8% |█ | 5.43061 samples/s/p 6:27:37 } +2024-07-25 18:39:57,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 464/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 8.547692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:39:57,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43746 samples/s/p 6:27:05 } +2024-07-25 18:40:00,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 466/ 1625], loss: 1.266, 
per_step_time: 1471ms, lr: 8.584615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:00,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43691 samples/s/p 6:27:04 } +2024-07-25 18:40:03,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 468/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 8.621538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:03,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43708 samples/s/p 6:27:01 } +2024-07-25 18:40:06,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 470/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 8.658461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:06,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43702 samples/s/p 6:26:58 } +2024-07-25 18:40:09,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 472/ 1625], loss: 1.276, per_step_time: 1472ms, lr: 8.695384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:09,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43263 samples/s/p 6:27:14 } +2024-07-25 18:40:11,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 474/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 8.732308e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:11,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.43561 samples/s/p 6:26:58 } +2024-07-25 18:40:14,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 476/ 1625], loss: 1.107, per_step_time: 1475ms, lr: 8.76923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:14,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.42027 samples/s/p 6:28:01 } +2024-07-25 18:40:17,876 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 478/ 1625], loss: 1.351, per_step_time: 1473ms, lr: 8.806153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:17,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 2.9% |█ | 5.42959 samples/s/p 6:27:18 } +2024-07-25 18:40:20,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 480/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 8.843077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:20,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.44005 samples/s/p 6:26:30 } +2024-07-25 18:40:23,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 482/ 1625], loss: 1.300, per_step_time: 1472ms, lr: 8.88e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:23,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43323 samples/s/p 6:26:57 } +2024-07-25 18:40:26,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 484/ 1625], loss: 1.342, per_step_time: 1477ms, lr: 8.9169225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:26,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.41543 samples/s/p 6:28:10 } +2024-07-25 18:40:29,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 486/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 8.953845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:29,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43861 samples/s/p 6:26:28 } +2024-07-25 18:40:32,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 488/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 8.990769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:32,641 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43118 samples/s/p 6:26:57 } +2024-07-25 18:40:35,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 490/ 1625], loss: 1.332, per_step_time: 1470ms, lr: 9.027692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:35,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43848 samples/s/p 6:26:22 } +2024-07-25 18:40:38,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 492/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 9.064615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:38,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43161 samples/s/p 6:26:49 } +2024-07-25 18:40:41,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 494/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 9.101538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:41,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.0% |█ | 5.43634 samples/s/p 6:26:26 } +2024-07-25 18:40:44,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 496/ 1625], loss: 1.359, per_step_time: 1471ms, lr: 9.138461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:44,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43756 samples/s/p 6:26:18 } +2024-07-25 18:40:47,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 498/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 9.175385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:47,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43250 samples/s/p 6:26:36 } +2024-07-25 18:40:50,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 500/ 1625], loss: 1.235, 
per_step_time: 1472ms, lr: 9.212307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:50,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43471 samples/s/p 6:26:24 } +2024-07-25 18:40:53,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 502/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 9.24923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:53,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43143 samples/s/p 6:26:35 } +2024-07-25 18:40:56,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 504/ 1625], loss: 1.320, per_step_time: 1473ms, lr: 9.286154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:56,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.42997 samples/s/p 6:26:38 } +2024-07-25 18:40:59,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 506/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 9.3230765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:40:59,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43442 samples/s/p 6:26:16 } +2024-07-25 18:41:02,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 508/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 9.36e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:02,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43846 samples/s/p 6:25:56 } +2024-07-25 18:41:05,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 510/ 1625], loss: 1.300, per_step_time: 1471ms, lr: 9.396922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:05,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.1% |█ | 5.43763 samples/s/p 6:25:57 } +2024-07-25 18:41:08,048 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 512/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 9.433846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:08,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.44140 samples/s/p 6:25:38 } +2024-07-25 18:41:11,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 514/ 1625], loss: 1.214, per_step_time: 1482ms, lr: 9.470769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:11,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.39499 samples/s/p 6:28:54 } +2024-07-25 18:41:13,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 516/ 1625], loss: 1.314, per_step_time: 1472ms, lr: 9.507692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:13,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.43330 samples/s/p 6:26:06 } +2024-07-25 18:41:16,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 518/ 1625], loss: 1.171, per_step_time: 1470ms, lr: 9.544615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:16,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.43997 samples/s/p 6:25:35 } +2024-07-25 18:41:19,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 520/ 1625], loss: 1.191, per_step_time: 1475ms, lr: 9.581538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:19,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.42006 samples/s/p 6:26:57 } +2024-07-25 18:41:22,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 522/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 9.618461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:22,832 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.43395 samples/s/p 6:25:55 } +2024-07-25 18:41:25,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 524/ 1625], loss: 0.990, per_step_time: 1471ms, lr: 9.655385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:25,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.43531 samples/s/p 6:25:46 } +2024-07-25 18:41:28,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 526/ 1625], loss: 1.433, per_step_time: 1471ms, lr: 9.692307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:28,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.43519 samples/s/p 6:25:44 } +2024-07-25 18:41:31,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 528/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 9.72923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:31,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.2% |█ | 5.43901 samples/s/p 6:25:24 } +2024-07-25 18:41:34,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 530/ 1625], loss: 1.409, per_step_time: 1470ms, lr: 9.766153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:34,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43858 samples/s/p 6:25:23 } +2024-07-25 18:41:37,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 532/ 1625], loss: 1.187, per_step_time: 1470ms, lr: 9.803077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:37,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43903 samples/s/p 6:25:18 } +2024-07-25 18:41:40,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 534/ 1625], loss: 1.323, 
per_step_time: 1470ms, lr: 9.839999e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:40,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.44177 samples/s/p 6:25:04 } +2024-07-25 18:41:43,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 536/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 9.876922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:43,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43505 samples/s/p 6:25:29 } +2024-07-25 18:41:46,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 538/ 1625], loss: 1.332, per_step_time: 1472ms, lr: 9.913846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:46,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43277 samples/s/p 6:25:36 } +2024-07-25 18:41:49,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 540/ 1625], loss: 1.340, per_step_time: 1470ms, lr: 9.950769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:49,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43923 samples/s/p 6:25:06 } +2024-07-25 18:41:52,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 542/ 1625], loss: 1.315, per_step_time: 1475ms, lr: 9.9876925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:52,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.42216 samples/s/p 6:26:15 } +2024-07-25 18:41:55,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 544/ 1625], loss: 1.386, per_step_time: 1472ms, lr: 1.0024614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:55,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.3% |█ | 5.43276 samples/s/p 6:25:27 } +2024-07-25 18:41:58,241 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 546/ 1625], loss: 1.357, per_step_time: 1472ms, lr: 1.0061538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:41:58,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43143 samples/s/p 6:25:30 } +2024-07-25 18:42:01,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 548/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 1.0098462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:01,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43236 samples/s/p 6:25:23 } +2024-07-25 18:42:04,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 550/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 1.0135384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:04,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43394 samples/s/p 6:25:13 } +2024-07-25 18:42:07,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 552/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 1.0172307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:07,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43565 samples/s/p 6:25:03 } +2024-07-25 18:42:10,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 554/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 1.020923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:10,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43502 samples/s/p 6:25:03 } +2024-07-25 18:42:12,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 556/ 1625], loss: 1.024, per_step_time: 1472ms, lr: 1.0246154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:13,000 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43142 samples/s/p 6:25:15 } +2024-07-25 18:42:15,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 558/ 1625], loss: 1.404, per_step_time: 1472ms, lr: 1.0283077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:15,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43155 samples/s/p 6:25:12 } +2024-07-25 18:42:18,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 560/ 1625], loss: 1.367, per_step_time: 1472ms, lr: 1.0319999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:18,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.4% |█ | 5.43155 samples/s/p 6:25:09 } +2024-07-25 18:42:21,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 562/ 1625], loss: 1.342, per_step_time: 1472ms, lr: 1.0356923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:21,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43356 samples/s/p 6:24:57 } +2024-07-25 18:42:24,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 564/ 1625], loss: 1.162, per_step_time: 1470ms, lr: 1.03938455e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:24,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.44003 samples/s/p 6:24:27 } +2024-07-25 18:42:27,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 566/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 1.0430769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:27,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43942 samples/s/p 6:24:27 } +2024-07-25 18:42:30,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 568/ 1625], loss: 
1.177, per_step_time: 1471ms, lr: 1.0467691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:30,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43587 samples/s/p 6:24:39 } +2024-07-25 18:42:33,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 570/ 1625], loss: 1.408, per_step_time: 1472ms, lr: 1.0504615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:33,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43307 samples/s/p 6:24:48 } +2024-07-25 18:42:36,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 572/ 1625], loss: 1.139, per_step_time: 1473ms, lr: 1.0541538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:36,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.42751 samples/s/p 6:25:08 } +2024-07-25 18:42:39,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 574/ 1625], loss: 1.327, per_step_time: 1472ms, lr: 1.0578461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:39,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.43190 samples/s/p 6:24:47 } +2024-07-25 18:42:42,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 576/ 1625], loss: 1.260, per_step_time: 1474ms, lr: 1.0615384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:42,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.5% |█ | 5.42722 samples/s/p 6:25:04 } +2024-07-25 18:42:45,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 578/ 1625], loss: 1.248, per_step_time: 1475ms, lr: 1.0652307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:45,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.42097 samples/s/p 6:25:27 } +2024-07-25 
18:42:48,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 580/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.068923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:48,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43355 samples/s/p 6:24:31 } +2024-07-25 18:42:51,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 582/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 1.0726154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:51,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43416 samples/s/p 6:24:25 } +2024-07-25 18:42:54,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 584/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 1.0763077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:54,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43440 samples/s/p 6:24:21 } +2024-07-25 18:42:57,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 586/ 1625], loss: 1.369, per_step_time: 1471ms, lr: 1.07999995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:42:57,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43820 samples/s/p 6:24:02 } +2024-07-25 18:43:00,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 588/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.0836922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:00,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43573 samples/s/p 6:24:10 } +2024-07-25 18:43:03,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 590/ 1625], loss: 1.279, per_step_time: 1473ms, lr: 1.0873846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:03,184 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.42981 samples/s/p 6:24:32 } +2024-07-25 18:43:06,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 592/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 1.091077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:06,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.6% |█ | 5.43538 samples/s/p 6:24:06 } +2024-07-25 18:43:09,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 594/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 1.0947691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:09,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43262 samples/s/p 6:24:14 } +2024-07-25 18:43:12,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 596/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 1.0984615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:12,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.42805 samples/s/p 6:24:31 } +2024-07-25 18:43:14,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 598/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.1021538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:14,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43495 samples/s/p 6:23:59 } +2024-07-25 18:43:17,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 600/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 1.10584615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:17,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.42842 samples/s/p 6:24:23 } +2024-07-25 18:43:20,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 602/ 1625], loss: 
1.235, per_step_time: 1471ms, lr: 1.1095383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:20,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43565 samples/s/p 6:23:50 } +2024-07-25 18:43:23,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 604/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 1.1132307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:23,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43782 samples/s/p 6:23:38 } +2024-07-25 18:43:26,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 606/ 1625], loss: 1.288, per_step_time: 1471ms, lr: 1.1169231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:26,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43735 samples/s/p 6:23:37 } +2024-07-25 18:43:29,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 608/ 1625], loss: 1.268, per_step_time: 1471ms, lr: 1.1206153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:29,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.7% |█ | 5.43559 samples/s/p 6:23:41 } +2024-07-25 18:43:32,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 610/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 1.1243076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:32,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43688 samples/s/p 6:23:33 } +2024-07-25 18:43:35,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 612/ 1625], loss: 1.093, per_step_time: 1472ms, lr: 1.1279999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:35,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43426 samples/s/p 6:23:41 } +2024-07-25 
18:43:38,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 614/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 1.1316923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:38,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43397 samples/s/p 6:23:39 } +2024-07-25 18:43:41,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 616/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.1353846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:41,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43567 samples/s/p 6:23:29 } +2024-07-25 18:43:44,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 618/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 1.1390768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:44,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43820 samples/s/p 6:23:15 } +2024-07-25 18:43:47,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 620/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 1.1427692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:47,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43203 samples/s/p 6:23:39 } +2024-07-25 18:43:50,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 622/ 1625], loss: 1.363, per_step_time: 1472ms, lr: 1.14646145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:50,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.43369 samples/s/p 6:23:29 } +2024-07-25 18:43:53,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 624/ 1625], loss: 1.160, per_step_time: 1475ms, lr: 1.1501538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:53,361 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.8% |█ | 5.42301 samples/s/p 6:24:11 } +2024-07-25 18:43:56,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 626/ 1625], loss: 1.219, per_step_time: 1470ms, lr: 1.1538462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:56,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.44171 samples/s/p 6:22:49 } +2024-07-25 18:43:59,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 628/ 1625], loss: 1.308, per_step_time: 1472ms, lr: 1.1575384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:43:59,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43414 samples/s/p 6:23:18 } +2024-07-25 18:44:02,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 630/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 1.1612307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:02,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43172 samples/s/p 6:23:25 } +2024-07-25 18:44:05,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 632/ 1625], loss: 1.094, per_step_time: 1476ms, lr: 1.164923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:05,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.41980 samples/s/p 6:24:13 } +2024-07-25 18:44:08,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 634/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 1.1686154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:08,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43487 samples/s/p 6:23:06 } +2024-07-25 18:44:11,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 636/ 1625], loss: 
1.196, per_step_time: 1472ms, lr: 1.1723076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:11,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43220 samples/s/p 6:23:14 } +2024-07-25 18:44:14,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 638/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 1.1759999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:14,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.43495 samples/s/p 6:23:00 } +2024-07-25 18:44:16,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 640/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 1.1796923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:16,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 3.9% |█ | 5.44118 samples/s/p 6:22:30 } +2024-07-25 18:44:19,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 642/ 1625], loss: 1.212, per_step_time: 1472ms, lr: 1.1833846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:19,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.43477 samples/s/p 6:22:55 } +2024-07-25 18:44:22,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 644/ 1625], loss: 1.335, per_step_time: 1472ms, lr: 1.18707685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:22,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.43173 samples/s/p 6:23:04 } +2024-07-25 18:44:25,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 646/ 1625], loss: 1.225, per_step_time: 1470ms, lr: 1.1907691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:25,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.44001 samples/s/p 6:22:26 } +2024-07-25 
18:44:28,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 648/ 1625], loss: 1.067, per_step_time: 1471ms, lr: 1.1944615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:28,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |█ | 5.43704 samples/s/p 6:22:36 } +2024-07-25 18:44:31,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 650/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 1.1981539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:31,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43590 samples/s/p 6:22:38 } +2024-07-25 18:44:34,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 652/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 1.201846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:34,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43020 samples/s/p 6:22:59 } +2024-07-25 18:44:37,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 654/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 1.2055384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:37,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43391 samples/s/p 6:22:41 } +2024-07-25 18:44:40,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 656/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 1.2092307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:40,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43516 samples/s/p 6:22:32 } +2024-07-25 18:44:43,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 658/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 1.21292305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:43,532 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.0% |██ | 5.43322 samples/s/p 6:22:38 } +2024-07-25 18:44:46,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 660/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 1.2166153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:46,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43861 samples/s/p 6:22:12 } +2024-07-25 18:44:49,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 662/ 1625], loss: 1.351, per_step_time: 1473ms, lr: 1.2203076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:49,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.42956 samples/s/p 6:22:47 } +2024-07-25 18:44:52,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 664/ 1625], loss: 1.231, per_step_time: 1470ms, lr: 1.224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:52,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.44185 samples/s/p 6:21:52 } +2024-07-25 18:44:55,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 666/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 1.22769225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:55,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.42806 samples/s/p 6:22:48 } +2024-07-25 18:44:58,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 668/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 1.2313846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:44:58,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43363 samples/s/p 6:22:21 } +2024-07-25 18:45:01,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 670/ 1625], 
loss: 1.173, per_step_time: 1472ms, lr: 1.2350769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:01,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43323 samples/s/p 6:22:20 } +2024-07-25 18:45:04,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 672/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 1.2387692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:04,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43169 samples/s/p 6:22:23 } +2024-07-25 18:45:07,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 674/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 1.2424615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:07,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.1% |██ | 5.43575 samples/s/p 6:22:03 } +2024-07-25 18:45:10,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 676/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 1.2461538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:10,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43196 samples/s/p 6:22:16 } +2024-07-25 18:45:13,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 678/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.2498461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:13,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43256 samples/s/p 6:22:11 } +2024-07-25 18:45:16,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 680/ 1625], loss: 1.174, per_step_time: 1481ms, lr: 1.2535384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:16,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.39987 samples/s/p 6:24:27 } 
+2024-07-25 18:45:18,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 682/ 1625], loss: 1.045, per_step_time: 1470ms, lr: 1.2572307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:18,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43999 samples/s/p 6:21:34 } +2024-07-25 18:45:21,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 684/ 1625], loss: 1.305, per_step_time: 1470ms, lr: 1.2609231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:21,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43871 samples/s/p 6:21:36 } +2024-07-25 18:45:24,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 686/ 1625], loss: 1.252, per_step_time: 1470ms, lr: 1.2646153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:24,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43911 samples/s/p 6:21:31 } +2024-07-25 18:45:27,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 688/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.2683076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:27,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43441 samples/s/p 6:21:48 } +2024-07-25 18:45:30,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 690/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.2719999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:30,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.2% |██ | 5.43545 samples/s/p 6:21:41 } +2024-07-25 18:45:33,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 692/ 1625], loss: 1.014, per_step_time: 1471ms, lr: 1.2756923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
18:45:33,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43830 samples/s/p 6:21:26 } +2024-07-25 18:45:36,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 694/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 1.2793846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:36,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.42927 samples/s/p 6:22:01 } +2024-07-25 18:45:39,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 696/ 1625], loss: 1.387, per_step_time: 1471ms, lr: 1.2830768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:39,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43632 samples/s/p 6:21:28 } +2024-07-25 18:45:42,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 698/ 1625], loss: 1.554, per_step_time: 1473ms, lr: 1.2867692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:42,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.42959 samples/s/p 6:21:54 } +2024-07-25 18:45:45,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 700/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 1.2904615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:45,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43753 samples/s/p 6:21:18 } +2024-07-25 18:45:48,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 702/ 1625], loss: 1.271, per_step_time: 1470ms, lr: 1.29415375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:48,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43976 samples/s/p 6:21:05 } +2024-07-25 18:45:51,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 704/ 1625], loss: 1.303, per_step_time: 1472ms, lr: 1.2978461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:51,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43157 samples/s/p 6:21:37 } +2024-07-25 18:45:54,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 706/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 1.3015384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:54,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.3% |██ | 5.43559 samples/s/p 6:21:17 } +2024-07-25 18:45:57,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 708/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 1.3052308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:45:57,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.42852 samples/s/p 6:21:44 } +2024-07-25 18:46:00,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 710/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 1.308923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:00,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43412 samples/s/p 6:21:17 } +2024-07-25 18:46:03,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 712/ 1625], loss: 1.294, per_step_time: 1472ms, lr: 1.3126153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:03,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43138 samples/s/p 6:21:26 } +2024-07-25 18:46:06,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 714/ 1625], loss: 1.334, per_step_time: 1472ms, lr: 1.3163076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:06,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43170 samples/s/p 
6:21:21 } +2024-07-25 18:46:09,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 716/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.32e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:09,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43564 samples/s/p 6:21:02 } +2024-07-25 18:46:12,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 718/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.3236923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:12,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43670 samples/s/p 6:20:55 } +2024-07-25 18:46:15,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 720/ 1625], loss: 1.106, per_step_time: 1474ms, lr: 1.3273845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:15,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.42642 samples/s/p 6:21:35 } +2024-07-25 18:46:17,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 722/ 1625], loss: 1.184, per_step_time: 1473ms, lr: 1.3310769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:17,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.4% |██ | 5.43023 samples/s/p 6:21:16 } +2024-07-25 18:46:20,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 724/ 1625], loss: 1.268, per_step_time: 1474ms, lr: 1.33476915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:20,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.42694 samples/s/p 6:21:27 } +2024-07-25 18:46:23,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 726/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 1.3384615e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 18:46:23,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43682 samples/s/p 6:20:42 } +2024-07-25 18:46:26,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 728/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 1.3421538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:26,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43837 samples/s/p 6:20:33 } +2024-07-25 18:46:29,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 730/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 1.3458461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:29,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43832 samples/s/p 6:20:30 } +2024-07-25 18:46:32,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 732/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 1.3495384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:32,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43019 samples/s/p 6:21:01 } +2024-07-25 18:46:35,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 734/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.3532307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:35,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43573 samples/s/p 6:20:35 } +2024-07-25 18:46:38,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 736/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 1.356923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:38,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43607 samples/s/p 6:20:31 } +2024-07-25 18:46:41,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 
10], step:[ 738/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 1.36061535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:41,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.5% |██ | 5.43319 samples/s/p 6:20:40 } +2024-07-25 18:46:44,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 740/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 1.3643076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:44,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.42983 samples/s/p 6:20:51 } +2024-07-25 18:46:47,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 742/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 1.368e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:47,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43833 samples/s/p 6:20:12 } +2024-07-25 18:46:50,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 744/ 1625], loss: 1.380, per_step_time: 1472ms, lr: 1.3716922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:50,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43255 samples/s/p 6:20:34 } +2024-07-25 18:46:53,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 746/ 1625], loss: 1.155, per_step_time: 1469ms, lr: 1.3753845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:53,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.44219 samples/s/p 6:19:50 } +2024-07-25 18:46:56,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 748/ 1625], loss: 1.283, per_step_time: 1472ms, lr: 1.3790768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:56,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43234 
samples/s/p 6:20:29 } +2024-07-25 18:46:59,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 750/ 1625], loss: 1.363, per_step_time: 1471ms, lr: 1.3827692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:46:59,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43544 samples/s/p 6:20:13 } +2024-07-25 18:47:02,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 752/ 1625], loss: 0.935, per_step_time: 1471ms, lr: 1.38646155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:02,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43804 samples/s/p 6:19:59 } +2024-07-25 18:47:05,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 754/ 1625], loss: 1.297, per_step_time: 1470ms, lr: 1.3901537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:05,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.6% |██ | 5.43851 samples/s/p 6:19:54 } +2024-07-25 18:47:08,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 756/ 1625], loss: 1.103, per_step_time: 1471ms, lr: 1.3938461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:08,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43648 samples/s/p 6:20:00 } +2024-07-25 18:47:11,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 758/ 1625], loss: 1.241, per_step_time: 1480ms, lr: 1.3975384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:11,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.40347 samples/s/p 6:22:16 } +2024-07-25 18:47:14,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 760/ 1625], loss: 1.270, per_step_time: 1470ms, lr: 1.40123075e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 18:47:14,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.44043 samples/s/p 6:19:37 } +2024-07-25 18:47:17,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 762/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 1.404923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:17,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43281 samples/s/p 6:20:06 } +2024-07-25 18:47:19,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 764/ 1625], loss: 1.331, per_step_time: 1472ms, lr: 1.4086153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:19,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43459 samples/s/p 6:19:56 } +2024-07-25 18:47:22,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 766/ 1625], loss: 1.412, per_step_time: 1472ms, lr: 1.4123077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:22,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43410 samples/s/p 6:19:55 } +2024-07-25 18:47:25,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 768/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.4159999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:25,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.43172 samples/s/p 6:20:02 } +2024-07-25 18:47:28,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 770/ 1625], loss: 1.398, per_step_time: 1474ms, lr: 1.4196922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:28,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.7% |██ | 5.42704 samples/s/p 6:20:19 } +2024-07-25 18:47:31,790 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 1/ 10], step:[ 772/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.4233846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:31,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43224 samples/s/p 6:19:54 } +2024-07-25 18:47:34,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 774/ 1625], loss: 1.239, per_step_time: 1472ms, lr: 1.4270769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:34,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43358 samples/s/p 6:19:45 } +2024-07-25 18:47:37,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 776/ 1625], loss: 1.196, per_step_time: 1474ms, lr: 1.4307692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:37,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.42385 samples/s/p 6:20:23 } +2024-07-25 18:47:40,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 778/ 1625], loss: 1.310, per_step_time: 1472ms, lr: 1.4344614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:40,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43288 samples/s/p 6:19:42 } +2024-07-25 18:47:43,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 780/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 1.4381538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:43,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43830 samples/s/p 6:19:17 } +2024-07-25 18:47:46,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 782/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 1.44184605e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:46,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% 
|██ | 5.43404 samples/s/p 6:19:32 } +2024-07-25 18:47:49,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 784/ 1625], loss: 1.322, per_step_time: 1471ms, lr: 1.4455384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:49,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43650 samples/s/p 6:19:18 } +2024-07-25 18:47:52,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 786/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.4492307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:52,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.43163 samples/s/p 6:19:36 } +2024-07-25 18:47:55,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 788/ 1625], loss: 1.232, per_step_time: 1477ms, lr: 1.452923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:55,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.8% |██ | 5.41461 samples/s/p 6:20:44 } +2024-07-25 18:47:58,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 790/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 1.4566153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:47:58,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43330 samples/s/p 6:19:23 } +2024-07-25 18:48:01,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 792/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.4603076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:01,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43433 samples/s/p 6:19:16 } +2024-07-25 18:48:04,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 794/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 1.464e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:48:04,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.44152 samples/s/p 6:18:43 } +2024-07-25 18:48:07,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 796/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 1.4676923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:07,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43171 samples/s/p 6:19:21 } +2024-07-25 18:48:10,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 798/ 1625], loss: 1.349, per_step_time: 1472ms, lr: 1.4713845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:10,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43198 samples/s/p 6:19:17 } +2024-07-25 18:48:13,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 800/ 1625], loss: 1.090, per_step_time: 1470ms, lr: 1.4750769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:13,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.44159 samples/s/p 6:18:33 } +2024-07-25 18:48:16,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 802/ 1625], loss: 1.266, per_step_time: 1473ms, lr: 1.4787692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:16,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.43099 samples/s/p 6:19:15 } +2024-07-25 18:48:19,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 804/ 1625], loss: 1.271, per_step_time: 1474ms, lr: 1.48246145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:19,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 4.9% |██ | 5.42727 samples/s/p 6:19:27 } +2024-07-25 18:48:21,977 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 806/ 1625], loss: 1.011, per_step_time: 1470ms, lr: 1.4861538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:21,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43921 samples/s/p 6:18:35 } +2024-07-25 18:48:24,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 808/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.4898461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:24,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43415 samples/s/p 6:18:53 } +2024-07-25 18:48:27,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 810/ 1625], loss: 1.356, per_step_time: 1472ms, lr: 1.4935385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:27,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43336 samples/s/p 6:18:53 } +2024-07-25 18:48:30,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 812/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 1.4972306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:30,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43454 samples/s/p 6:18:45 } +2024-07-25 18:48:33,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 814/ 1625], loss: 1.210, per_step_time: 1471ms, lr: 1.500923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:33,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.43685 samples/s/p 6:18:33 } +2024-07-25 18:48:36,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 816/ 1625], loss: 1.139, per_step_time: 1470ms, lr: 1.5046153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:36,730 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.44067 samples/s/p 6:18:14 } +2024-07-25 18:48:39,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 818/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 1.50830765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:39,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.42881 samples/s/p 6:19:00 } +2024-07-25 18:48:42,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 820/ 1625], loss: 1.276, per_step_time: 1474ms, lr: 1.512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:42,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.0% |██ | 5.42738 samples/s/p 6:19:03 } +2024-07-25 18:48:45,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 822/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.5156923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:45,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43564 samples/s/p 6:18:26 } +2024-07-25 18:48:48,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 824/ 1625], loss: 1.263, per_step_time: 1473ms, lr: 1.5193845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:48,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.42933 samples/s/p 6:18:49 } +2024-07-25 18:48:51,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 826/ 1625], loss: 1.060, per_step_time: 1470ms, lr: 1.52307675e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:51,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.44014 samples/s/p 6:18:01 } +2024-07-25 18:48:54,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 828/ 1625], 
loss: 1.136, per_step_time: 1473ms, lr: 1.5267691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:54,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43059 samples/s/p 6:18:38 } +2024-07-25 18:48:57,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 830/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 1.5304615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:48:57,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43479 samples/s/p 6:18:18 } +2024-07-25 18:49:00,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 832/ 1625], loss: 1.263, per_step_time: 1473ms, lr: 1.5341539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:00,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43035 samples/s/p 6:18:33 } +2024-07-25 18:49:03,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 834/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 1.537846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:03,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.43826 samples/s/p 6:17:57 } +2024-07-25 18:49:06,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 836/ 1625], loss: 1.266, per_step_time: 1473ms, lr: 1.5415384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:06,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.1% |██ | 5.42912 samples/s/p 6:18:33 } +2024-07-25 18:49:09,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 838/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 1.5452308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:09,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43634 samples/s/p 6:17:59 } 
+2024-07-25 18:49:12,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 840/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 1.5489231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:12,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43286 samples/s/p 6:18:11 } +2024-07-25 18:49:15,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 842/ 1625], loss: 1.164, per_step_time: 1470ms, lr: 1.5526153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:15,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43924 samples/s/p 6:17:41 } +2024-07-25 18:49:18,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 844/ 1625], loss: 1.305, per_step_time: 1471ms, lr: 1.5563075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:18,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43568 samples/s/p 6:17:53 } +2024-07-25 18:49:21,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 846/ 1625], loss: 1.285, per_step_time: 1471ms, lr: 1.5599999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:21,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43792 samples/s/p 6:17:41 } +2024-07-25 18:49:23,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 848/ 1625], loss: 1.123, per_step_time: 1470ms, lr: 1.5636922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:23,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43869 samples/s/p 6:17:35 } +2024-07-25 18:49:26,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 850/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 1.5673846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
18:49:26,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.43501 samples/s/p 6:17:47 } +2024-07-25 18:49:29,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 852/ 1625], loss: 1.398, per_step_time: 1470ms, lr: 1.571077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:29,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.2% |██ | 5.44006 samples/s/p 6:17:23 } +2024-07-25 18:49:32,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 854/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 1.5747692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:32,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.43199 samples/s/p 6:17:54 } +2024-07-25 18:49:35,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 856/ 1625], loss: 1.182, per_step_time: 1474ms, lr: 1.5784615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:35,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.42605 samples/s/p 6:18:16 } +2024-07-25 18:49:38,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 858/ 1625], loss: 1.099, per_step_time: 1470ms, lr: 1.5821537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:38,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.44137 samples/s/p 6:17:09 } +2024-07-25 18:49:41,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 860/ 1625], loss: 1.126, per_step_time: 1469ms, lr: 1.585846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:41,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.44528 samples/s/p 6:16:50 } +2024-07-25 18:49:44,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
862/ 1625], loss: 1.296, per_step_time: 1479ms, lr: 1.5895384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:44,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.40689 samples/s/p 6:19:27 } +2024-07-25 18:49:47,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 864/ 1625], loss: 1.288, per_step_time: 1473ms, lr: 1.5932306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:47,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.42826 samples/s/p 6:17:55 } +2024-07-25 18:49:50,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 866/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 1.596923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:50,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.43319 samples/s/p 6:17:31 } +2024-07-25 18:49:53,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 868/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.6006154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:53,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.3% |██ | 5.43543 samples/s/p 6:17:19 } +2024-07-25 18:49:56,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 870/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 1.6043077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:56,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43876 samples/s/p 6:17:02 } +2024-07-25 18:49:59,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 872/ 1625], loss: 1.030, per_step_time: 1472ms, lr: 1.608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:49:59,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43383 samples/s/p 6:17:20 } 
+2024-07-25 18:50:02,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 874/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.6116921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:02,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43438 samples/s/p 6:17:15 } +2024-07-25 18:50:05,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 876/ 1625], loss: 1.141, per_step_time: 1470ms, lr: 1.6153845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:05,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43996 samples/s/p 6:16:48 } +2024-07-25 18:50:08,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 878/ 1625], loss: 1.306, per_step_time: 1473ms, lr: 1.6190768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:08,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.42815 samples/s/p 6:17:35 } +2024-07-25 18:50:11,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 880/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 1.6227692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:11,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43033 samples/s/p 6:17:23 } +2024-07-25 18:50:14,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 882/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 1.6264614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:14,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.44089 samples/s/p 6:16:36 } +2024-07-25 18:50:17,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 884/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 1.6301537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
18:50:17,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.4% |██ | 5.43222 samples/s/p 6:17:09 } +2024-07-25 18:50:20,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 886/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 1.6338461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:20,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.44169 samples/s/p 6:16:27 } +2024-07-25 18:50:22,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 888/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 1.6375385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:22,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.42890 samples/s/p 6:17:17 } +2024-07-25 18:50:25,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 890/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 1.6412308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:25,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43510 samples/s/p 6:16:48 } +2024-07-25 18:50:28,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 892/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 1.6449228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:28,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43710 samples/s/p 6:16:37 } +2024-07-25 18:50:31,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 894/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 1.6486152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:31,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43234 samples/s/p 6:16:54 } +2024-07-25 18:50:34,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 896/ 1625], loss: 1.447, per_step_time: 1474ms, lr: 1.6523076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:34,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.42400 samples/s/p 6:17:26 } +2024-07-25 18:50:37,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 898/ 1625], loss: 1.452, per_step_time: 1471ms, lr: 1.656e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:37,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43489 samples/s/p 6:16:37 } +2024-07-25 18:50:40,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 900/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.6596923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:40,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.5% |██ | 5.43457 samples/s/p 6:16:36 } +2024-07-25 18:50:43,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 902/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 1.6633845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:43,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43434 samples/s/p 6:16:34 } +2024-07-25 18:50:46,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 904/ 1625], loss: 1.327, per_step_time: 1470ms, lr: 1.6670769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:46,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43891 samples/s/p 6:16:12 } +2024-07-25 18:50:49,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 906/ 1625], loss: 1.376, per_step_time: 1470ms, lr: 1.6707692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:49,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43986 samples/s/p 
6:16:05 } +2024-07-25 18:50:52,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 908/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.6744614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:52,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43809 samples/s/p 6:16:09 } +2024-07-25 18:50:55,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 910/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.6781538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:55,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43373 samples/s/p 6:16:24 } +2024-07-25 18:50:58,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 912/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 1.681846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:50:58,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43653 samples/s/p 6:16:10 } +2024-07-25 18:51:01,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 914/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 1.6855383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:01,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43924 samples/s/p 6:15:56 } +2024-07-25 18:51:04,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 916/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 1.6892307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:04,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43157 samples/s/p 6:16:25 } +2024-07-25 18:51:07,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 918/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 1.692923e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 18:51:07,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.6% |██ | 5.43559 samples/s/p 6:16:05 } +2024-07-25 18:51:10,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 920/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 1.6966154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:10,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43277 samples/s/p 6:16:14 } +2024-07-25 18:51:13,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 922/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 1.7003076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:13,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43488 samples/s/p 6:16:02 } +2024-07-25 18:51:16,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 924/ 1625], loss: 1.219, per_step_time: 1473ms, lr: 1.704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:16,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43026 samples/s/p 6:16:18 } +2024-07-25 18:51:19,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 926/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 1.7076922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:19,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43813 samples/s/p 6:15:43 } +2024-07-25 18:51:22,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 928/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 1.7113845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:22,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43535 samples/s/p 6:15:51 } +2024-07-25 18:51:24,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 
10], step:[ 930/ 1625], loss: 1.207, per_step_time: 1470ms, lr: 1.7150769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:24,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43999 samples/s/p 6:15:29 } +2024-07-25 18:51:27,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 932/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 1.718769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:27,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43961 samples/s/p 6:15:28 } +2024-07-25 18:51:30,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 934/ 1625], loss: 1.250, per_step_time: 1471ms, lr: 1.7224615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:30,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.7% |██ | 5.43724 samples/s/p 6:15:34 } +2024-07-25 18:51:33,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 936/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 1.7261538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:33,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43351 samples/s/p 6:15:47 } +2024-07-25 18:51:36,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 938/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 1.7298462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:36,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43049 samples/s/p 6:15:57 } +2024-07-25 18:51:39,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 940/ 1625], loss: 1.385, per_step_time: 1471ms, lr: 1.7335384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:39,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43506 
samples/s/p 6:15:35 } +2024-07-25 18:51:42,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 942/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.7372306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:42,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43766 samples/s/p 6:15:21 } +2024-07-25 18:51:45,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 944/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 1.740923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:45,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43546 samples/s/p 6:15:27 } +2024-07-25 18:51:48,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 946/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.7446153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:48,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.43521 samples/s/p 6:15:25 } +2024-07-25 18:51:51,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 948/ 1625], loss: 1.122, per_step_time: 1473ms, lr: 1.7483077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:51,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.42768 samples/s/p 6:15:54 } +2024-07-25 18:51:54,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 950/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 1.7519998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:51:54,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.8% |██ | 5.42768 samples/s/p 6:15:51 } +2024-07-25 18:51:57,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 952/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 1.7556922e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 18:51:57,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.44017 samples/s/p 6:14:56 } +2024-07-25 18:52:00,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 954/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.7593846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:00,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43298 samples/s/p 6:15:23 } +2024-07-25 18:52:03,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 956/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 1.763077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:03,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43828 samples/s/p 6:14:58 } +2024-07-25 18:52:06,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 958/ 1625], loss: 1.321, per_step_time: 1471ms, lr: 1.7667691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:06,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43516 samples/s/p 6:15:08 } +2024-07-25 18:52:09,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 960/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 1.7704613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:09,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.42992 samples/s/p 6:15:27 } +2024-07-25 18:52:12,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 962/ 1625], loss: 0.985, per_step_time: 1471ms, lr: 1.7741537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:12,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43799 samples/s/p 6:14:50 } +2024-07-25 18:52:15,123 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 1/ 10], step:[ 964/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 1.777846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:15,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43264 samples/s/p 6:15:09 } +2024-07-25 18:52:18,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 966/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 1.7815384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:18,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 5.9% |██ | 5.43491 samples/s/p 6:14:57 } +2024-07-25 18:52:21,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 968/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 1.7852308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:21,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.43648 samples/s/p 6:14:48 } +2024-07-25 18:52:23,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 970/ 1625], loss: 1.283, per_step_time: 1472ms, lr: 1.788923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:23,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.43225 samples/s/p 6:15:02 } +2024-07-25 18:52:26,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 972/ 1625], loss: 1.208, per_step_time: 1473ms, lr: 1.7926153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:26,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ | 5.42923 samples/s/p 6:15:12 } +2024-07-25 18:52:29,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 974/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 1.7963077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:29,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |██ 
| 5.43099 samples/s/p 6:15:01 } +2024-07-25 18:52:32,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 976/ 1625], loss: 1.237, per_step_time: 1473ms, lr: 1.7999999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:32,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.43026 samples/s/p 6:15:02 } +2024-07-25 18:52:35,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 978/ 1625], loss: 1.108, per_step_time: 1469ms, lr: 1.8036922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:35,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.44321 samples/s/p 6:14:05 } +2024-07-25 18:52:38,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 980/ 1625], loss: 1.142, per_step_time: 1482ms, lr: 1.8073844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:38,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.39601 samples/s/p 6:17:18 } +2024-07-25 18:52:41,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 982/ 1625], loss: 1.345, per_step_time: 1473ms, lr: 1.8110768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:41,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.0% |███ | 5.42871 samples/s/p 6:14:59 } +2024-07-25 18:52:44,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 984/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.8147692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:44,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43396 samples/s/p 6:14:34 } +2024-07-25 18:52:47,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 986/ 1625], loss: 1.310, per_step_time: 1470ms, lr: 1.8184615e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:52:47,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.44006 samples/s/p 6:14:06 } +2024-07-25 18:52:50,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 988/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 1.8221539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:50,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43463 samples/s/p 6:14:26 } +2024-07-25 18:52:53,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 990/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 1.825846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:53,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43309 samples/s/p 6:14:29 } +2024-07-25 18:52:56,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 992/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 1.8295383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:56,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43372 samples/s/p 6:14:24 } +2024-07-25 18:52:59,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 994/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.8332306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:52:59,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43762 samples/s/p 6:14:05 } +2024-07-25 18:53:02,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 996/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 1.836923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:02,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.42991 samples/s/p 6:14:34 } +2024-07-25 18:53:05,317 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 998/ 1625], loss: 1.314, per_step_time: 1471ms, lr: 1.8406154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:05,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.1% |███ | 5.43589 samples/s/p 6:14:06 } +2024-07-25 18:53:08,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1000/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.8443076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:08,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43818 samples/s/p 6:13:53 } +2024-07-25 18:53:11,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1002/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 1.848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:11,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43321 samples/s/p 6:14:11 } +2024-07-25 18:53:14,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1004/ 1625], loss: 1.311, per_step_time: 1474ms, lr: 1.8516923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:14,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.42656 samples/s/p 6:14:36 } +2024-07-25 18:53:17,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1006/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 1.8553847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:17,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43226 samples/s/p 6:14:09 } +2024-07-25 18:53:20,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1008/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 1.859077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:20,077 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43303 samples/s/p 6:14:03 } +2024-07-25 18:53:23,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1010/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 1.862769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:23,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.43539 samples/s/p 6:13:50 } +2024-07-25 18:53:25,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1012/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 1.8664614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:25,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.44064 samples/s/p 6:13:26 } +2024-07-25 18:53:28,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1014/ 1625], loss: 1.070, per_step_time: 1469ms, lr: 1.8701538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:28,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.2% |███ | 5.44266 samples/s/p 6:13:14 } +2024-07-25 18:53:31,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1016/ 1625], loss: 1.289, per_step_time: 1471ms, lr: 1.8738461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:31,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43786 samples/s/p 6:13:31 } +2024-07-25 18:53:34,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1018/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 1.8775383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:34,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43162 samples/s/p 6:13:54 } +2024-07-25 18:53:37,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1020/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 1.8812307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:37,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43614 samples/s/p 6:13:32 } +2024-07-25 18:53:40,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1022/ 1625], loss: 1.230, per_step_time: 1473ms, lr: 1.884923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:40,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43060 samples/s/p 6:13:52 } +2024-07-25 18:53:43,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1024/ 1625], loss: 1.329, per_step_time: 1473ms, lr: 1.8886154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:43,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43043 samples/s/p 6:13:50 } +2024-07-25 18:53:46,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1026/ 1625], loss: 1.394, per_step_time: 1470ms, lr: 1.8923076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:46,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.44102 samples/s/p 6:13:04 } +2024-07-25 18:53:49,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1028/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.8959998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:49,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43793 samples/s/p 6:13:13 } +2024-07-25 18:53:52,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1030/ 1625], loss: 1.047, per_step_time: 1471ms, lr: 1.8996921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:52,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.3% |███ | 5.43498 
samples/s/p 6:13:23 } +2024-07-25 18:53:55,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1032/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 1.9033845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:55,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.43460 samples/s/p 6:13:21 } +2024-07-25 18:53:58,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1034/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 1.9070769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:53:58,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.43659 samples/s/p 6:13:10 } +2024-07-25 18:54:01,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1036/ 1625], loss: 1.235, per_step_time: 1477ms, lr: 1.9107692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:01,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.41581 samples/s/p 6:14:33 } +2024-07-25 18:54:04,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1038/ 1625], loss: 1.303, per_step_time: 1475ms, lr: 1.9144614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:04,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.42365 samples/s/p 6:13:58 } +2024-07-25 18:54:07,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1040/ 1625], loss: 1.367, per_step_time: 1473ms, lr: 1.9181538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:07,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.42976 samples/s/p 6:13:29 } +2024-07-25 18:54:10,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1042/ 1625], loss: 1.212, per_step_time: 1472ms, lr: 1.921846e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:54:10,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.43117 samples/s/p 6:13:21 } +2024-07-25 18:54:13,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1044/ 1625], loss: 1.122, per_step_time: 1474ms, lr: 1.9255383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:13,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.42601 samples/s/p 6:13:39 } +2024-07-25 18:54:16,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1046/ 1625], loss: 1.060, per_step_time: 1472ms, lr: 1.9292307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:16,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.43214 samples/s/p 6:13:11 } +2024-07-25 18:54:19,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1048/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.9329229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:19,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.4% |███ | 5.43604 samples/s/p 6:12:52 } +2024-07-25 18:54:22,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1050/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 1.9366153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:22,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.43610 samples/s/p 6:12:48 } +2024-07-25 18:54:25,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1052/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.9403076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:25,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.43505 samples/s/p 6:12:50 } +2024-07-25 18:54:27,969 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1054/ 1625], loss: 1.456, per_step_time: 1473ms, lr: 1.944e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:27,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.43067 samples/s/p 6:13:05 } +2024-07-25 18:54:30,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1056/ 1625], loss: 0.973, per_step_time: 1474ms, lr: 1.9476924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:30,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.42666 samples/s/p 6:13:19 } +2024-07-25 18:54:33,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1058/ 1625], loss: 1.146, per_step_time: 1470ms, lr: 1.9513845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:33,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.44201 samples/s/p 6:12:12 } +2024-07-25 18:54:36,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1060/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 1.9550767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.44047 samples/s/p 6:12:16 } +2024-07-25 18:54:39,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1062/ 1625], loss: 1.185, per_step_time: 1474ms, lr: 1.9587691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:39,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.42488 samples/s/p 6:13:17 } +2024-07-25 18:54:42,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1064/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 1.9624615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:42,726 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.5% |███ | 5.43533 samples/s/p 6:12:31 } +2024-07-25 18:54:45,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1066/ 1625], loss: 1.312, per_step_time: 1470ms, lr: 1.9661538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:45,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43947 samples/s/p 6:12:11 } +2024-07-25 18:54:48,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1068/ 1625], loss: 1.103, per_step_time: 1473ms, lr: 1.969846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:48,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.42870 samples/s/p 6:12:52 } +2024-07-25 18:54:51,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1070/ 1625], loss: 1.237, per_step_time: 1470ms, lr: 1.9735384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:51,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.44170 samples/s/p 6:11:56 } +2024-07-25 18:54:54,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1072/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 1.9772307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:54,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43364 samples/s/p 6:12:26 } +2024-07-25 18:54:57,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1074/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.9809231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:54:57,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43712 samples/s/p 6:12:09 } +2024-07-25 18:55:00,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1076/ 1625], loss: 1.013, per_step_time: 1471ms, lr: 1.9846153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:00,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43671 samples/s/p 6:12:08 } +2024-07-25 18:55:03,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1078/ 1625], loss: 1.176, per_step_time: 1472ms, lr: 1.9883075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:03,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43112 samples/s/p 6:12:28 } +2024-07-25 18:55:06,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1080/ 1625], loss: 1.101, per_step_time: 1472ms, lr: 1.9919999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:06,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.6% |███ | 5.43355 samples/s/p 6:12:15 } +2024-07-25 18:55:09,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1082/ 1625], loss: 1.403, per_step_time: 1472ms, lr: 1.9956922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:09,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43257 samples/s/p 6:12:16 } +2024-07-25 18:55:12,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1084/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 1.9993846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:12,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43380 samples/s/p 6:12:08 } +2024-07-25 18:55:15,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1086/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 2.0030768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:15,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.42857 
samples/s/p 6:12:26 } +2024-07-25 18:55:18,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1088/ 1625], loss: 1.225, per_step_time: 1474ms, lr: 2.0067691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:18,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.42576 samples/s/p 6:12:35 } +2024-07-25 18:55:21,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1090/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 2.0104615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:21,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43077 samples/s/p 6:12:12 } +2024-07-25 18:55:24,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1092/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 2.0141539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:24,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43761 samples/s/p 6:11:40 } +2024-07-25 18:55:27,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1094/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 2.017846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:27,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.43014 samples/s/p 6:12:08 } +2024-07-25 18:55:29,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1096/ 1625], loss: 1.179, per_step_time: 1474ms, lr: 2.0215382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:29,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.7% |███ | 5.42606 samples/s/p 6:12:22 } +2024-07-25 18:55:32,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1098/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.0252306e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:55:32,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43502 samples/s/p 6:11:42 } +2024-07-25 18:55:35,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1100/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 2.028923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:35,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43218 samples/s/p 6:11:51 } +2024-07-25 18:55:38,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1102/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.0326153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:38,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43458 samples/s/p 6:11:38 } +2024-07-25 18:55:41,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1104/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 2.0363077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:41,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.44017 samples/s/p 6:11:12 } +2024-07-25 18:55:44,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1106/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 2.0399999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:44,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43355 samples/s/p 6:11:37 } +2024-07-25 18:55:47,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1108/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.0436923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:47,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43652 samples/s/p 6:11:21 } +2024-07-25 18:55:50,626 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1110/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 2.0473844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:50,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43441 samples/s/p 6:11:27 } +2024-07-25 18:55:53,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1112/ 1625], loss: 1.234, per_step_time: 1473ms, lr: 2.0510768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:53,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.8% |███ | 5.43052 samples/s/p 6:11:40 } +2024-07-25 18:55:56,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1114/ 1625], loss: 1.048, per_step_time: 1473ms, lr: 2.0547692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:56,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.42797 samples/s/p 6:11:48 } +2024-07-25 18:55:59,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1116/ 1625], loss: 1.025, per_step_time: 1472ms, lr: 2.0584614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:55:59,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.43293 samples/s/p 6:11:24 } +2024-07-25 18:56:02,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1118/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 2.0621537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:02,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.43518 samples/s/p 6:11:12 } +2024-07-25 18:56:05,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1120/ 1625], loss: 1.177, per_step_time: 1474ms, lr: 2.0658461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:05,394 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.42506 samples/s/p 6:11:51 } +2024-07-25 18:56:08,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1122/ 1625], loss: 1.272, per_step_time: 1475ms, lr: 2.0695385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:08,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.42172 samples/s/p 6:12:02 } +2024-07-25 18:56:11,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1124/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.0732308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:11,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.43731 samples/s/p 6:10:55 } +2024-07-25 18:56:14,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1126/ 1625], loss: 1.313, per_step_time: 1471ms, lr: 2.0769228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:14,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.43626 samples/s/p 6:10:56 } +2024-07-25 18:56:17,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1128/ 1625], loss: 1.227, per_step_time: 1473ms, lr: 2.0806152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:17,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 6.9% |███ | 5.43041 samples/s/p 6:11:17 } +2024-07-25 18:56:20,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1130/ 1625], loss: 1.084, per_step_time: 1470ms, lr: 2.0843076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:20,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43945 samples/s/p 6:10:37 } +2024-07-25 18:56:23,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1132/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 2.088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:23,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43563 samples/s/p 6:10:50 } +2024-07-25 18:56:26,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1134/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.0916923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:26,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43493 samples/s/p 6:10:50 } +2024-07-25 18:56:29,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1136/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 2.0953845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:29,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43242 samples/s/p 6:10:57 } +2024-07-25 18:56:31,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1138/ 1625], loss: 1.278, per_step_time: 1473ms, lr: 2.0990768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:31,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43082 samples/s/p 6:11:01 } +2024-07-25 18:56:34,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1140/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 2.1027692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:34,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.43530 samples/s/p 6:10:39 } +2024-07-25 18:56:37,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1142/ 1625], loss: 1.185, per_step_time: 1473ms, lr: 2.1064616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:37,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.42777 samples/s/p 
6:11:07 } +2024-07-25 18:56:40,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1144/ 1625], loss: 1.341, per_step_time: 1474ms, lr: 2.1101538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:40,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.0% |███ | 5.42589 samples/s/p 6:11:12 } +2024-07-25 18:56:43,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1146/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.113846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:43,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43493 samples/s/p 6:10:32 } +2024-07-25 18:56:46,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1148/ 1625], loss: 1.299, per_step_time: 1473ms, lr: 2.1175383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:46,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.42816 samples/s/p 6:10:57 } +2024-07-25 18:56:49,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1150/ 1625], loss: 1.231, per_step_time: 1473ms, lr: 2.1212307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:49,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.42834 samples/s/p 6:10:53 } +2024-07-25 18:56:52,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1152/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.124923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:52,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43259 samples/s/p 6:10:33 } +2024-07-25 18:56:55,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1154/ 1625], loss: 0.892, per_step_time: 1471ms, lr: 2.1286154e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 18:56:55,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43778 samples/s/p 6:10:09 } +2024-07-25 18:56:58,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1156/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 2.1323076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:56:58,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43267 samples/s/p 6:10:27 } +2024-07-25 18:57:01,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1158/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:01,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43235 samples/s/p 6:10:25 } +2024-07-25 18:57:04,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1160/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 2.1396922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:04,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.1% |███ | 5.43297 samples/s/p 6:10:19 } +2024-07-25 18:57:07,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1162/ 1625], loss: 1.084, per_step_time: 1469ms, lr: 2.1433845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:07,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.44410 samples/s/p 6:09:31 } +2024-07-25 18:57:10,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1164/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 2.1470767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:10,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43681 samples/s/p 6:09:58 } +2024-07-25 18:57:13,287 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1166/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.150769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:13,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43282 samples/s/p 6:10:11 } +2024-07-25 18:57:16,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1168/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.1544614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:16,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43451 samples/s/p 6:10:01 } +2024-07-25 18:57:19,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1170/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.1581538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:19,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43658 samples/s/p 6:09:50 } +2024-07-25 18:57:22,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1172/ 1625], loss: 1.240, per_step_time: 1476ms, lr: 2.1618462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:22,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.41719 samples/s/p 6:11:06 } +2024-07-25 18:57:25,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1174/ 1625], loss: 1.450, per_step_time: 1470ms, lr: 2.1655384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:25,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43850 samples/s/p 6:09:36 } +2024-07-25 18:57:28,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1176/ 1625], loss: 1.208, per_step_time: 1473ms, lr: 2.1692307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:28,052 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.42941 samples/s/p 6:10:10 } +2024-07-25 18:57:31,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1178/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 2.1729229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:31,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.2% |███ | 5.43734 samples/s/p 6:09:35 } +2024-07-25 18:57:33,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1180/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 2.1766153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:33,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.43290 samples/s/p 6:09:50 } +2024-07-25 18:57:36,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1182/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.1803076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:36,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.43812 samples/s/p 6:09:26 } +2024-07-25 18:57:39,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1184/ 1625], loss: 1.212, per_step_time: 1474ms, lr: 2.1839998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:39,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.42687 samples/s/p 6:10:09 } +2024-07-25 18:57:42,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1186/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.1876922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:42,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.43257 samples/s/p 6:09:43 } +2024-07-25 18:57:45,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1188/ 1625], loss: 1.028, per_step_time: 1475ms, lr: 2.1913846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:45,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.42171 samples/s/p 6:10:24 } +2024-07-25 18:57:48,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1190/ 1625], loss: 1.326, per_step_time: 1470ms, lr: 2.195077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:48,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.44133 samples/s/p 6:09:01 } +2024-07-25 18:57:51,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1192/ 1625], loss: 1.019, per_step_time: 1474ms, lr: 2.1987693e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:51,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.42450 samples/s/p 6:10:07 } +2024-07-25 18:57:54,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1194/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 2.2024613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:54,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.3% |███ | 5.43399 samples/s/p 6:09:25 } +2024-07-25 18:57:57,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1196/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 2.2061537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:57:57,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43742 samples/s/p 6:09:08 } +2024-07-25 18:58:00,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1198/ 1625], loss: 0.908, per_step_time: 1471ms, lr: 2.209846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:00,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43786 
samples/s/p 6:09:04 } +2024-07-25 18:58:03,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1200/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 2.2135384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:03,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43571 samples/s/p 6:09:09 } +2024-07-25 18:58:06,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1202/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 2.2172308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:06,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43164 samples/s/p 6:09:23 } +2024-07-25 18:58:09,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1204/ 1625], loss: 0.968, per_step_time: 1473ms, lr: 2.220923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:09,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.42928 samples/s/p 6:09:30 } +2024-07-25 18:58:12,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1206/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 2.2246153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:12,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43519 samples/s/p 6:09:03 } +2024-07-25 18:58:15,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1208/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.2283077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:15,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43245 samples/s/p 6:09:11 } +2024-07-25 18:58:18,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1210/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 2.2319999e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:58:18,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.4% |███ | 5.43338 samples/s/p 6:09:04 } +2024-07-25 18:58:21,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1212/ 1625], loss: 1.206, per_step_time: 1470ms, lr: 2.2356922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:21,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.44094 samples/s/p 6:08:30 } +2024-07-25 18:58:24,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1214/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 2.2393844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:24,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43386 samples/s/p 6:08:56 } +2024-07-25 18:58:27,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1216/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 2.2430768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:27,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43832 samples/s/p 6:08:35 } +2024-07-25 18:58:30,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1218/ 1625], loss: 1.323, per_step_time: 1472ms, lr: 2.2467691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:30,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43395 samples/s/p 6:08:50 } +2024-07-25 18:58:32,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1220/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 2.2504615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:32,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43789 samples/s/p 6:08:31 } +2024-07-25 18:58:35,935 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1222/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 2.2541539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:35,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43442 samples/s/p 6:08:42 } +2024-07-25 18:58:38,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1224/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 2.257846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:38,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.42919 samples/s/p 6:09:01 } +2024-07-25 18:58:41,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1226/ 1625], loss: 1.000, per_step_time: 1471ms, lr: 2.2615384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:41,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.5% |███ | 5.43617 samples/s/p 6:08:29 } +2024-07-25 18:58:44,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1228/ 1625], loss: 0.934, per_step_time: 1472ms, lr: 2.2652306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:44,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43470 samples/s/p 6:08:32 } +2024-07-25 18:58:47,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1230/ 1625], loss: 1.198, per_step_time: 1474ms, lr: 2.268923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:47,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.42576 samples/s/p 6:09:06 } +2024-07-25 18:58:50,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1232/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 2.2726152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:50,698 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43432 samples/s/p 6:08:28 } +2024-07-25 18:58:53,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1234/ 1625], loss: 1.409, per_step_time: 1471ms, lr: 2.2763075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:53,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43508 samples/s/p 6:08:22 } +2024-07-25 18:58:56,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1236/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.2799999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:56,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43712 samples/s/p 6:08:11 } +2024-07-25 18:58:59,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1238/ 1625], loss: 1.015, per_step_time: 1471ms, lr: 2.2836923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:58:59,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43619 samples/s/p 6:08:11 } +2024-07-25 18:59:02,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1240/ 1625], loss: 1.335, per_step_time: 1471ms, lr: 2.2873846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:02,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43807 samples/s/p 6:08:01 } +2024-07-25 18:59:05,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1242/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.2910768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:05,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.6% |███ | 5.43672 samples/s/p 6:08:03 } +2024-07-25 18:59:08,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1244/ 1625], loss: 1.240, per_step_time: 1470ms, lr: 2.294769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:08,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.44106 samples/s/p 6:07:43 } +2024-07-25 18:59:11,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1246/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.2984614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:11,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43065 samples/s/p 6:08:22 } +2024-07-25 18:59:14,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1248/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 2.3021537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:14,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43344 samples/s/p 6:08:08 } +2024-07-25 18:59:17,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1250/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.3058461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:17,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43513 samples/s/p 6:07:58 } +2024-07-25 18:59:20,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1252/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.3095383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:20,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43307 samples/s/p 6:08:04 } +2024-07-25 18:59:23,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1254/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 2.3132307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:23,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43598 
samples/s/p 6:07:49 } +2024-07-25 18:59:26,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1256/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 2.316923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:26,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43164 samples/s/p 6:08:03 } +2024-07-25 18:59:29,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1258/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.3206154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:29,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.7% |███ | 5.43579 samples/s/p 6:07:44 } +2024-07-25 18:59:32,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1260/ 1625], loss: 1.298, per_step_time: 1474ms, lr: 2.3243078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:32,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.42452 samples/s/p 6:08:27 } +2024-07-25 18:59:34,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1262/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.3279998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:34,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.42934 samples/s/p 6:08:04 } +2024-07-25 18:59:37,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1264/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.3316921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:37,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43567 samples/s/p 6:07:35 } +2024-07-25 18:59:40,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1266/ 1625], loss: 1.196, per_step_time: 1470ms, lr: 2.3353845e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 18:59:40,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43965 samples/s/p 6:07:16 } +2024-07-25 18:59:43,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1268/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 2.3390769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:43,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43815 samples/s/p 6:07:19 } +2024-07-25 18:59:46,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1270/ 1625], loss: 1.068, per_step_time: 1472ms, lr: 2.3427692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:46,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43441 samples/s/p 6:07:32 } +2024-07-25 18:59:49,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1272/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.3464614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:49,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.43531 samples/s/p 6:07:25 } +2024-07-25 18:59:52,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1274/ 1625], loss: 1.147, per_step_time: 1473ms, lr: 2.3501538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:52,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.8% |███ | 5.42972 samples/s/p 6:07:45 } +2024-07-25 18:59:55,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1276/ 1625], loss: 1.259, per_step_time: 1475ms, lr: 2.3538461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:55,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.42129 samples/s/p 6:08:16 } +2024-07-25 18:59:58,576 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1278/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 2.3575383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 18:59:58,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.44105 samples/s/p 6:06:53 } +2024-07-25 19:00:01,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1280/ 1625], loss: 1.207, per_step_time: 1470ms, lr: 2.3612307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:01,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.44011 samples/s/p 6:06:54 } +2024-07-25 19:00:04,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1282/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 2.3649229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:04,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.43257 samples/s/p 6:07:21 } +2024-07-25 19:00:07,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1284/ 1625], loss: 0.973, per_step_time: 1471ms, lr: 2.3686152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:07,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.43806 samples/s/p 6:06:56 } +2024-07-25 19:00:10,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1286/ 1625], loss: 0.877, per_step_time: 1471ms, lr: 2.3723076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:10,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.43626 samples/s/p 6:07:01 } +2024-07-25 19:00:13,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1288/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 2.376e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:13,327 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.43576 samples/s/p 6:07:00 } +2024-07-25 19:00:16,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1290/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.3796923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:16,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 7.9% |███ | 5.43112 samples/s/p 6:07:15 } +2024-07-25 19:00:19,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1292/ 1625], loss: 1.250, per_step_time: 1473ms, lr: 2.3833845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:19,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.43032 samples/s/p 6:07:16 } +2024-07-25 19:00:22,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1294/ 1625], loss: 1.207, per_step_time: 1473ms, lr: 2.3870767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:22,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.43003 samples/s/p 6:07:14 } +2024-07-25 19:00:25,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1296/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 2.390769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:25,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.43720 samples/s/p 6:06:42 } +2024-07-25 19:00:28,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1298/ 1625], loss: 1.293, per_step_time: 1470ms, lr: 2.3944614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:28,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |███ | 5.43910 samples/s/p 6:06:31 } +2024-07-25 19:00:31,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 
1300/ 1625], loss: 1.028, per_step_time: 1469ms, lr: 2.3981538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:31,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.44444 samples/s/p 6:06:07 } +2024-07-25 19:00:33,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1302/ 1625], loss: 1.347, per_step_time: 1473ms, lr: 2.401846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:33,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.43106 samples/s/p 6:06:58 } +2024-07-25 19:00:36,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1304/ 1625], loss: 1.201, per_step_time: 1475ms, lr: 2.4055384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:36,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.42359 samples/s/p 6:07:25 } +2024-07-25 19:00:39,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1306/ 1625], loss: 1.377, per_step_time: 1472ms, lr: 2.4092307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:39,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.43123 samples/s/p 6:06:51 } +2024-07-25 19:00:42,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1308/ 1625], loss: 0.997, per_step_time: 1471ms, lr: 2.4129231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:42,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.0% |████ | 5.43681 samples/s/p 6:06:26 } +2024-07-25 19:00:45,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1310/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 2.4166153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:45,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.43089 
samples/s/p 6:06:47 } +2024-07-25 19:00:48,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1312/ 1625], loss: 1.032, per_step_time: 1470ms, lr: 2.4203075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:48,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.44114 samples/s/p 6:06:03 } +2024-07-25 19:00:51,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1314/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 2.4239998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:51,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.44211 samples/s/p 6:05:56 } +2024-07-25 19:00:54,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1316/ 1625], loss: 1.249, per_step_time: 1471ms, lr: 2.4276922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:54,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.43521 samples/s/p 6:06:21 } +2024-07-25 19:00:57,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1318/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 2.4313846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:00:57,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.43225 samples/s/p 6:06:30 } +2024-07-25 19:01:00,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1320/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 2.4350767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:00,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.43441 samples/s/p 6:06:18 } +2024-07-25 19:01:03,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1322/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 2.4387691e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 19:01:03,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.43442 samples/s/p 6:06:15 } +2024-07-25 19:01:06,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1324/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 2.4424615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:06,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.1% |████ | 5.42885 samples/s/p 6:06:35 } +2024-07-25 19:01:09,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1326/ 1625], loss: 1.435, per_step_time: 1472ms, lr: 2.4461538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:09,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43275 samples/s/p 6:06:16 } +2024-07-25 19:01:12,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1328/ 1625], loss: 1.176, per_step_time: 1472ms, lr: 2.449846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:12,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43468 samples/s/p 6:06:05 } +2024-07-25 19:01:15,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1330/ 1625], loss: 1.146, per_step_time: 1470ms, lr: 2.4535382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:15,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.44195 samples/s/p 6:05:33 } +2024-07-25 19:01:18,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1332/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.4572306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:18,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43671 samples/s/p 6:05:51 } +2024-07-25 19:01:21,204 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1334/ 1625], loss: 1.334, per_step_time: 1472ms, lr: 2.460923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:21,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43249 samples/s/p 6:06:05 } +2024-07-25 19:01:24,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1336/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.4646153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:24,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43622 samples/s/p 6:05:47 } +2024-07-25 19:01:27,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1338/ 1625], loss: 1.316, per_step_time: 1470ms, lr: 2.4683077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:27,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.44135 samples/s/p 6:05:23 } +2024-07-25 19:01:30,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1340/ 1625], loss: 1.336, per_step_time: 1472ms, lr: 2.4719999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:30,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.2% |████ | 5.43430 samples/s/p 6:05:49 } +2024-07-25 19:01:33,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1342/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 2.4756922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:33,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43517 samples/s/p 6:05:42 } +2024-07-25 19:01:35,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1344/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 2.4793844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:35,957 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43188 samples/s/p 6:05:53 } +2024-07-25 19:01:38,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1346/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.4830768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:38,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43532 samples/s/p 6:05:36 } +2024-07-25 19:01:41,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1348/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 2.4867692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:41,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43339 samples/s/p 6:05:41 } +2024-07-25 19:01:44,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1350/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 2.4904613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:44,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43542 samples/s/p 6:05:30 } +2024-07-25 19:01:47,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1352/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.4941537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:47,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43338 samples/s/p 6:05:35 } +2024-07-25 19:01:50,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1354/ 1625], loss: 1.318, per_step_time: 1471ms, lr: 2.497846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:50,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43787 samples/s/p 6:05:14 } +2024-07-25 19:01:53,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 1356/ 1625], loss: 1.040, per_step_time: 1472ms, lr: 2.5015384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:53,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.3% |████ | 5.43457 samples/s/p 6:05:24 } +2024-07-25 19:01:56,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1358/ 1625], loss: 1.326, per_step_time: 1471ms, lr: 2.5052308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:56,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43577 samples/s/p 6:05:17 } +2024-07-25 19:01:59,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1360/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 2.508923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:01:59,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43391 samples/s/p 6:05:21 } +2024-07-25 19:02:02,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1362/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.5126152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:02,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43111 samples/s/p 6:05:29 } +2024-07-25 19:02:05,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1364/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.5163075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:05,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43727 samples/s/p 6:05:02 } +2024-07-25 19:02:08,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1366/ 1625], loss: 1.220, per_step_time: 1473ms, lr: 2.5199999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:08,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 
5.42743 samples/s/p 6:05:38 } +2024-07-25 19:02:11,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1368/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.5236923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:11,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43519 samples/s/p 6:05:04 } +2024-07-25 19:02:14,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1370/ 1625], loss: 1.032, per_step_time: 1471ms, lr: 2.5273845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:14,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43734 samples/s/p 6:04:53 } +2024-07-25 19:02:17,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1372/ 1625], loss: 1.337, per_step_time: 1471ms, lr: 2.5310768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:17,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.4% |████ | 5.43795 samples/s/p 6:04:47 } +2024-07-25 19:02:20,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1374/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 2.5347692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:20,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.43316 samples/s/p 6:05:04 } +2024-07-25 19:02:23,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1376/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.5384616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:23,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.43805 samples/s/p 6:04:41 } +2024-07-25 19:02:26,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1378/ 1625], loss: 1.107, per_step_time: 1473ms, lr: 2.5421536e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:26,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.42830 samples/s/p 6:05:17 } +2024-07-25 19:02:29,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1380/ 1625], loss: 1.206, per_step_time: 1472ms, lr: 2.545846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:29,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.43403 samples/s/p 6:04:51 } +2024-07-25 19:02:32,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1382/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 2.5495383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:32,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.43489 samples/s/p 6:04:45 } +2024-07-25 19:02:34,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1384/ 1625], loss: 1.138, per_step_time: 1473ms, lr: 2.5532307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:34,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.42756 samples/s/p 6:05:11 } +2024-07-25 19:02:37,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1386/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 2.556923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:37,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.42962 samples/s/p 6:05:00 } +2024-07-25 19:02:40,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1388/ 1625], loss: 1.102, per_step_time: 1474ms, lr: 2.5606152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:40,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.5% |████ | 5.42503 samples/s/p 6:05:16 } +2024-07-25 19:02:43,843 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1390/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 2.5643076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:43,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43787 samples/s/p 6:04:21 } +2024-07-25 19:02:46,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1392/ 1625], loss: 1.372, per_step_time: 1471ms, lr: 2.568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:46,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43493 samples/s/p 6:04:30 } +2024-07-25 19:02:49,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1394/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 2.5716923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:49,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43721 samples/s/p 6:04:18 } +2024-07-25 19:02:52,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1396/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 2.5753845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:52,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43773 samples/s/p 6:04:13 } +2024-07-25 19:02:55,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1398/ 1625], loss: 1.091, per_step_time: 1470ms, lr: 2.5790767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:55,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.44108 samples/s/p 6:03:56 } +2024-07-25 19:02:58,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1400/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.582769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:02:58,592 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43511 samples/s/p 6:04:17 } +2024-07-25 19:02:58,593 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-25 19:03:35,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1402/ 1625], loss: 1.293, per_step_time: 1502ms, lr: 2.5864614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:35,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.32521 samples/s/p 6:11:45 } +2024-07-25 19:03:38,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1404/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.5901538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:38,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.6% |████ | 5.43241 samples/s/p 6:04:22 } +2024-07-25 19:03:41,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1406/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 2.5938461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:41,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43535 samples/s/p 6:04:08 } +2024-07-25 19:03:44,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1408/ 1625], loss: 1.193, per_step_time: 1470ms, lr: 2.5975383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:44,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43960 samples/s/p 6:03:48 } +2024-07-25 19:03:47,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1410/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 2.6012307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:47,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43726 samples/s/p 6:03:54 
} +2024-07-25 19:03:50,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1412/ 1625], loss: 1.320, per_step_time: 1472ms, lr: 2.6049229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:50,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43414 samples/s/p 6:04:04 } +2024-07-25 19:03:53,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1414/ 1625], loss: 1.199, per_step_time: 1473ms, lr: 2.6086153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:53,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43061 samples/s/p 6:04:15 } +2024-07-25 19:03:56,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1416/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 2.6123076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:56,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43894 samples/s/p 6:03:38 } +2024-07-25 19:03:59,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1418/ 1625], loss: 1.287, per_step_time: 1473ms, lr: 2.6159998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:03:59,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.43064 samples/s/p 6:04:09 } +2024-07-25 19:04:01,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1420/ 1625], loss: 1.193, per_step_time: 1473ms, lr: 2.6196922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:01,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.7% |████ | 5.42906 samples/s/p 6:04:12 } +2024-07-25 19:04:04,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1422/ 1625], loss: 1.294, per_step_time: 1472ms, lr: 2.6233845e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:04:04,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.43461 samples/s/p 6:03:47 } +2024-07-25 19:04:07,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1424/ 1625], loss: 1.296, per_step_time: 1472ms, lr: 2.6270769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:07,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.43149 samples/s/p 6:03:57 } +2024-07-25 19:04:10,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1426/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 2.6307693e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:10,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.42960 samples/s/p 6:04:01 } +2024-07-25 19:04:13,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1428/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 2.6344613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:13,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.43823 samples/s/p 6:03:24 } +2024-07-25 19:04:16,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1430/ 1625], loss: 1.287, per_step_time: 1469ms, lr: 2.6381536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:16,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.44254 samples/s/p 6:03:03 } +2024-07-25 19:04:19,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1432/ 1625], loss: 1.201, per_step_time: 1470ms, lr: 2.641846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:19,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.44075 samples/s/p 6:03:08 } +2024-07-25 19:04:22,639 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 1/ 10], step:[ 1434/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.6455384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:22,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.43164 samples/s/p 6:03:41 } +2024-07-25 19:04:25,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1436/ 1625], loss: 1.027, per_step_time: 1470ms, lr: 2.6492307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:25,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.43858 samples/s/p 6:03:10 } +2024-07-25 19:04:28,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1438/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 2.652923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:28,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.8% |████ | 5.44022 samples/s/p 6:03:01 } +2024-07-25 19:04:31,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1440/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 2.6566153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:31,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43428 samples/s/p 6:03:22 } +2024-07-25 19:04:34,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1442/ 1625], loss: 1.485, per_step_time: 1471ms, lr: 2.6603077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:34,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43634 samples/s/p 6:03:11 } +2024-07-25 19:04:37,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1444/ 1625], loss: 1.317, per_step_time: 1472ms, lr: 2.664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:37,390 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 8.9% |████ | 5.43131 samples/s/p 6:03:28 } +2024-07-25 19:04:40,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1446/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 2.6676922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:40,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43238 samples/s/p 6:03:21 } +2024-07-25 19:04:43,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1448/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.6713844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:43,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43143 samples/s/p 6:03:21 } +2024-07-25 19:04:46,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1450/ 1625], loss: 1.250, per_step_time: 1471ms, lr: 2.6750768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:46,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43833 samples/s/p 6:02:51 } +2024-07-25 19:04:49,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1452/ 1625], loss: 1.091, per_step_time: 1473ms, lr: 2.6787691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:49,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.42936 samples/s/p 6:03:24 } +2024-07-25 19:04:52,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1454/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 2.6824615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:52,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 8.9% |████ | 5.43360 samples/s/p 6:03:04 } +2024-07-25 19:04:55,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1456/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 
2.6861537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:55,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43188 samples/s/p 6:03:08 } +2024-07-25 19:04:58,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1458/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 2.689846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:04:58,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43088 samples/s/p 6:03:09 } +2024-07-25 19:05:01,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1460/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.6935384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:01,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43709 samples/s/p 6:02:41 } +2024-07-25 19:05:03,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1462/ 1625], loss: 1.251, per_step_time: 1470ms, lr: 2.6972306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:03,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.44151 samples/s/p 6:02:21 } +2024-07-25 19:05:06,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1464/ 1625], loss: 1.139, per_step_time: 1470ms, lr: 2.700923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:06,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.44069 samples/s/p 6:02:21 } +2024-07-25 19:05:09,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1466/ 1625], loss: 1.238, per_step_time: 1470ms, lr: 2.7046151e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:09,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43964 samples/s/p 6:02:22 } +2024-07-25 19:05:12,800 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1468/ 1625], loss: 1.059, per_step_time: 1472ms, lr: 2.7083075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:12,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43110 samples/s/p 6:02:53 } +2024-07-25 19:05:15,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1470/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 2.7119999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:15,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.0% |████ | 5.43597 samples/s/p 6:02:31 } +2024-07-25 19:05:18,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1472/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 2.7156922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:18,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.43137 samples/s/p 6:02:46 } +2024-07-25 19:05:21,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1474/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 2.7193846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:21,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.43184 samples/s/p 6:02:42 } +2024-07-25 19:05:24,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1476/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 2.7230768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:24,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.43629 samples/s/p 6:02:21 } +2024-07-25 19:05:27,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1478/ 1625], loss: 1.244, per_step_time: 1474ms, lr: 2.7267692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:27,564 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.42628 samples/s/p 6:02:58 } +2024-07-25 19:05:30,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1480/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 2.7304613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:30,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.43405 samples/s/p 6:02:24 } +2024-07-25 19:05:33,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1482/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 2.7341537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:33,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.43623 samples/s/p 6:02:12 } +2024-07-25 19:05:36,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1484/ 1625], loss: 1.093, per_step_time: 1474ms, lr: 2.737846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:36,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.42685 samples/s/p 6:02:47 } +2024-07-25 19:05:39,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1486/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 2.7415383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:39,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.1% |████ | 5.42894 samples/s/p 6:02:35 } +2024-07-25 19:05:42,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1488/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 2.7452306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:42,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43319 samples/s/p 6:02:16 } +2024-07-25 19:05:45,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 1490/ 1625], loss: 1.343, per_step_time: 1471ms, lr: 2.748923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:45,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43590 samples/s/p 6:02:02 } +2024-07-25 19:05:48,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1492/ 1625], loss: 1.239, per_step_time: 1472ms, lr: 2.7526154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:48,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43243 samples/s/p 6:02:13 } +2024-07-25 19:05:51,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1494/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.7563077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:51,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43421 samples/s/p 6:02:03 } +2024-07-25 19:05:54,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1496/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 2.7599997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:54,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43350 samples/s/p 6:02:03 } +2024-07-25 19:05:57,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1498/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.7636921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:05:57,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43284 samples/s/p 6:02:02 } +2024-07-25 19:06:00,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1500/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 2.7673845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:00,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 
5.43339 samples/s/p 6:01:57 } +2024-07-25 19:06:02,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1502/ 1625], loss: 1.313, per_step_time: 1472ms, lr: 2.7710768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:02,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.2% |████ | 5.43248 samples/s/p 6:01:58 } +2024-07-25 19:06:05,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1504/ 1625], loss: 1.168, per_step_time: 1473ms, lr: 2.7747692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:05,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.42852 samples/s/p 6:02:11 } +2024-07-25 19:06:08,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1506/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 2.7784614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:08,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43709 samples/s/p 6:01:33 } +2024-07-25 19:06:11,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1508/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 2.7821538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:11,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43410 samples/s/p 6:01:42 } +2024-07-25 19:06:14,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1510/ 1625], loss: 1.420, per_step_time: 1472ms, lr: 2.7858461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:14,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43211 samples/s/p 6:01:47 } +2024-07-25 19:06:17,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1512/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.7895383e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:17,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43378 samples/s/p 6:01:38 } +2024-07-25 19:06:20,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1514/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.7932307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:20,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43256 samples/s/p 6:01:40 } +2024-07-25 19:06:23,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1516/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 2.7969229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:23,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.42814 samples/s/p 6:01:54 } +2024-07-25 19:06:26,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1518/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.8006152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:26,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.3% |████ | 5.43994 samples/s/p 6:01:04 } +2024-07-25 19:06:29,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1520/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.8043076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:29,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43288 samples/s/p 6:01:30 } +2024-07-25 19:06:32,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1522/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 2.808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:32,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43322 samples/s/p 6:01:25 } +2024-07-25 19:06:35,459 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1524/ 1625], loss: 1.341, per_step_time: 1472ms, lr: 2.8116921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:35,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43243 samples/s/p 6:01:26 } +2024-07-25 19:06:38,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1526/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 2.8153845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:38,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.42860 samples/s/p 6:01:38 } +2024-07-25 19:06:41,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1528/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 2.8190769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:41,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43322 samples/s/p 6:01:16 } +2024-07-25 19:06:44,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1530/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.822769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:44,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43789 samples/s/p 6:00:55 } +2024-07-25 19:06:47,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1532/ 1625], loss: 1.023, per_step_time: 1473ms, lr: 2.8264614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:47,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43032 samples/s/p 6:01:22 } +2024-07-25 19:06:50,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1534/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.8301536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:50,220 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.4% |████ | 5.43599 samples/s/p 6:00:57 } +2024-07-25 19:06:53,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1536/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 2.833846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:53,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43911 samples/s/p 6:00:41 } +2024-07-25 19:06:56,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1538/ 1625], loss: 1.208, per_step_time: 1470ms, lr: 2.8375383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:56,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43876 samples/s/p 6:00:40 } +2024-07-25 19:06:59,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1540/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 2.8412307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:06:59,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43556 samples/s/p 6:00:50 } +2024-07-25 19:07:02,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1542/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.844923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:02,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43122 samples/s/p 6:01:04 } +2024-07-25 19:07:04,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1544/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.8486153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:04,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43175 samples/s/p 6:00:59 } +2024-07-25 19:07:07,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 1546/ 1625], loss: 0.967, per_step_time: 1475ms, lr: 2.8523074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:07,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.42351 samples/s/p 6:01:29 } +2024-07-25 19:07:10,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1548/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 2.8559998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:10,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43160 samples/s/p 6:00:54 } +2024-07-25 19:07:13,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1550/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.8596922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:13,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.5% |████ | 5.43121 samples/s/p 6:00:52 } +2024-07-25 19:07:16,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1552/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 2.8633845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:16,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43648 samples/s/p 6:00:28 } +2024-07-25 19:07:19,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1554/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 2.8670767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:19,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43213 samples/s/p 6:00:43 } +2024-07-25 19:07:22,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1556/ 1625], loss: 1.209, per_step_time: 1473ms, lr: 2.8707691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:22,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 
5.42752 samples/s/p 6:00:58 } +2024-07-25 19:07:25,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1558/ 1625], loss: 1.307, per_step_time: 1472ms, lr: 2.8744615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:25,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43409 samples/s/p 6:00:29 } +2024-07-25 19:07:28,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1560/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.8781538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:28,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43583 samples/s/p 6:00:19 } +2024-07-25 19:07:31,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1562/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.8818462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:31,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43139 samples/s/p 6:00:34 } +2024-07-25 19:07:34,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1564/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 2.8855382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:34,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43497 samples/s/p 6:00:17 } +2024-07-25 19:07:37,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1566/ 1625], loss: 1.233, per_step_time: 1474ms, lr: 2.8892306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:37,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.42630 samples/s/p 6:00:48 } +2024-07-25 19:07:40,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1568/ 1625], loss: 1.261, per_step_time: 1473ms, lr: 2.892923e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:40,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.6% |████ | 5.43076 samples/s/p 6:00:27 } +2024-07-25 19:07:43,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1570/ 1625], loss: 1.160, per_step_time: 1474ms, lr: 2.8966153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:43,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.42640 samples/s/p 6:00:42 } +2024-07-25 19:07:46,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1572/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 2.9003077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:46,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.42999 samples/s/p 6:00:25 } +2024-07-25 19:07:49,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1574/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 2.9039998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:49,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43925 samples/s/p 5:59:45 } +2024-07-25 19:07:52,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1576/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.9076922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:52,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43282 samples/s/p 6:00:07 } +2024-07-25 19:07:55,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1578/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 2.9113846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:55,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43362 samples/s/p 6:00:01 } +2024-07-25 19:07:58,118 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1580/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 2.9150768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:07:58,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43854 samples/s/p 5:59:39 } +2024-07-25 19:08:01,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1582/ 1625], loss: 1.286, per_step_time: 1471ms, lr: 2.9187691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:01,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43737 samples/s/p 5:59:41 } +2024-07-25 19:08:04,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1584/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.9224613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:04,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.7% |████ | 5.43663 samples/s/p 5:59:41 } +2024-07-25 19:08:06,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1586/ 1625], loss: 1.325, per_step_time: 1471ms, lr: 2.9261537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:06,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43767 samples/s/p 5:59:33 } +2024-07-25 19:08:09,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1588/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 2.929846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:09,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43556 samples/s/p 5:59:39 } +2024-07-25 19:08:12,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1590/ 1625], loss: 1.431, per_step_time: 1471ms, lr: 2.9335384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:12,869 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43625 samples/s/p 5:59:33 } +2024-07-25 19:08:15,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1592/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 2.9372306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:15,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43377 samples/s/p 5:59:40 } +2024-07-25 19:08:18,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1594/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.940923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:18,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43509 samples/s/p 5:59:32 } +2024-07-25 19:08:21,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1596/ 1625], loss: 1.151, per_step_time: 1475ms, lr: 2.9446152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:21,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.42016 samples/s/p 6:00:28 } +2024-07-25 19:08:24,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1598/ 1625], loss: 1.191, per_step_time: 1470ms, lr: 2.9483075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:24,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.44164 samples/s/p 5:59:00 } +2024-07-25 19:08:27,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1600/ 1625], loss: 1.003, per_step_time: 1471ms, lr: 2.9519999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:27,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.8% |████ | 5.43682 samples/s/p 5:59:16 } +2024-07-25 19:08:30,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], 
step:[ 1602/ 1625], loss: 1.086, per_step_time: 1473ms, lr: 2.955692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:30,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43079 samples/s/p 5:59:37 } +2024-07-25 19:08:33,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1604/ 1625], loss: 1.128, per_step_time: 1474ms, lr: 2.9593844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:33,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.42516 samples/s/p 5:59:57 } +2024-07-25 19:08:36,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1606/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 2.9630768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:36,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43510 samples/s/p 5:59:14 } +2024-07-25 19:08:39,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1608/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 2.9667692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:39,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43119 samples/s/p 5:59:27 } +2024-07-25 19:08:42,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1610/ 1625], loss: 1.243, per_step_time: 1474ms, lr: 2.9704615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:42,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.42443 samples/s/p 5:59:51 } +2024-07-25 19:08:45,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1612/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.9741537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:45,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 
5.43646 samples/s/p 5:59:00 } +2024-07-25 19:08:48,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1614/ 1625], loss: 1.043, per_step_time: 1471ms, lr: 2.9778459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:48,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43482 samples/s/p 5:59:04 } +2024-07-25 19:08:51,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1616/ 1625], loss: 1.134, per_step_time: 1473ms, lr: 2.9815383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:51,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 9.9% |████ | 5.43090 samples/s/p 5:59:16 } +2024-07-25 19:08:54,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1618/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 2.9852306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:54,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.44097 samples/s/p 5:58:33 } +2024-07-25 19:08:57,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1620/ 1625], loss: 1.004, per_step_time: 1472ms, lr: 2.988923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:08:57,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.43385 samples/s/p 5:58:59 } +2024-07-25 19:09:00,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1622/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 2.9926152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:00,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.43693 samples/s/p 5:58:43 } +2024-07-25 19:09:03,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 1/ 10], step:[ 1624/ 1625], loss: 1.311, per_step_time: 1472ms, lr: 2.9963076e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:03,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |████ | 5.43165 samples/s/p 5:59:01 } +2024-07-25 19:09:06,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1/ 1625], loss: 1.243, per_step_time: 1478ms, lr: 3e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:06,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.41160 samples/s/p 6:00:18 } +2024-07-25 19:09:08,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 3/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 2.9999997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:08,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.43734 samples/s/p 5:58:33 } +2024-07-25 19:09:11,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 5/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 2.9999994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:11,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.43595 samples/s/p 5:58:36 } +2024-07-25 19:09:14,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 7/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.9999987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:14,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.0% |█████ | 5.43214 samples/s/p 5:58:48 } +2024-07-25 19:09:17,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 9/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 2.999998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:17,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43608 samples/s/p 5:58:29 } +2024-07-25 19:09:20,777 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 11/ 1625], loss: 1.291, per_step_time: 1473ms, lr: 2.9999967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:20,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.42960 samples/s/p 5:58:52 } +2024-07-25 19:09:23,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 13/ 1625], loss: 1.141, per_step_time: 1474ms, lr: 2.9999952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:23,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.42571 samples/s/p 5:59:04 } +2024-07-25 19:09:26,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 15/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.9999934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:26,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43534 samples/s/p 5:58:23 } +2024-07-25 19:09:29,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 17/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.9999912e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:29,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43444 samples/s/p 5:58:24 } +2024-07-25 19:09:32,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 19/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 2.999989e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:32,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43511 samples/s/p 5:58:18 } +2024-07-25 19:09:35,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 21/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 2.9999865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:35,536 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43474 samples/s/p 5:58:17 } +2024-07-25 19:09:38,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 23/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 2.9999837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:38,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.1% |█████ | 5.43913 samples/s/p 5:57:56 } +2024-07-25 19:09:41,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 25/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.9999806e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:41,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43775 samples/s/p 5:57:59 } +2024-07-25 19:09:44,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 27/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.9999774e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:44,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43653 samples/s/p 5:58:01 } +2024-07-25 19:09:47,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 29/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 2.9999737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:47,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43771 samples/s/p 5:57:53 } +2024-07-25 19:09:50,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 31/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 2.99997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:50,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43729 samples/s/p 5:57:52 } +2024-07-25 19:09:53,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], 
step:[ 33/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.9999657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:53,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43497 samples/s/p 5:57:58 } +2024-07-25 19:09:56,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 35/ 1625], loss: 1.368, per_step_time: 1471ms, lr: 2.9999612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:56,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43833 samples/s/p 5:57:42 } +2024-07-25 19:09:59,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 37/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.9999566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:09:59,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43813 samples/s/p 5:57:40 } +2024-07-25 19:10:02,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 39/ 1625], loss: 1.130, per_step_time: 1470ms, lr: 2.9999517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:02,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.2% |█████ | 5.43986 samples/s/p 5:57:30 } +2024-07-25 19:10:05,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 41/ 1625], loss: 1.074, per_step_time: 1470ms, lr: 2.9999464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:05,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.43928 samples/s/p 5:57:29 } +2024-07-25 19:10:07,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 43/ 1625], loss: 1.150, per_step_time: 1473ms, lr: 2.9999408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:07,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 
5.43021 samples/s/p 5:58:02 } +2024-07-25 19:10:10,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 45/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 2.9999354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:10,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.44013 samples/s/p 5:57:20 } +2024-07-25 19:10:13,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 47/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 2.999929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:13,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.43431 samples/s/p 5:57:40 } +2024-07-25 19:10:16,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 49/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.9999228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:16,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.43646 samples/s/p 5:57:29 } +2024-07-25 19:10:19,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 51/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 2.9999163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:19,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.43389 samples/s/p 5:57:36 } +2024-07-25 19:10:22,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 53/ 1625], loss: 1.074, per_step_time: 1474ms, lr: 2.9999095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:22,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.42454 samples/s/p 5:58:10 } +2024-07-25 19:10:25,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 55/ 1625], loss: 1.008, per_step_time: 1470ms, lr: 2.9999024e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 19:10:25,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.3% |█████ | 5.44186 samples/s/p 5:56:59 } +2024-07-25 19:10:28,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 57/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 2.999895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:28,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43313 samples/s/p 5:57:30 } +2024-07-25 19:10:31,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 59/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.9998875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:31,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43803 samples/s/p 5:57:08 } +2024-07-25 19:10:34,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 61/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 2.9998797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:34,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.42944 samples/s/p 5:57:39 } +2024-07-25 19:10:37,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 63/ 1625], loss: 1.290, per_step_time: 1472ms, lr: 2.9998713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:37,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43172 samples/s/p 5:57:27 } +2024-07-25 19:10:40,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 65/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 2.999863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:40,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.42972 samples/s/p 5:57:32 } +2024-07-25 19:10:43,404 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 67/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 2.9998542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:43,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43102 samples/s/p 5:57:24 } +2024-07-25 19:10:46,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 69/ 1625], loss: 1.280, per_step_time: 1473ms, lr: 2.9998453e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:46,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.42915 samples/s/p 5:57:28 } +2024-07-25 19:10:49,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 71/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.999836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:49,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43676 samples/s/p 5:56:55 } +2024-07-25 19:10:52,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 73/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.9998266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:52,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.4% |█████ | 5.43485 samples/s/p 5:57:00 } +2024-07-25 19:10:55,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 75/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 2.9998168e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:55,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43905 samples/s/p 5:56:40 } +2024-07-25 19:10:58,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 77/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.9998067e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:10:58,158 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43625 samples/s/p 5:56:48 } +2024-07-25 19:11:01,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 79/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 2.9997964e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:01,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43580 samples/s/p 5:56:47 } +2024-07-25 19:11:04,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 81/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.9997858e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:04,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43374 samples/s/p 5:56:52 } +2024-07-25 19:11:07,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 83/ 1625], loss: 1.178, per_step_time: 1474ms, lr: 2.999775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:07,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.42667 samples/s/p 5:57:17 } +2024-07-25 19:11:09,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 85/ 1625], loss: 1.437, per_step_time: 1471ms, lr: 2.9997638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:09,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43590 samples/s/p 5:56:38 } +2024-07-25 19:11:12,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 87/ 1625], loss: 1.165, per_step_time: 1474ms, lr: 2.9997524e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:12,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.42666 samples/s/p 5:57:11 } +2024-07-25 19:11:15,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], 
step:[ 89/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.9997409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:15,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.5% |█████ | 5.43652 samples/s/p 5:56:30 } +2024-07-25 19:11:18,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 91/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 2.9997289e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:18,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43360 samples/s/p 5:56:38 } +2024-07-25 19:11:21,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 93/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.9997167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:21,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43228 samples/s/p 5:56:40 } +2024-07-25 19:11:24,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 95/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 2.9997043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:24,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43148 samples/s/p 5:56:41 } +2024-07-25 19:11:27,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 97/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 2.9996916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:27,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43330 samples/s/p 5:56:31 } +2024-07-25 19:11:30,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 99/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 2.9996787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:30,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 
5.43049 samples/s/p 5:56:39 } +2024-07-25 19:11:33,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 101/ 1625], loss: 1.156, per_step_time: 1469ms, lr: 2.9996652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:33,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.44398 samples/s/p 5:55:43 } +2024-07-25 19:11:36,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 103/ 1625], loss: 1.168, per_step_time: 1473ms, lr: 2.9996518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:36,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43064 samples/s/p 5:56:32 } +2024-07-25 19:11:39,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 105/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 2.9996381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:39,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.6% |█████ | 5.43816 samples/s/p 5:56:00 } +2024-07-25 19:11:42,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 107/ 1625], loss: 1.100, per_step_time: 1474ms, lr: 2.9996241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:42,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.42401 samples/s/p 5:56:52 } +2024-07-25 19:11:45,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 109/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 2.9996096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:45,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43630 samples/s/p 5:56:01 } +2024-07-25 19:11:48,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 111/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 2.999595e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:48,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43547 samples/s/p 5:56:01 } +2024-07-25 19:11:51,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 113/ 1625], loss: 1.277, per_step_time: 1473ms, lr: 2.9995803e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:51,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43092 samples/s/p 5:56:16 } +2024-07-25 19:11:54,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 115/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 2.9995652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:54,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43563 samples/s/p 5:55:55 } +2024-07-25 19:11:57,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 117/ 1625], loss: 1.277, per_step_time: 1472ms, lr: 2.9995497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:11:57,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43457 samples/s/p 5:55:56 } +2024-07-25 19:12:00,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 119/ 1625], loss: 1.249, per_step_time: 1473ms, lr: 2.9995343e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:00,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.43050 samples/s/p 5:56:09 } +2024-07-25 19:12:03,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 121/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 2.9995184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:03,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.7% |█████ | 5.42958 samples/s/p 5:56:10 } +2024-07-25 19:12:06,054 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 123/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 2.999502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:06,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43119 samples/s/p 5:56:01 } +2024-07-25 19:12:09,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 125/ 1625], loss: 0.999, per_step_time: 1470ms, lr: 2.9994857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:09,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.44026 samples/s/p 5:55:22 } +2024-07-25 19:12:11,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 127/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 2.9994688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:11,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43469 samples/s/p 5:55:41 } +2024-07-25 19:12:14,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 129/ 1625], loss: 1.293, per_step_time: 1473ms, lr: 2.999452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:14,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.42985 samples/s/p 5:55:57 } +2024-07-25 19:12:17,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 131/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.9994346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:17,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43780 samples/s/p 5:55:23 } +2024-07-25 19:12:20,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 133/ 1625], loss: 1.331, per_step_time: 1471ms, lr: 2.9994171e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:12:20,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43775 samples/s/p 5:55:20 } +2024-07-25 19:12:23,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 135/ 1625], loss: 1.199, per_step_time: 1473ms, lr: 2.9993993e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:23,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.42794 samples/s/p 5:55:56 } +2024-07-25 19:12:26,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 137/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 2.9993813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:26,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.8% |█████ | 5.43172 samples/s/p 5:55:38 } +2024-07-25 19:12:29,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 139/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 2.9993627e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:29,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43184 samples/s/p 5:55:34 } +2024-07-25 19:12:32,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 141/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 2.9993444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:32,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43422 samples/s/p 5:55:22 } +2024-07-25 19:12:35,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 143/ 1625], loss: 1.100, per_step_time: 1473ms, lr: 2.9993254e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:35,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.42878 samples/s/p 5:55:41 } +2024-07-25 19:12:38,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 2/ 10], step:[ 145/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 2.9993065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:38,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43104 samples/s/p 5:55:29 } +2024-07-25 19:12:41,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 147/ 1625], loss: 1.284, per_step_time: 1469ms, lr: 2.9992867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:41,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.44263 samples/s/p 5:54:40 } +2024-07-25 19:12:44,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 149/ 1625], loss: 1.372, per_step_time: 1473ms, lr: 2.9992674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:44,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.42853 samples/s/p 5:55:33 } +2024-07-25 19:12:47,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 151/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 2.9992474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:47,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43506 samples/s/p 5:55:04 } +2024-07-25 19:12:50,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 153/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 2.9992269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:50,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 10.9% |█████ | 5.43266 samples/s/p 5:55:11 } +2024-07-25 19:12:53,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 155/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 2.9992065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:53,280 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 11.0% |█████ | 5.43324 samples/s/p 5:55:05 } +2024-07-25 19:12:56,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 157/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 2.9991857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:56,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43186 samples/s/p 5:55:08 } +2024-07-25 19:12:59,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 159/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 2.9991646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:12:59,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43316 samples/s/p 5:55:00 } +2024-07-25 19:13:02,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 161/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.9991435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:02,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43697 samples/s/p 5:54:42 } +2024-07-25 19:13:05,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 163/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 2.9991223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:05,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43354 samples/s/p 5:54:52 } +2024-07-25 19:13:08,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 165/ 1625], loss: 1.290, per_step_time: 1473ms, lr: 2.9991003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:08,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43061 samples/s/p 5:55:01 } +2024-07-25 19:13:10,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 167/ 1625], loss: 1.218, per_step_time: 
1472ms, lr: 2.999078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:10,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43293 samples/s/p 5:54:49 } +2024-07-25 19:13:13,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 169/ 1625], loss: 1.446, per_step_time: 1471ms, lr: 2.9990559e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:13,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.0% |█████ | 5.43835 samples/s/p 5:54:25 } +2024-07-25 19:13:16,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 171/ 1625], loss: 1.354, per_step_time: 1472ms, lr: 2.9990333e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:16,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.43223 samples/s/p 5:54:46 } +2024-07-25 19:13:19,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 173/ 1625], loss: 1.360, per_step_time: 1473ms, lr: 2.9990104e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:19,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.42992 samples/s/p 5:54:52 } +2024-07-25 19:13:22,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 175/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.9989871e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:22,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.43454 samples/s/p 5:54:31 } +2024-07-25 19:13:25,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 177/ 1625], loss: 0.964, per_step_time: 1474ms, lr: 2.9989636e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:25,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.42667 samples/s/p 5:54:59 } +2024-07-25 
19:13:28,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 179/ 1625], loss: 1.317, per_step_time: 1473ms, lr: 2.99894e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:28,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.42793 samples/s/p 5:54:51 } +2024-07-25 19:13:31,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 181/ 1625], loss: 1.043, per_step_time: 1471ms, lr: 2.9989162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:31,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.43770 samples/s/p 5:54:10 } +2024-07-25 19:13:34,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 183/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 2.998892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:34,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.44025 samples/s/p 5:53:57 } +2024-07-25 19:13:37,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 185/ 1625], loss: 1.213, per_step_time: 1473ms, lr: 2.9988674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:37,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.1% |█████ | 5.43072 samples/s/p 5:54:31 } +2024-07-25 19:13:40,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 187/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.9988425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:40,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43409 samples/s/p 5:54:15 } +2024-07-25 19:13:43,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 189/ 1625], loss: 1.393, per_step_time: 1473ms, lr: 2.9988176e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:13:43,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43078 samples/s/p 5:54:25 } +2024-07-25 19:13:46,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 191/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.9987923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:46,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43240 samples/s/p 5:54:16 } +2024-07-25 19:13:49,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 193/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 2.9987668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:49,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43347 samples/s/p 5:54:09 } +2024-07-25 19:13:52,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 195/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.9987412e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:52,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43184 samples/s/p 5:54:12 } +2024-07-25 19:13:55,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 197/ 1625], loss: 1.166, per_step_time: 1469ms, lr: 2.998715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:55,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.44285 samples/s/p 5:53:26 } +2024-07-25 19:13:58,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 199/ 1625], loss: 1.143, per_step_time: 1473ms, lr: 2.9986886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:13:58,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.42914 samples/s/p 5:54:17 } +2024-07-25 19:14:01,169 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 201/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 2.9986619e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:01,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43749 samples/s/p 5:53:41 } +2024-07-25 19:14:04,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 203/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.9986351e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:04,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.2% |█████ | 5.43271 samples/s/p 5:53:57 } +2024-07-25 19:14:07,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 205/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 2.9986079e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:07,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43733 samples/s/p 5:53:36 } +2024-07-25 19:14:10,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 207/ 1625], loss: 1.261, per_step_time: 1474ms, lr: 2.9985804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:10,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.42725 samples/s/p 5:54:12 } +2024-07-25 19:14:12,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 209/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.9985527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:12,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43198 samples/s/p 5:53:51 } +2024-07-25 19:14:15,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 211/ 1625], loss: 1.136, per_step_time: 1474ms, lr: 2.9985247e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:14:15,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.42613 samples/s/p 5:54:11 } +2024-07-25 19:14:18,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 213/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 2.9984965e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:18,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43528 samples/s/p 5:53:32 } +2024-07-25 19:14:21,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 215/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 2.9984682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:21,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43258 samples/s/p 5:53:40 } +2024-07-25 19:14:24,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 217/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 2.9984394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:24,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43778 samples/s/p 5:53:16 } +2024-07-25 19:14:27,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 219/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 2.9984103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:27,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.3% |█████ | 5.43027 samples/s/p 5:53:43 } +2024-07-25 19:14:30,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 221/ 1625], loss: 1.368, per_step_time: 1471ms, lr: 2.998381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:30,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43680 samples/s/p 5:53:14 } +2024-07-25 19:14:33,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 2/ 10], step:[ 223/ 1625], loss: 1.312, per_step_time: 1472ms, lr: 2.9983512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:33,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43269 samples/s/p 5:53:27 } +2024-07-25 19:14:36,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 225/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 2.9983215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:36,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43437 samples/s/p 5:53:18 } +2024-07-25 19:14:39,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 227/ 1625], loss: 1.310, per_step_time: 1472ms, lr: 2.9982915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:39,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43219 samples/s/p 5:53:23 } +2024-07-25 19:14:42,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 229/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 2.9982612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:42,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.43859 samples/s/p 5:52:56 } +2024-07-25 19:14:45,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 231/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 2.9982306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:45,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.42842 samples/s/p 5:53:32 } +2024-07-25 19:14:48,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 233/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 2.9981999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:48,401 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 11.4% |█████ | 5.43350 samples/s/p 5:53:10 } +2024-07-25 19:14:51,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 235/ 1625], loss: 1.063, per_step_time: 1473ms, lr: 2.9981686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:51,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.4% |█████ | 5.42821 samples/s/p 5:53:27 } +2024-07-25 19:14:54,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 237/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 2.998137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:54,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.43559 samples/s/p 5:52:55 } +2024-07-25 19:14:57,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 239/ 1625], loss: 1.256, per_step_time: 1470ms, lr: 2.9981054e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:14:57,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.44040 samples/s/p 5:52:34 } +2024-07-25 19:15:00,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 241/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 2.9980733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:00,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.43842 samples/s/p 5:52:39 } +2024-07-25 19:15:03,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 243/ 1625], loss: 1.040, per_step_time: 1474ms, lr: 2.9980412e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:03,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.42736 samples/s/p 5:53:19 } +2024-07-25 19:15:06,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 245/ 1625], loss: 1.279, per_step_time: 1473ms, 
lr: 2.9980087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:06,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.42751 samples/s/p 5:53:15 } +2024-07-25 19:15:09,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 247/ 1625], loss: 1.204, per_step_time: 1473ms, lr: 2.997976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:09,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.42752 samples/s/p 5:53:12 } +2024-07-25 19:15:12,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 249/ 1625], loss: 1.375, per_step_time: 1472ms, lr: 2.9979428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:12,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.43295 samples/s/p 5:52:48 } +2024-07-25 19:15:14,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 251/ 1625], loss: 1.068, per_step_time: 1472ms, lr: 2.9979094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:14,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.5% |█████ | 5.43316 samples/s/p 5:52:44 } +2024-07-25 19:15:17,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 253/ 1625], loss: 1.250, per_step_time: 1470ms, lr: 2.9978759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:17,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.44133 samples/s/p 5:52:10 } +2024-07-25 19:15:20,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 255/ 1625], loss: 1.137, per_step_time: 1470ms, lr: 2.997842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:20,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.44202 samples/s/p 5:52:04 } +2024-07-25 
19:15:23,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 257/ 1625], loss: 1.338, per_step_time: 1472ms, lr: 2.9978082e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:23,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43330 samples/s/p 5:52:35 } +2024-07-25 19:15:26,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 259/ 1625], loss: 0.979, per_step_time: 1471ms, lr: 2.9977735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:26,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43720 samples/s/p 5:52:17 } +2024-07-25 19:15:29,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 261/ 1625], loss: 1.060, per_step_time: 1470ms, lr: 2.997739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:29,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43920 samples/s/p 5:52:06 } +2024-07-25 19:15:32,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 263/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 2.997704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:32,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43956 samples/s/p 5:52:02 } +2024-07-25 19:15:35,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 265/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.9976689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:35,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43683 samples/s/p 5:52:09 } +2024-07-25 19:15:38,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 267/ 1625], loss: 1.371, per_step_time: 1471ms, lr: 2.9976336e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:15:38,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.6% |█████ | 5.43647 samples/s/p 5:52:08 } +2024-07-25 19:15:41,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 269/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 2.9975978e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:41,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43315 samples/s/p 5:52:18 } +2024-07-25 19:15:44,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 271/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 2.9975616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:44,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43787 samples/s/p 5:51:57 } +2024-07-25 19:15:47,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 273/ 1625], loss: 1.109, per_step_time: 1471ms, lr: 2.9975256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:47,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43729 samples/s/p 5:51:56 } +2024-07-25 19:15:50,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 275/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 2.997489e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:50,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43422 samples/s/p 5:52:05 } +2024-07-25 19:15:53,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 277/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 2.997452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:53,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43325 samples/s/p 5:52:06 } +2024-07-25 19:15:56,273 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 279/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 2.9974155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:56,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43247 samples/s/p 5:52:06 } +2024-07-25 19:15:59,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 281/ 1625], loss: 1.244, per_step_time: 1470ms, lr: 2.9973779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:15:59,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43975 samples/s/p 5:51:35 } +2024-07-25 19:16:02,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 283/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 2.9973404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:02,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.7% |█████ | 5.43538 samples/s/p 5:51:49 } +2024-07-25 19:16:05,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 285/ 1625], loss: 1.124, per_step_time: 1470ms, lr: 2.9973024e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:05,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.44073 samples/s/p 5:51:25 } +2024-07-25 19:16:08,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 287/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 2.9972643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:08,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43474 samples/s/p 5:51:45 } +2024-07-25 19:16:11,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 289/ 1625], loss: 1.221, per_step_time: 1473ms, lr: 2.997226e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:16:11,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.42867 samples/s/p 5:52:06 } +2024-07-25 19:16:13,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 291/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 2.9971872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:13,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43100 samples/s/p 5:51:54 } +2024-07-25 19:16:16,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 293/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.9971485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:16,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43227 samples/s/p 5:51:46 } +2024-07-25 19:16:19,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 295/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 2.9971094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:19,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43159 samples/s/p 5:51:46 } +2024-07-25 19:16:22,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 297/ 1625], loss: 0.980, per_step_time: 1471ms, lr: 2.9970697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:22,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43806 samples/s/p 5:51:18 } +2024-07-25 19:16:25,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 299/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 2.9970299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:25,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.8% |█████ | 5.43801 samples/s/p 5:51:15 } +2024-07-25 19:16:28,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 2/ 10], step:[ 301/ 1625], loss: 1.029, per_step_time: 1473ms, lr: 2.9969902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:28,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.43013 samples/s/p 5:51:43 } +2024-07-25 19:16:31,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 303/ 1625], loss: 1.262, per_step_time: 1474ms, lr: 2.99695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:31,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.42624 samples/s/p 5:51:55 } +2024-07-25 19:16:34,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 305/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.9969093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:34,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.43544 samples/s/p 5:51:16 } +2024-07-25 19:16:37,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 307/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 2.9968685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:37,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.43958 samples/s/p 5:50:57 } +2024-07-25 19:16:40,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 309/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 2.9968276e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:40,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.43347 samples/s/p 5:51:18 } +2024-07-25 19:16:43,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 311/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 2.9967863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:43,491 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 11.9% |█████ | 5.43837 samples/s/p 5:50:56 } +2024-07-25 19:16:46,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 313/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 2.9967445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:46,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.43123 samples/s/p 5:51:21 } +2024-07-25 19:16:49,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 315/ 1625], loss: 1.219, per_step_time: 1469ms, lr: 2.9967028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:49,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 11.9% |█████ | 5.44317 samples/s/p 5:50:31 } +2024-07-25 19:16:52,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 317/ 1625], loss: 1.065, per_step_time: 1473ms, lr: 2.9966604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:52,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.42866 samples/s/p 5:51:25 } +2024-07-25 19:16:55,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 319/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 2.9966182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:55,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.43409 samples/s/p 5:51:01 } +2024-07-25 19:16:58,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 321/ 1625], loss: 1.310, per_step_time: 1472ms, lr: 2.9965757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:16:58,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.43369 samples/s/p 5:50:59 } +2024-07-25 19:17:01,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 323/ 1625], loss: 1.159, per_step_time: 
1473ms, lr: 2.9965326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:01,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |█████ | 5.42933 samples/s/p 5:51:13 } +2024-07-25 19:17:04,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 325/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 2.9964896e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:04,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.44122 samples/s/p 5:50:24 } +2024-07-25 19:17:07,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 327/ 1625], loss: 1.159, per_step_time: 1474ms, lr: 2.996446e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:07,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.42713 samples/s/p 5:51:16 } +2024-07-25 19:17:10,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 329/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.9964021e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:10,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.43753 samples/s/p 5:50:33 } +2024-07-25 19:17:13,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 331/ 1625], loss: 0.962, per_step_time: 1472ms, lr: 2.9963583e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:13,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.43359 samples/s/p 5:50:45 } +2024-07-25 19:17:15,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 333/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 2.996314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:15,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.0% |██████ | 5.43473 samples/s/p 5:50:38 } 
+2024-07-25 19:17:18,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 335/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 2.9962694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:18,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43454 samples/s/p 5:50:35 } +2024-07-25 19:17:21,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 337/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 2.9962248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:21,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43096 samples/s/p 5:50:46 } +2024-07-25 19:17:24,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 339/ 1625], loss: 1.010, per_step_time: 1470ms, lr: 2.9961797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:24,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.44072 samples/s/p 5:50:06 } +2024-07-25 19:17:27,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 341/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 2.9961344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:27,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43989 samples/s/p 5:50:06 } +2024-07-25 19:17:30,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 343/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.9960887e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:30,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43333 samples/s/p 5:50:28 } +2024-07-25 19:17:33,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 345/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 2.9960429e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:17:33,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43742 samples/s/p 5:50:09 } +2024-07-25 19:17:36,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 347/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.9959969e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:36,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43276 samples/s/p 5:50:25 } +2024-07-25 19:17:39,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 349/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 2.9959503e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:39,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.1% |██████ | 5.43328 samples/s/p 5:50:20 } +2024-07-25 19:17:42,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 351/ 1625], loss: 1.294, per_step_time: 1470ms, lr: 2.9959036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:42,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43876 samples/s/p 5:49:55 } +2024-07-25 19:17:45,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 353/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.995857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:45,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43348 samples/s/p 5:50:13 } +2024-07-25 19:17:48,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 355/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 2.9958097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:48,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43521 samples/s/p 5:50:03 } +2024-07-25 19:17:51,363 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 357/ 1625], loss: 1.099, per_step_time: 1470ms, lr: 2.9957622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:51,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43944 samples/s/p 5:49:44 } +2024-07-25 19:17:54,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 359/ 1625], loss: 1.313, per_step_time: 1472ms, lr: 2.9957146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:54,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43111 samples/s/p 5:50:13 } +2024-07-25 19:17:57,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 361/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.9956665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:17:57,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43715 samples/s/p 5:49:47 } +2024-07-25 19:18:00,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 363/ 1625], loss: 1.339, per_step_time: 1471ms, lr: 2.9956182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:00,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43481 samples/s/p 5:49:53 } +2024-07-25 19:18:03,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 365/ 1625], loss: 1.378, per_step_time: 1472ms, lr: 2.9955698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:03,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.2% |██████ | 5.43185 samples/s/p 5:50:02 } +2024-07-25 19:18:06,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 367/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.995521e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:18:06,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43657 samples/s/p 5:49:40 } +2024-07-25 19:18:09,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 369/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.995472e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:09,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43282 samples/s/p 5:49:52 } +2024-07-25 19:18:12,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 371/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 2.9954224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:12,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43281 samples/s/p 5:49:49 } +2024-07-25 19:18:14,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 373/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 2.9953728e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:14,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43236 samples/s/p 5:49:48 } +2024-07-25 19:18:17,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 375/ 1625], loss: 1.020, per_step_time: 1473ms, lr: 2.995323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:17,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43066 samples/s/p 5:49:51 } +2024-07-25 19:18:20,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 377/ 1625], loss: 1.340, per_step_time: 1472ms, lr: 2.9952727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:20,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43240 samples/s/p 5:49:42 } +2024-07-25 19:18:23,832 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 379/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 2.9952223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:23,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.43144 samples/s/p 5:49:43 } +2024-07-25 19:18:26,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 381/ 1625], loss: 1.076, per_step_time: 1469ms, lr: 2.9951718e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:26,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.3% |██████ | 5.44352 samples/s/p 5:48:53 } +2024-07-25 19:18:29,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 383/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 2.995121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:29,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.43485 samples/s/p 5:49:23 } +2024-07-25 19:18:32,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 385/ 1625], loss: 1.209, per_step_time: 1473ms, lr: 2.9950697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:32,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.42901 samples/s/p 5:49:43 } +2024-07-25 19:18:35,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 387/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 2.9950183e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:35,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.43784 samples/s/p 5:49:06 } +2024-07-25 19:18:38,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 389/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 2.9949666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:38,586 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.43157 samples/s/p 5:49:27 } +2024-07-25 19:18:41,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 391/ 1625], loss: 0.983, per_step_time: 1472ms, lr: 2.9949146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:41,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.43170 samples/s/p 5:49:24 } +2024-07-25 19:18:44,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 393/ 1625], loss: 1.274, per_step_time: 1473ms, lr: 2.9948624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:44,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.42804 samples/s/p 5:49:35 } +2024-07-25 19:18:47,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 395/ 1625], loss: 1.141, per_step_time: 1470ms, lr: 2.9948098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:47,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.44173 samples/s/p 5:48:39 } +2024-07-25 19:18:50,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 397/ 1625], loss: 1.052, per_step_time: 1473ms, lr: 2.9947569e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:50,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.4% |██████ | 5.42814 samples/s/p 5:49:29 } +2024-07-25 19:18:53,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 399/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.9947041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:53,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43518 samples/s/p 5:48:59 } +2024-07-25 19:18:56,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 2/ 10], step:[ 401/ 1625], loss: 1.027, per_step_time: 1471ms, lr: 2.9946505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:56,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43570 samples/s/p 5:48:54 } +2024-07-25 19:18:59,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 403/ 1625], loss: 1.221, per_step_time: 1470ms, lr: 2.994597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:18:59,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43981 samples/s/p 5:48:35 } +2024-07-25 19:19:02,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 405/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.994543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:02,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.42750 samples/s/p 5:49:19 } +2024-07-25 19:19:05,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 407/ 1625], loss: 1.243, per_step_time: 1470ms, lr: 2.994489e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:05,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43872 samples/s/p 5:48:33 } +2024-07-25 19:19:08,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 409/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 2.9944347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:08,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43324 samples/s/p 5:48:51 } +2024-07-25 19:19:11,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 411/ 1625], loss: 1.018, per_step_time: 1470ms, lr: 2.9943802e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:11,048 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 12.5% |██████ | 5.44042 samples/s/p 5:48:21 } +2024-07-25 19:19:13,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 413/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 2.9943252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:14,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.5% |██████ | 5.43301 samples/s/p 5:48:46 } +2024-07-25 19:19:16,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 415/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 2.9942697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:16,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.43679 samples/s/p 5:48:29 } +2024-07-25 19:19:19,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 417/ 1625], loss: 0.937, per_step_time: 1471ms, lr: 2.994214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:19,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.43573 samples/s/p 5:48:30 } +2024-07-25 19:19:22,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 419/ 1625], loss: 1.222, per_step_time: 1474ms, lr: 2.9941586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:22,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.42614 samples/s/p 5:49:04 } +2024-07-25 19:19:25,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 421/ 1625], loss: 1.013, per_step_time: 1470ms, lr: 2.9941026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:25,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.43929 samples/s/p 5:48:10 } +2024-07-25 19:19:28,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 423/ 1625], loss: 1.266, per_step_time: 
1469ms, lr: 2.9940466e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:28,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.44512 samples/s/p 5:47:45 } +2024-07-25 19:19:31,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 425/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.9939898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:31,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.43673 samples/s/p 5:48:14 } +2024-07-25 19:19:34,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 427/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 2.9939329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:34,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.42876 samples/s/p 5:48:42 } +2024-07-25 19:19:37,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 429/ 1625], loss: 1.238, per_step_time: 1473ms, lr: 2.9938761e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:37,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.6% |██████ | 5.42957 samples/s/p 5:48:36 } +2024-07-25 19:19:40,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 431/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 2.9938186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:40,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43443 samples/s/p 5:48:14 } +2024-07-25 19:19:43,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 433/ 1625], loss: 1.165, per_step_time: 1470ms, lr: 2.9937613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:43,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43992 samples/s/p 5:47:50 } 
+2024-07-25 19:19:46,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 435/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 2.9937031e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:46,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43257 samples/s/p 5:48:16 } +2024-07-25 19:19:49,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 437/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.9936451e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:49,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43591 samples/s/p 5:48:00 } +2024-07-25 19:19:52,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 439/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 2.9935867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:52,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43568 samples/s/p 5:47:58 } +2024-07-25 19:19:55,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 441/ 1625], loss: 1.141, per_step_time: 1469ms, lr: 2.993528e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:55,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.44235 samples/s/p 5:47:29 } +2024-07-25 19:19:58,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 443/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 2.9934692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:19:58,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43346 samples/s/p 5:48:00 } +2024-07-25 19:20:01,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 445/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 2.9934099e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:20:01,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.7% |██████ | 5.43404 samples/s/p 5:47:55 } +2024-07-25 19:20:04,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 447/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 2.9933506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:04,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43143 samples/s/p 5:48:02 } +2024-07-25 19:20:07,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 449/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 2.9932908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:07,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43349 samples/s/p 5:47:52 } +2024-07-25 19:20:10,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 451/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 2.9932306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:10,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43320 samples/s/p 5:47:50 } +2024-07-25 19:20:13,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 453/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.9931705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:13,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43109 samples/s/p 5:47:55 } +2024-07-25 19:20:15,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 455/ 1625], loss: 1.181, per_step_time: 1473ms, lr: 2.99311e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:15,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43039 samples/s/p 5:47:55 } +2024-07-25 19:20:18,923 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 457/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 2.9930492e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:18,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43663 samples/s/p 5:47:28 } +2024-07-25 19:20:21,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 459/ 1625], loss: 1.205, per_step_time: 1473ms, lr: 2.992988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:21,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.43086 samples/s/p 5:47:47 } +2024-07-25 19:20:24,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 461/ 1625], loss: 1.073, per_step_time: 1474ms, lr: 2.9929268e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:24,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.42530 samples/s/p 5:48:05 } +2024-07-25 19:20:27,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 463/ 1625], loss: 1.391, per_step_time: 1470ms, lr: 2.9928653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:27,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.8% |██████ | 5.44005 samples/s/p 5:47:06 } +2024-07-25 19:20:30,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 465/ 1625], loss: 1.084, per_step_time: 1473ms, lr: 2.9928033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:30,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43020 samples/s/p 5:47:41 } +2024-07-25 19:20:33,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 467/ 1625], loss: 1.345, per_step_time: 1472ms, lr: 2.9927412e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:20:33,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43296 samples/s/p 5:47:27 } +2024-07-25 19:20:36,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 469/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.9926789e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:36,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43519 samples/s/p 5:47:16 } +2024-07-25 19:20:39,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 471/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 2.9926163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:39,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43477 samples/s/p 5:47:14 } +2024-07-25 19:20:42,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 473/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 2.9925533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:42,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43778 samples/s/p 5:47:00 } +2024-07-25 19:20:45,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 475/ 1625], loss: 1.206, per_step_time: 1469ms, lr: 2.99249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:45,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.44493 samples/s/p 5:46:29 } +2024-07-25 19:20:48,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 477/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.9924267e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:48,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43761 samples/s/p 5:46:55 } +2024-07-25 19:20:51,383 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 479/ 1625], loss: 1.109, per_step_time: 1471ms, lr: 2.9923629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:51,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 12.9% |██████ | 5.43661 samples/s/p 5:46:55 } +2024-07-25 19:20:54,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 481/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 2.9922989e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:54,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43298 samples/s/p 5:47:06 } +2024-07-25 19:20:57,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 483/ 1625], loss: 1.255, per_step_time: 1472ms, lr: 2.9922347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:20:57,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43394 samples/s/p 5:47:00 } +2024-07-25 19:21:00,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 485/ 1625], loss: 1.120, per_step_time: 1470ms, lr: 2.9921703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:00,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.44050 samples/s/p 5:46:32 } +2024-07-25 19:21:03,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 487/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 2.9921053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:03,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43098 samples/s/p 5:47:05 } +2024-07-25 19:21:06,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 489/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 2.9920404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:06,141 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43146 samples/s/p 5:47:00 } +2024-07-25 19:21:09,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 491/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 2.991975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:09,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43463 samples/s/p 5:46:45 } +2024-07-25 19:21:12,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 493/ 1625], loss: 1.121, per_step_time: 1469ms, lr: 2.9919096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:12,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.44287 samples/s/p 5:46:11 } +2024-07-25 19:21:14,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 495/ 1625], loss: 1.365, per_step_time: 1473ms, lr: 2.9918436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:14,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.0% |██████ | 5.43060 samples/s/p 5:46:55 } +2024-07-25 19:21:17,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 497/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 2.9917775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:17,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43832 samples/s/p 5:46:22 } +2024-07-25 19:21:20,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 499/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 2.9917113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:20,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43561 samples/s/p 5:46:30 } +2024-07-25 19:21:23,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
2/ 10], step:[ 501/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 2.9916446e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:23,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43732 samples/s/p 5:46:20 } +2024-07-25 19:21:26,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 503/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 2.9915775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:26,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43330 samples/s/p 5:46:33 } +2024-07-25 19:21:29,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 505/ 1625], loss: 1.269, per_step_time: 1471ms, lr: 2.9915103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:29,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43647 samples/s/p 5:46:18 } +2024-07-25 19:21:32,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 507/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 2.991443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:32,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43011 samples/s/p 5:46:39 } +2024-07-25 19:21:35,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 509/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.9913752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:35,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.1% |██████ | 5.43707 samples/s/p 5:46:10 } +2024-07-25 19:21:38,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 511/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.9913072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:38,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
13.1% |██████ | 5.43586 samples/s/p 5:46:11 } +2024-07-25 19:21:41,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 513/ 1625], loss: 1.351, per_step_time: 1472ms, lr: 2.991239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:41,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43447 samples/s/p 5:46:14 } +2024-07-25 19:21:44,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 515/ 1625], loss: 1.298, per_step_time: 1471ms, lr: 2.9911704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:44,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43785 samples/s/p 5:45:58 } +2024-07-25 19:21:47,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 517/ 1625], loss: 1.050, per_step_time: 1473ms, lr: 2.9911018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:47,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.42895 samples/s/p 5:46:29 } +2024-07-25 19:21:50,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 519/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.9910327e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:50,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43514 samples/s/p 5:46:02 } +2024-07-25 19:21:53,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 521/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 2.9909634e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:53,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43210 samples/s/p 5:46:11 } +2024-07-25 19:21:56,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 523/ 1625], loss: 1.229, per_step_time: 1473ms, 
lr: 2.9908939e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:56,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43087 samples/s/p 5:46:13 } +2024-07-25 19:21:59,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 525/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.9908242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:21:59,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43588 samples/s/p 5:45:51 } +2024-07-25 19:22:02,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 527/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 2.9907538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:02,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.2% |██████ | 5.43992 samples/s/p 5:45:32 } +2024-07-25 19:22:05,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 529/ 1625], loss: 1.207, per_step_time: 1473ms, lr: 2.9906834e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:05,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43089 samples/s/p 5:46:04 } +2024-07-25 19:22:08,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 531/ 1625], loss: 1.259, per_step_time: 1472ms, lr: 2.9906128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:08,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43417 samples/s/p 5:45:48 } +2024-07-25 19:22:11,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 533/ 1625], loss: 1.311, per_step_time: 1473ms, lr: 2.990542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:11,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.42930 samples/s/p 5:46:04 } +2024-07-25 
19:22:14,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 535/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 2.9904708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:14,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43193 samples/s/p 5:45:51 } +2024-07-25 19:22:16,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 537/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 2.9903993e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:16,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43642 samples/s/p 5:45:31 } +2024-07-25 19:22:19,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 539/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 2.9903278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:19,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43283 samples/s/p 5:45:42 } +2024-07-25 19:22:22,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 541/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 2.9902556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:22,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43262 samples/s/p 5:45:39 } +2024-07-25 19:22:25,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 543/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 2.9901834e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:25,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.3% |██████ | 5.43464 samples/s/p 5:45:29 } +2024-07-25 19:22:28,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 545/ 1625], loss: 1.101, per_step_time: 1470ms, lr: 2.990111e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:22:28,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.44105 samples/s/p 5:45:01 } +2024-07-25 19:22:31,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 547/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 2.990038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:31,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43139 samples/s/p 5:45:35 } +2024-07-25 19:22:34,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 549/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 2.9899651e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:34,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43441 samples/s/p 5:45:21 } +2024-07-25 19:22:37,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 551/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 2.9898918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:37,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43062 samples/s/p 5:45:32 } +2024-07-25 19:22:40,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 553/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 2.9898185e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:40,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43833 samples/s/p 5:45:00 } +2024-07-25 19:22:43,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 555/ 1625], loss: 1.062, per_step_time: 1470ms, lr: 2.9897445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:43,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.44016 samples/s/p 5:44:50 } +2024-07-25 19:22:46,478 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 557/ 1625], loss: 1.245, per_step_time: 1473ms, lr: 2.9896704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:46,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.43087 samples/s/p 5:45:23 } +2024-07-25 19:22:49,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 559/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 2.9895962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:49,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.4% |██████ | 5.42763 samples/s/p 5:45:32 } +2024-07-25 19:22:52,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 561/ 1625], loss: 1.331, per_step_time: 1471ms, lr: 2.9895215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:52,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43753 samples/s/p 5:44:51 } +2024-07-25 19:22:55,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 563/ 1625], loss: 1.104, per_step_time: 1470ms, lr: 2.9894465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:55,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.44023 samples/s/p 5:44:38 } +2024-07-25 19:22:58,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 565/ 1625], loss: 1.060, per_step_time: 1473ms, lr: 2.9893716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:22:58,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43069 samples/s/p 5:45:11 } +2024-07-25 19:23:01,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 567/ 1625], loss: 1.273, per_step_time: 1471ms, lr: 2.9892959e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:23:01,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43532 samples/s/p 5:44:51 } +2024-07-25 19:23:04,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 569/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 2.9892202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:04,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43594 samples/s/p 5:44:46 } +2024-07-25 19:23:07,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 571/ 1625], loss: 0.978, per_step_time: 1472ms, lr: 2.9891444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:07,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43469 samples/s/p 5:44:47 } +2024-07-25 19:23:10,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 573/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 2.9890682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:10,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43942 samples/s/p 5:44:26 } +2024-07-25 19:23:13,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 575/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 2.9889916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:13,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.5% |██████ | 5.43354 samples/s/p 5:44:46 } +2024-07-25 19:23:15,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 577/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 2.9889148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:15,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43169 samples/s/p 5:44:50 } +2024-07-25 19:23:18,938 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 579/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 2.9888379e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:18,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43898 samples/s/p 5:44:19 } +2024-07-25 19:23:21,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 581/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.9887606e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:21,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43405 samples/s/p 5:44:35 } +2024-07-25 19:23:24,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 583/ 1625], loss: 1.335, per_step_time: 1472ms, lr: 2.988683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:24,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43389 samples/s/p 5:44:33 } +2024-07-25 19:23:27,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 585/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 2.9886052e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:27,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43722 samples/s/p 5:44:17 } +2024-07-25 19:23:30,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 587/ 1625], loss: 1.113, per_step_time: 1473ms, lr: 2.9885274e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:30,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.42991 samples/s/p 5:44:42 } +2024-07-25 19:23:33,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 589/ 1625], loss: 1.420, per_step_time: 1472ms, lr: 2.9884488e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:33,696 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43394 samples/s/p 5:44:24 } +2024-07-25 19:23:36,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 591/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 2.9883704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:36,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.43152 samples/s/p 5:44:30 } +2024-07-25 19:23:39,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 593/ 1625], loss: 1.284, per_step_time: 1473ms, lr: 2.988291e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:39,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.6% |██████ | 5.42877 samples/s/p 5:44:37 } +2024-07-25 19:23:42,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 595/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 2.988212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:42,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43713 samples/s/p 5:44:03 } +2024-07-25 19:23:45,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 597/ 1625], loss: 1.282, per_step_time: 1473ms, lr: 2.9881328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:45,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43092 samples/s/p 5:44:23 } +2024-07-25 19:23:48,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 599/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 2.9880532e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:48,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43937 samples/s/p 5:43:48 } +2024-07-25 19:23:51,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
2/ 10], step:[ 601/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 2.9879731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:51,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43495 samples/s/p 5:44:02 } +2024-07-25 19:23:54,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 603/ 1625], loss: 1.055, per_step_time: 1471ms, lr: 2.9878931e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:54,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43486 samples/s/p 5:44:00 } +2024-07-25 19:23:57,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 605/ 1625], loss: 1.333, per_step_time: 1472ms, lr: 2.9878125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:23:57,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43388 samples/s/p 5:44:00 } +2024-07-25 19:24:00,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 607/ 1625], loss: 1.182, per_step_time: 1473ms, lr: 2.9877318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:00,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.42980 samples/s/p 5:44:13 } +2024-07-25 19:24:03,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 609/ 1625], loss: 1.312, per_step_time: 1472ms, lr: 2.987651e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:03,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.7% |██████ | 5.43226 samples/s/p 5:44:01 } +2024-07-25 19:24:06,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 611/ 1625], loss: 1.324, per_step_time: 1473ms, lr: 2.9875695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:06,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
13.8% |██████ | 5.43046 samples/s/p 5:44:05 } +2024-07-25 19:24:09,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 613/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 2.9874882e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:09,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43649 samples/s/p 5:43:39 } +2024-07-25 19:24:12,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 615/ 1625], loss: 1.271, per_step_time: 1474ms, lr: 2.9874062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:12,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.42677 samples/s/p 5:44:13 } +2024-07-25 19:24:15,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 617/ 1625], loss: 1.331, per_step_time: 1471ms, lr: 2.9873243e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:15,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43537 samples/s/p 5:43:37 } +2024-07-25 19:24:17,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 619/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 2.9872419e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:17,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43598 samples/s/p 5:43:32 } +2024-07-25 19:24:20,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 621/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 2.9871593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:20,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43562 samples/s/p 5:43:30 } +2024-07-25 19:24:23,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 623/ 1625], loss: 1.162, per_step_time: 1472ms, 
lr: 2.9870764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:23,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43289 samples/s/p 5:43:38 } +2024-07-25 19:24:26,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 625/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 2.9869934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:26,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.8% |██████ | 5.43231 samples/s/p 5:43:37 } +2024-07-25 19:24:29,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 627/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.9869097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:29,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43310 samples/s/p 5:43:31 } +2024-07-25 19:24:32,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 629/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.986826e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:32,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43442 samples/s/p 5:43:23 } +2024-07-25 19:24:35,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 631/ 1625], loss: 1.349, per_step_time: 1473ms, lr: 2.9867424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:35,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.42950 samples/s/p 5:43:39 } +2024-07-25 19:24:38,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 633/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.986658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:38,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43637 samples/s/p 5:43:10 } +2024-07-25 
19:24:41,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 635/ 1625], loss: 1.105, per_step_time: 1470ms, lr: 2.9865738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:41,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43899 samples/s/p 5:42:57 } +2024-07-25 19:24:44,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 637/ 1625], loss: 1.286, per_step_time: 1471ms, lr: 2.986489e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:44,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.43724 samples/s/p 5:43:01 } +2024-07-25 19:24:47,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 639/ 1625], loss: 1.244, per_step_time: 1470ms, lr: 2.9864039e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:47,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.44063 samples/s/p 5:42:45 } +2024-07-25 19:24:50,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 641/ 1625], loss: 1.287, per_step_time: 1474ms, lr: 2.9863188e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:50,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 13.9% |██████ | 5.42410 samples/s/p 5:43:44 } +2024-07-25 19:24:53,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 643/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.9862333e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:53,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.43349 samples/s/p 5:43:06 } +2024-07-25 19:24:56,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 645/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.9861474e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:24:56,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.43527 samples/s/p 5:42:56 } +2024-07-25 19:24:59,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 647/ 1625], loss: 1.180, per_step_time: 1470ms, lr: 2.9860614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:24:59,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.44205 samples/s/p 5:42:28 } +2024-07-25 19:25:02,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 649/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 2.9859752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:02,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |██████ | 5.43568 samples/s/p 5:42:49 } +2024-07-25 19:25:05,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 651/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.9858886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:05,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.43501 samples/s/p 5:42:48 } +2024-07-25 19:25:08,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 653/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 2.9858018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:08,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.43397 samples/s/p 5:42:49 } +2024-07-25 19:25:11,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 655/ 1625], loss: 1.277, per_step_time: 1470ms, lr: 2.9857147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:11,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.43866 samples/s/p 5:42:29 } +2024-07-25 19:25:14,051 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 657/ 1625], loss: 1.191, per_step_time: 1475ms, lr: 2.9856272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:14,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.0% |███████ | 5.42039 samples/s/p 5:43:35 } +2024-07-25 19:25:17,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 659/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.9855397e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:17,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43547 samples/s/p 5:42:35 } +2024-07-25 19:25:19,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 661/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 2.9854516e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:19,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43301 samples/s/p 5:42:41 } +2024-07-25 19:25:22,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 663/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 2.9853638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:22,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.42815 samples/s/p 5:42:57 } +2024-07-25 19:25:25,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 665/ 1625], loss: 1.203, per_step_time: 1473ms, lr: 2.9852752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:25,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.42973 samples/s/p 5:42:48 } +2024-07-25 19:25:28,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 667/ 1625], loss: 1.036, per_step_time: 1471ms, lr: 2.9851866e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:25:28,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43606 samples/s/p 5:42:21 } +2024-07-25 19:25:31,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 669/ 1625], loss: 1.163, per_step_time: 1473ms, lr: 2.9850975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:31,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43109 samples/s/p 5:42:37 } +2024-07-25 19:25:34,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 671/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 2.9850084e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:34,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43717 samples/s/p 5:42:11 } +2024-07-25 19:25:37,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 673/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.984919e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:37,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.1% |███████ | 5.43342 samples/s/p 5:42:22 } +2024-07-25 19:25:40,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 675/ 1625], loss: 1.031, per_step_time: 1472ms, lr: 2.9848292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:40,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43393 samples/s/p 5:42:17 } +2024-07-25 19:25:43,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 677/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 2.984739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:43,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43110 samples/s/p 5:42:25 } +2024-07-25 19:25:46,522 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 679/ 1625], loss: 1.279, per_step_time: 1472ms, lr: 2.9846487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:46,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43469 samples/s/p 5:42:08 } +2024-07-25 19:25:49,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 681/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 2.9845582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:49,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.42863 samples/s/p 5:42:28 } +2024-07-25 19:25:52,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 683/ 1625], loss: 1.056, per_step_time: 1473ms, lr: 2.9844676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:52,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43106 samples/s/p 5:42:16 } +2024-07-25 19:25:55,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 685/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 2.9843766e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:55,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43785 samples/s/p 5:41:48 } +2024-07-25 19:25:58,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 687/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 2.9842851e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:25:58,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43782 samples/s/p 5:41:45 } +2024-07-25 19:26:01,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 689/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 2.9841935e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:26:01,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.2% |███████ | 5.43230 samples/s/p 5:42:03 } +2024-07-25 19:26:04,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 691/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 2.9841016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:04,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43044 samples/s/p 5:42:07 } +2024-07-25 19:26:07,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 693/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 2.9840096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:07,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43492 samples/s/p 5:41:47 } +2024-07-25 19:26:10,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 695/ 1625], loss: 1.242, per_step_time: 1473ms, lr: 2.9839173e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:10,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.42797 samples/s/p 5:42:10 } +2024-07-25 19:26:13,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 697/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 2.9838244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:13,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43246 samples/s/p 5:41:50 } +2024-07-25 19:26:16,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 699/ 1625], loss: 1.255, per_step_time: 1473ms, lr: 2.9837316e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:16,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.42886 samples/s/p 5:42:01 } +2024-07-25 19:26:18,995 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 701/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 2.9836385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:18,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43694 samples/s/p 5:41:27 } +2024-07-25 19:26:21,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 703/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 2.9835448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:21,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.44055 samples/s/p 5:41:11 } +2024-07-25 19:26:24,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 705/ 1625], loss: 1.054, per_step_time: 1472ms, lr: 2.9834513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:24,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.3% |███████ | 5.43375 samples/s/p 5:41:34 } +2024-07-25 19:26:27,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 707/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 2.9833573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:27,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43263 samples/s/p 5:41:35 } +2024-07-25 19:26:30,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 709/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 2.9832629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:30,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43045 samples/s/p 5:41:40 } +2024-07-25 19:26:33,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 711/ 1625], loss: 1.205, per_step_time: 1473ms, lr: 2.9831685e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:26:33,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43108 samples/s/p 5:41:35 } +2024-07-25 19:26:36,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 713/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.9830737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:36,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43477 samples/s/p 5:41:18 } +2024-07-25 19:26:39,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 715/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 2.9829787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:39,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43535 samples/s/p 5:41:13 } +2024-07-25 19:26:42,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 717/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 2.9828832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:42,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43323 samples/s/p 5:41:18 } +2024-07-25 19:26:45,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 719/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 2.982788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:45,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43447 samples/s/p 5:41:10 } +2024-07-25 19:26:48,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 721/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.982692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:48,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43221 samples/s/p 5:41:16 } +2024-07-25 19:26:51,464 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 723/ 1625], loss: 1.023, per_step_time: 1472ms, lr: 2.982596e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:51,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.4% |███████ | 5.43167 samples/s/p 5:41:15 } +2024-07-25 19:26:54,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 725/ 1625], loss: 1.047, per_step_time: 1472ms, lr: 2.9824996e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:54,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43172 samples/s/p 5:41:12 } +2024-07-25 19:26:57,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 727/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 2.9824028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:26:57,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43185 samples/s/p 5:41:08 } +2024-07-25 19:27:00,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 729/ 1625], loss: 1.359, per_step_time: 1474ms, lr: 2.9823059e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:00,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.42679 samples/s/p 5:41:25 } +2024-07-25 19:27:03,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 731/ 1625], loss: 1.351, per_step_time: 1471ms, lr: 2.9822088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:03,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43516 samples/s/p 5:40:50 } +2024-07-25 19:27:06,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 733/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.9821114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:27:06,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43286 samples/s/p 5:40:56 } +2024-07-25 19:27:09,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 735/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 2.9820138e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:09,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43784 samples/s/p 5:40:34 } +2024-07-25 19:27:12,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 737/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 2.9819159e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:12,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.43449 samples/s/p 5:40:44 } +2024-07-25 19:27:15,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 739/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 2.9818177e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:15,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.5% |███████ | 5.42936 samples/s/p 5:41:00 } +2024-07-25 19:27:18,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 741/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.9817189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:18,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.43184 samples/s/p 5:40:48 } +2024-07-25 19:27:20,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 743/ 1625], loss: 1.389, per_step_time: 1472ms, lr: 2.9816205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:20,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.43155 samples/s/p 5:40:46 } +2024-07-25 19:27:23,935 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 745/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 2.9815214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:23,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.44135 samples/s/p 5:40:06 } +2024-07-25 19:27:26,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 747/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.9814222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:26,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.43286 samples/s/p 5:40:35 } +2024-07-25 19:27:29,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 749/ 1625], loss: 1.235, per_step_time: 1474ms, lr: 2.9813224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:29,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.42716 samples/s/p 5:40:54 } +2024-07-25 19:27:32,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 751/ 1625], loss: 1.108, per_step_time: 1474ms, lr: 2.9812229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:32,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.42428 samples/s/p 5:41:02 } +2024-07-25 19:27:35,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 753/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.9811226e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:35,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.43238 samples/s/p 5:40:28 } +2024-07-25 19:27:38,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 755/ 1625], loss: 1.218, per_step_time: 1482ms, lr: 2.9810224e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:27:38,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.6% |███████ | 5.39807 samples/s/p 5:42:35 } +2024-07-25 19:27:41,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 757/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 2.9809218e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:41,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43317 samples/s/p 5:40:19 } +2024-07-25 19:27:44,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 759/ 1625], loss: 1.345, per_step_time: 1473ms, lr: 2.9808209e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:44,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.42977 samples/s/p 5:40:29 } +2024-07-25 19:27:47,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 761/ 1625], loss: 1.106, per_step_time: 1473ms, lr: 2.98072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:47,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43090 samples/s/p 5:40:22 } +2024-07-25 19:27:50,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 763/ 1625], loss: 1.238, per_step_time: 1473ms, lr: 2.9806186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:50,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.42942 samples/s/p 5:40:25 } +2024-07-25 19:27:53,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 765/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 2.9805167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:53,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43539 samples/s/p 5:39:59 } +2024-07-25 19:27:56,439 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 767/ 1625], loss: 1.042, per_step_time: 1472ms, lr: 2.9804149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:56,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43303 samples/s/p 5:40:05 } +2024-07-25 19:27:59,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 769/ 1625], loss: 1.125, per_step_time: 1473ms, lr: 2.9803128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:27:59,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.42792 samples/s/p 5:40:21 } +2024-07-25 19:28:02,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 771/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 2.9802102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:02,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.7% |███████ | 5.43210 samples/s/p 5:40:03 } +2024-07-25 19:28:05,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 773/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 2.9801076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:05,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.43436 samples/s/p 5:39:51 } +2024-07-25 19:28:08,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 775/ 1625], loss: 1.220, per_step_time: 1469ms, lr: 2.9800045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:08,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.44230 samples/s/p 5:39:19 } +2024-07-25 19:28:11,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 777/ 1625], loss: 1.292, per_step_time: 1474ms, lr: 2.9799015e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:28:11,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.42696 samples/s/p 5:40:13 } +2024-07-25 19:28:14,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 779/ 1625], loss: 1.054, per_step_time: 1470ms, lr: 2.9797979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:14,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.43948 samples/s/p 5:39:23 } +2024-07-25 19:28:17,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 781/ 1625], loss: 1.144, per_step_time: 1472ms, lr: 2.9796942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:17,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.43458 samples/s/p 5:39:39 } +2024-07-25 19:28:20,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 783/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 2.9795901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:20,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.42966 samples/s/p 5:39:54 } +2024-07-25 19:28:23,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 785/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 2.9794859e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:23,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.43488 samples/s/p 5:39:32 } +2024-07-25 19:28:25,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 787/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.9793813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:25,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.8% |███████ | 5.42794 samples/s/p 5:39:55 } +2024-07-25 19:28:28,910 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 789/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 2.9792765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:28,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43680 samples/s/p 5:39:19 } +2024-07-25 19:28:31,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 791/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 2.9791714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:31,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43233 samples/s/p 5:39:32 } +2024-07-25 19:28:34,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 793/ 1625], loss: 0.885, per_step_time: 1469ms, lr: 2.979066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:34,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.44272 samples/s/p 5:38:51 } +2024-07-25 19:28:37,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 795/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 2.9789604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:37,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43631 samples/s/p 5:39:12 } +2024-07-25 19:28:40,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 797/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 2.9788547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:40,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43500 samples/s/p 5:39:14 } +2024-07-25 19:28:43,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 799/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 2.9787485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:28:43,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43455 samples/s/p 5:39:12 } +2024-07-25 19:28:46,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 801/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 2.978642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:46,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43369 samples/s/p 5:39:13 } +2024-07-25 19:28:49,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 803/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 2.9785355e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:49,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 14.9% |███████ | 5.43849 samples/s/p 5:38:52 } +2024-07-25 19:28:52,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 805/ 1625], loss: 1.279, per_step_time: 1471ms, lr: 2.9784285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:52,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43741 samples/s/p 5:38:53 } +2024-07-25 19:28:55,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 807/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 2.9783214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:55,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43667 samples/s/p 5:38:53 } +2024-07-25 19:28:58,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 809/ 1625], loss: 1.312, per_step_time: 1472ms, lr: 2.9782139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:28:58,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43348 samples/s/p 5:39:02 } +2024-07-25 19:29:01,363 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 811/ 1625], loss: 1.009, per_step_time: 1471ms, lr: 2.9781062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:01,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43784 samples/s/p 5:38:42 } +2024-07-25 19:29:04,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 813/ 1625], loss: 1.174, per_step_time: 1473ms, lr: 2.9779982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:04,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.42866 samples/s/p 5:39:14 } +2024-07-25 19:29:07,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 815/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.97789e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:07,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43516 samples/s/p 5:38:46 } +2024-07-25 19:29:10,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 817/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 2.9777813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:10,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43167 samples/s/p 5:38:57 } +2024-07-25 19:29:13,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 819/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 2.9776727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:13,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.0% |███████ | 5.43395 samples/s/p 5:38:45 } +2024-07-25 19:29:16,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 821/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 2.9775636e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:29:16,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43410 samples/s/p 5:38:42 } +2024-07-25 19:29:19,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 823/ 1625], loss: 1.268, per_step_time: 1471ms, lr: 2.9774543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:19,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43835 samples/s/p 5:38:23 } +2024-07-25 19:29:22,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 825/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 2.9773448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:22,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.44099 samples/s/p 5:38:10 } +2024-07-25 19:29:24,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 827/ 1625], loss: 1.146, per_step_time: 1477ms, lr: 2.977235e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:24,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.41559 samples/s/p 5:39:42 } +2024-07-25 19:29:27,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 829/ 1625], loss: 1.279, per_step_time: 1470ms, lr: 2.9771249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:27,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43962 samples/s/p 5:38:09 } +2024-07-25 19:29:30,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 831/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 2.9770146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:30,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43558 samples/s/p 5:38:21 } +2024-07-25 19:29:33,835 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 833/ 1625], loss: 1.014, per_step_time: 1473ms, lr: 2.9769039e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:33,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43039 samples/s/p 5:38:38 } +2024-07-25 19:29:36,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 835/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 2.9767929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:36,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.1% |███████ | 5.43784 samples/s/p 5:38:07 } +2024-07-25 19:29:39,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 837/ 1625], loss: 1.070, per_step_time: 1473ms, lr: 2.976682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:39,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.42976 samples/s/p 5:38:34 } +2024-07-25 19:29:42,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 839/ 1625], loss: 1.367, per_step_time: 1471ms, lr: 2.9765704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:42,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43579 samples/s/p 5:38:09 } +2024-07-25 19:29:45,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 841/ 1625], loss: 0.965, per_step_time: 1472ms, lr: 2.9764587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:45,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43253 samples/s/p 5:38:18 } +2024-07-25 19:29:48,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 843/ 1625], loss: 1.341, per_step_time: 1470ms, lr: 2.976347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:29:48,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43941 samples/s/p 5:37:49 } +2024-07-25 19:29:51,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 845/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 2.9762348e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:51,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43016 samples/s/p 5:38:21 } +2024-07-25 19:29:54,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 847/ 1625], loss: 1.444, per_step_time: 1471ms, lr: 2.9761222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:54,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43497 samples/s/p 5:38:00 } +2024-07-25 19:29:57,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 849/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 2.9760096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:29:57,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43309 samples/s/p 5:38:04 } +2024-07-25 19:30:00,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 851/ 1625], loss: 1.169, per_step_time: 1472ms, lr: 2.9758965e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:00,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.43148 samples/s/p 5:38:07 } +2024-07-25 19:30:03,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 853/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 2.9757832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:03,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.2% |███████ | 5.42936 samples/s/p 5:38:12 } +2024-07-25 19:30:06,303 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 855/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 2.9756698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:06,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43615 samples/s/p 5:37:44 } +2024-07-25 19:30:09,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 857/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.975556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:09,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43422 samples/s/p 5:37:48 } +2024-07-25 19:30:12,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 859/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.975442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:12,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43561 samples/s/p 5:37:40 } +2024-07-25 19:30:15,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 861/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 2.9753279e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:15,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43530 samples/s/p 5:37:38 } +2024-07-25 19:30:18,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 863/ 1625], loss: 1.096, per_step_time: 1473ms, lr: 2.9752133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:18,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.42806 samples/s/p 5:38:02 } +2024-07-25 19:30:21,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 865/ 1625], loss: 1.202, per_step_time: 1474ms, lr: 2.9750983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:30:21,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.42550 samples/s/p 5:38:09 } +2024-07-25 19:30:24,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 867/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 2.9749832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:24,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43687 samples/s/p 5:37:23 } +2024-07-25 19:30:26,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 869/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 2.9748679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:26,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.3% |███████ | 5.43516 samples/s/p 5:37:27 } +2024-07-25 19:30:29,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 871/ 1625], loss: 1.134, per_step_time: 1469ms, lr: 2.9747522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:29,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.44262 samples/s/p 5:36:56 } +2024-07-25 19:30:32,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 873/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 2.9746365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:32,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43607 samples/s/p 5:37:18 } +2024-07-25 19:30:35,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 875/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 2.9745202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:35,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43761 samples/s/p 5:37:09 } +2024-07-25 19:30:38,765 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 877/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 2.9744038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:38,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43488 samples/s/p 5:37:16 } +2024-07-25 19:30:41,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 879/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.9742872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:41,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43340 samples/s/p 5:37:19 } +2024-07-25 19:30:44,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 881/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 2.9741705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:44,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43705 samples/s/p 5:37:02 } +2024-07-25 19:30:47,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 883/ 1625], loss: 1.387, per_step_time: 1471ms, lr: 2.9740533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:47,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.43662 samples/s/p 5:37:01 } +2024-07-25 19:30:50,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 885/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 2.9739356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:50,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.4% |███████ | 5.44139 samples/s/p 5:36:40 } +2024-07-25 19:30:53,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 887/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.9738178e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:30:53,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.43448 samples/s/p 5:37:03 } +2024-07-25 19:30:56,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 889/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 2.9736999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:56,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.43804 samples/s/p 5:36:47 } +2024-07-25 19:30:59,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 891/ 1625], loss: 1.335, per_step_time: 1473ms, lr: 2.9735816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:30:59,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.42880 samples/s/p 5:37:18 } +2024-07-25 19:31:02,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 893/ 1625], loss: 1.258, per_step_time: 1474ms, lr: 2.973463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:02,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.42698 samples/s/p 5:37:22 } +2024-07-25 19:31:05,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 895/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 2.9733445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:05,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.43839 samples/s/p 5:36:37 } +2024-07-25 19:31:08,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 897/ 1625], loss: 1.307, per_step_time: 1470ms, lr: 2.9732257e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:08,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.44038 samples/s/p 5:36:26 } +2024-07-25 19:31:11,224 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 899/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 2.973106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:11,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.43131 samples/s/p 5:36:57 } +2024-07-25 19:31:14,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 901/ 1625], loss: 1.169, per_step_time: 1473ms, lr: 2.9729865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:14,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.5% |███████ | 5.42888 samples/s/p 5:37:03 } +2024-07-25 19:31:17,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 903/ 1625], loss: 1.041, per_step_time: 1472ms, lr: 2.9728668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:17,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43463 samples/s/p 5:36:39 } +2024-07-25 19:31:20,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 905/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 2.9727466e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:20,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43606 samples/s/p 5:36:31 } +2024-07-25 19:31:23,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 907/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.9726263e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:23,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43607 samples/s/p 5:36:28 } +2024-07-25 19:31:25,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 909/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.9725057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
19:31:25,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43276 samples/s/p 5:36:37 } +2024-07-25 19:31:28,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 911/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 2.972385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:28,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43889 samples/s/p 5:36:11 } +2024-07-25 19:31:31,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 913/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.9722638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:31,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43541 samples/s/p 5:36:21 } +2024-07-25 19:31:34,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 915/ 1625], loss: 1.150, per_step_time: 1473ms, lr: 2.9721425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:34,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.42911 samples/s/p 5:36:42 } +2024-07-25 19:31:37,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 917/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 2.9720208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:37,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.6% |███████ | 5.43730 samples/s/p 5:36:08 } +2024-07-25 19:31:40,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 919/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 2.9718987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:40,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.44149 samples/s/p 5:35:50 } +2024-07-25 19:31:43,683 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 921/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 2.9717767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:43,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43608 samples/s/p 5:36:07 } +2024-07-25 19:31:46,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 923/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.9716544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:46,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43414 samples/s/p 5:36:11 } +2024-07-25 19:31:49,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 925/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 2.9715315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:49,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43067 samples/s/p 5:36:21 } +2024-07-25 19:31:52,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 927/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.9714083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:52,539 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43614 samples/s/p 5:35:58 } +2024-07-25 19:31:55,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 929/ 1625], loss: 1.329, per_step_time: 1472ms, lr: 2.9712852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:31:55,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43358 samples/s/p 5:36:04 } +2024-07-25 19:31:58,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 931/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 2.9711617e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:31:58,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.43367 samples/s/p 5:36:01 } +2024-07-25 19:32:01,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 933/ 1625], loss: 1.436, per_step_time: 1473ms, lr: 2.971038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:01,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.7% |███████ | 5.42753 samples/s/p 5:36:21 } +2024-07-25 19:32:04,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 935/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 2.9709141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:04,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.42973 samples/s/p 5:36:10 } +2024-07-25 19:32:07,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 937/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 2.9707897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:07,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43647 samples/s/p 5:35:42 } +2024-07-25 19:32:10,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 939/ 1625], loss: 1.044, per_step_time: 1481ms, lr: 2.9706653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:10,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.40044 samples/s/p 5:37:53 } +2024-07-25 19:32:13,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 941/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.9705405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:13,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43807 samples/s/p 5:35:30 } +2024-07-25 19:32:16,171 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 943/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 2.9704153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:16,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43276 samples/s/p 5:35:47 } +2024-07-25 19:32:19,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 945/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.9702898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:19,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43544 samples/s/p 5:35:34 } +2024-07-25 19:32:22,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 947/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 2.9701643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:22,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43775 samples/s/p 5:35:23 } +2024-07-25 19:32:25,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 949/ 1625], loss: 0.999, per_step_time: 1472ms, lr: 2.9700386e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:25,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.8% |███████ | 5.43455 samples/s/p 5:35:31 } +2024-07-25 19:32:27,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 951/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.9699124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:27,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43154 samples/s/p 5:35:40 } +2024-07-25 19:32:30,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 953/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 2.9697861e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:32:30,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43512 samples/s/p 5:35:23 } +2024-07-25 19:32:33,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 955/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 2.9696595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:33,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.42842 samples/s/p 5:35:45 } +2024-07-25 19:32:36,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 957/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 2.9695326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:36,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.42913 samples/s/p 5:35:40 } +2024-07-25 19:32:39,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 959/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 2.9694054e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:39,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43187 samples/s/p 5:35:27 } +2024-07-25 19:32:42,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 961/ 1625], loss: 1.044, per_step_time: 1473ms, lr: 2.969278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:42,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.43061 samples/s/p 5:35:28 } +2024-07-25 19:32:45,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 963/ 1625], loss: 1.204, per_step_time: 1473ms, lr: 2.9691504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:45,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.42992 samples/s/p 5:35:28 } +2024-07-25 19:32:48,669 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 965/ 1625], loss: 1.397, per_step_time: 1483ms, lr: 2.9690224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:48,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 15.9% |███████ | 5.39155 samples/s/p 5:37:48 } +2024-07-25 19:32:51,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 967/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.9688941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:51,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.43504 samples/s/p 5:35:03 } +2024-07-25 19:32:54,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 969/ 1625], loss: 0.999, per_step_time: 1471ms, lr: 2.9687657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:54,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.43519 samples/s/p 5:35:00 } +2024-07-25 19:32:57,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 971/ 1625], loss: 1.005, per_step_time: 1472ms, lr: 2.9686367e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:32:57,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.43272 samples/s/p 5:35:06 } +2024-07-25 19:33:00,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 973/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.9685078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:00,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |███████ | 5.43307 samples/s/p 5:35:02 } +2024-07-25 19:33:03,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 975/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 2.9683788e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:33:03,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.43815 samples/s/p 5:34:40 } +2024-07-25 19:33:06,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 977/ 1625], loss: 1.140, per_step_time: 1474ms, lr: 2.9682491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:06,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.42617 samples/s/p 5:35:21 } +2024-07-25 19:33:09,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 979/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 2.9681194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:09,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.43805 samples/s/p 5:34:34 } +2024-07-25 19:33:12,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 981/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 2.9679892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:12,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.43787 samples/s/p 5:34:32 } +2024-07-25 19:33:15,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 983/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.967859e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:15,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.0% |████████ | 5.43145 samples/s/p 5:34:53 } +2024-07-25 19:33:18,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 985/ 1625], loss: 0.980, per_step_time: 1472ms, lr: 2.9677285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:18,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43260 samples/s/p 5:34:46 } +2024-07-25 19:33:21,134 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 987/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 2.9675975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:21,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43307 samples/s/p 5:34:41 } +2024-07-25 19:33:24,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 989/ 1625], loss: 1.337, per_step_time: 1472ms, lr: 2.9674666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:24,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43219 samples/s/p 5:34:41 } +2024-07-25 19:33:27,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 991/ 1625], loss: 1.347, per_step_time: 1471ms, lr: 2.967335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:27,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43743 samples/s/p 5:34:19 } +2024-07-25 19:33:29,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 993/ 1625], loss: 1.390, per_step_time: 1472ms, lr: 2.9672035e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:29,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43407 samples/s/p 5:34:28 } +2024-07-25 19:33:32,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 995/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 2.9670717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:32,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43855 samples/s/p 5:34:09 } +2024-07-25 19:33:35,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 997/ 1625], loss: 1.206, per_step_time: 1472ms, lr: 2.9669396e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:33:35,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43332 samples/s/p 5:34:25 } +2024-07-25 19:33:38,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 999/ 1625], loss: 1.359, per_step_time: 1471ms, lr: 2.9668072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:38,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.1% |████████ | 5.43696 samples/s/p 5:34:09 } +2024-07-25 19:33:41,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1001/ 1625], loss: 0.931, per_step_time: 1471ms, lr: 2.9666744e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:41,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43618 samples/s/p 5:34:09 } +2024-07-25 19:33:44,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1003/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.9665418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:44,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43499 samples/s/p 5:34:10 } +2024-07-25 19:33:47,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1005/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 2.9664083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:47,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43070 samples/s/p 5:34:23 } +2024-07-25 19:33:50,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1007/ 1625], loss: 1.099, per_step_time: 1469ms, lr: 2.966275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:50,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.44242 samples/s/p 5:33:37 } +2024-07-25 19:33:53,591 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1009/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.9661414e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:53,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43540 samples/s/p 5:34:00 } +2024-07-25 19:33:56,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1011/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.9660072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:56,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43556 samples/s/p 5:33:56 } +2024-07-25 19:33:59,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1013/ 1625], loss: 1.163, per_step_time: 1473ms, lr: 2.9658731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:33:59,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.42935 samples/s/p 5:34:16 } +2024-07-25 19:34:02,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1015/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 2.9657387e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:02,448 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.2% |████████ | 5.43291 samples/s/p 5:34:00 } +2024-07-25 19:34:05,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1017/ 1625], loss: 1.266, per_step_time: 1473ms, lr: 2.9656037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:05,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.42843 samples/s/p 5:34:14 } +2024-07-25 19:34:08,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1019/ 1625], loss: 1.044, per_step_time: 1470ms, lr: 2.9654688e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:34:08,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43960 samples/s/p 5:33:30 } +2024-07-25 19:34:11,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1021/ 1625], loss: 1.207, per_step_time: 1473ms, lr: 2.9653334e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:11,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43081 samples/s/p 5:33:59 } +2024-07-25 19:34:14,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1023/ 1625], loss: 1.089, per_step_time: 1473ms, lr: 2.9651981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:14,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43096 samples/s/p 5:33:56 } +2024-07-25 19:34:17,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1025/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.965062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:17,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43433 samples/s/p 5:33:40 } +2024-07-25 19:34:20,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1027/ 1625], loss: 1.127, per_step_time: 1473ms, lr: 2.964926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:20,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43012 samples/s/p 5:33:53 } +2024-07-25 19:34:23,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1029/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 2.9647897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:23,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43406 samples/s/p 5:33:35 } +2024-07-25 19:34:26,066 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1031/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.9646533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:26,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.3% |████████ | 5.43247 samples/s/p 5:33:38 } +2024-07-25 19:34:29,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1033/ 1625], loss: 1.294, per_step_time: 1472ms, lr: 2.9645162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:29,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43257 samples/s/p 5:33:35 } +2024-07-25 19:34:31,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1035/ 1625], loss: 1.417, per_step_time: 1473ms, lr: 2.9643794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:31,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43014 samples/s/p 5:33:41 } +2024-07-25 19:34:34,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1037/ 1625], loss: 1.258, per_step_time: 1471ms, lr: 2.964242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:34,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43494 samples/s/p 5:33:20 } +2024-07-25 19:34:37,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1039/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 2.9641044e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:37,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43171 samples/s/p 5:33:29 } +2024-07-25 19:34:40,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1041/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.9639665e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:34:40,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43265 samples/s/p 5:33:23 } +2024-07-25 19:34:43,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1043/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 2.9638284e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:43,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43520 samples/s/p 5:33:11 } +2024-07-25 19:34:46,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1045/ 1625], loss: 1.303, per_step_time: 1473ms, lr: 2.96369e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:46,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.42952 samples/s/p 5:33:29 } +2024-07-25 19:34:49,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1047/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 2.9635514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:49,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.4% |████████ | 5.43446 samples/s/p 5:33:07 } +2024-07-25 19:34:52,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1049/ 1625], loss: 0.921, per_step_time: 1471ms, lr: 2.9634124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:52,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43824 samples/s/p 5:32:51 } +2024-07-25 19:34:55,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1051/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 2.963273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:55,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43404 samples/s/p 5:33:03 } +2024-07-25 19:34:58,533 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1053/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 2.9631337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:34:58,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43696 samples/s/p 5:32:49 } +2024-07-25 19:35:01,481 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1055/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 2.962994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:01,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.44087 samples/s/p 5:32:32 } +2024-07-25 19:35:04,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1057/ 1625], loss: 1.247, per_step_time: 1470ms, lr: 2.962854e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:04,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.44011 samples/s/p 5:32:32 } +2024-07-25 19:35:07,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1059/ 1625], loss: 1.292, per_step_time: 1471ms, lr: 2.9627137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:07,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43551 samples/s/p 5:32:46 } +2024-07-25 19:35:10,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1061/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 2.9625733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:10,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43161 samples/s/p 5:32:57 } +2024-07-25 19:35:13,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1063/ 1625], loss: 1.144, per_step_time: 1470ms, lr: 2.9624325e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:35:13,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.5% |████████ | 5.43866 samples/s/p 5:32:29 } +2024-07-25 19:35:16,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1065/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 2.9622914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:16,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43221 samples/s/p 5:32:49 } +2024-07-25 19:35:19,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1067/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 2.9621502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:19,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43400 samples/s/p 5:32:40 } +2024-07-25 19:35:22,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1069/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.9620089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:22,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43350 samples/s/p 5:32:39 } +2024-07-25 19:35:25,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1071/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.961867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:25,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43595 samples/s/p 5:32:27 } +2024-07-25 19:35:28,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1073/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.961725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:28,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43566 samples/s/p 5:32:25 } +2024-07-25 19:35:30,991 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1075/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.9615825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:30,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.43320 samples/s/p 5:32:31 } +2024-07-25 19:35:33,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1077/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 2.9614399e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:33,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.44202 samples/s/p 5:31:56 } +2024-07-25 19:35:36,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1079/ 1625], loss: 1.244, per_step_time: 1475ms, lr: 2.961297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:36,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.6% |████████ | 5.42166 samples/s/p 5:33:07 } +2024-07-25 19:35:39,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1081/ 1625], loss: 1.100, per_step_time: 1473ms, lr: 2.9611541e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:39,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.42996 samples/s/p 5:32:34 } +2024-07-25 19:35:42,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1083/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.9610108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:42,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43604 samples/s/p 5:32:09 } +2024-07-25 19:35:45,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1085/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 2.960867e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:35:45,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43301 samples/s/p 5:32:17 } +2024-07-25 19:35:48,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1087/ 1625], loss: 1.018, per_step_time: 1471ms, lr: 2.9607232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:48,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43845 samples/s/p 5:31:54 } +2024-07-25 19:35:51,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1089/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 2.960579e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:51,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43707 samples/s/p 5:31:56 } +2024-07-25 19:35:54,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1091/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 2.9604347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:54,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43425 samples/s/p 5:32:04 } +2024-07-25 19:35:57,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1093/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 2.96029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:35:57,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.42875 samples/s/p 5:32:21 } +2024-07-25 19:36:00,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1095/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 2.9601451e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:00,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.7% |████████ | 5.43188 samples/s/p 5:32:06 } +2024-07-25 19:36:03,462 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1097/ 1625], loss: 1.317, per_step_time: 1472ms, lr: 2.96e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:03,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43396 samples/s/p 5:31:56 } +2024-07-25 19:36:06,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1099/ 1625], loss: 1.249, per_step_time: 1474ms, lr: 2.9598543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:06,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.42581 samples/s/p 5:32:23 } +2024-07-25 19:36:09,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1101/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 2.9597088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:09,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43995 samples/s/p 5:31:28 } +2024-07-25 19:36:12,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1103/ 1625], loss: 1.110, per_step_time: 1473ms, lr: 2.9595627e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:12,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.42806 samples/s/p 5:32:09 } +2024-07-25 19:36:15,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1105/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 2.9594165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:15,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43552 samples/s/p 5:31:38 } +2024-07-25 19:36:18,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1107/ 1625], loss: 1.286, per_step_time: 1473ms, lr: 2.9592702e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:36:18,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43076 samples/s/p 5:31:53 } +2024-07-25 19:36:21,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1109/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 2.9591232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:21,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.42967 samples/s/p 5:31:54 } +2024-07-25 19:36:24,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1111/ 1625], loss: 1.093, per_step_time: 1473ms, lr: 2.9589763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:24,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.43020 samples/s/p 5:31:49 } +2024-07-25 19:36:27,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1113/ 1625], loss: 1.123, per_step_time: 1473ms, lr: 2.958829e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:27,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.8% |████████ | 5.42958 samples/s/p 5:31:48 } +2024-07-25 19:36:30,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1115/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 2.9586816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:30,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43868 samples/s/p 5:31:12 } +2024-07-25 19:36:32,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1117/ 1625], loss: 1.110, per_step_time: 1473ms, lr: 2.9585337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:32,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43094 samples/s/p 5:31:37 } +2024-07-25 19:36:35,940 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1119/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 2.9583858e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:35,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43320 samples/s/p 5:31:26 } +2024-07-25 19:36:38,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1121/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.9582376e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:38,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43353 samples/s/p 5:31:22 } +2024-07-25 19:36:41,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1123/ 1625], loss: 1.430, per_step_time: 1471ms, lr: 2.9580888e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:41,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43548 samples/s/p 5:31:12 } +2024-07-25 19:36:44,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1125/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 2.95794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:44,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.43528 samples/s/p 5:31:10 } +2024-07-25 19:36:47,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1127/ 1625], loss: 1.177, per_step_time: 1469ms, lr: 2.9577908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:47,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.44479 samples/s/p 5:30:32 } +2024-07-25 19:36:50,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1129/ 1625], loss: 1.096, per_step_time: 1473ms, lr: 2.9576418e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:36:50,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 16.9% |████████ | 5.42992 samples/s/p 5:31:23 } +2024-07-25 19:36:53,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1131/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 2.9574921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:53,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43469 samples/s/p 5:31:03 } +2024-07-25 19:36:56,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1133/ 1625], loss: 1.323, per_step_time: 1473ms, lr: 2.957342e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:56,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43052 samples/s/p 5:31:15 } +2024-07-25 19:36:59,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1135/ 1625], loss: 1.307, per_step_time: 1471ms, lr: 2.957192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:36:59,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43647 samples/s/p 5:30:51 } +2024-07-25 19:37:02,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1137/ 1625], loss: 1.078, per_step_time: 1470ms, lr: 2.9570418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:02,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43954 samples/s/p 5:30:36 } +2024-07-25 19:37:05,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1139/ 1625], loss: 1.414, per_step_time: 1472ms, lr: 2.9568911e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:05,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43452 samples/s/p 5:30:52 } +2024-07-25 19:37:08,397 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1141/ 1625], loss: 1.430, per_step_time: 1472ms, lr: 2.9567402e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:08,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43303 samples/s/p 5:30:54 } +2024-07-25 19:37:11,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1143/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 2.9565892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:11,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.43561 samples/s/p 5:30:42 } +2024-07-25 19:37:14,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1145/ 1625], loss: 1.254, per_step_time: 1470ms, lr: 2.9564375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:14,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.0% |████████ | 5.44043 samples/s/p 5:30:21 } +2024-07-25 19:37:17,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1147/ 1625], loss: 1.299, per_step_time: 1471ms, lr: 2.956286e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:17,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43568 samples/s/p 5:30:36 } +2024-07-25 19:37:20,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1149/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 2.9561339e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:20,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.42850 samples/s/p 5:30:59 } +2024-07-25 19:37:23,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1151/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 2.9559818e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:37:23,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43403 samples/s/p 5:30:36 } +2024-07-25 19:37:26,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1153/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 2.9558292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:26,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.42965 samples/s/p 5:30:49 } +2024-07-25 19:37:29,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1155/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 2.9556764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:29,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43475 samples/s/p 5:30:27 } +2024-07-25 19:37:32,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1157/ 1625], loss: 1.392, per_step_time: 1473ms, lr: 2.9555236e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:32,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.42998 samples/s/p 5:30:42 } +2024-07-25 19:37:34,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1159/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 2.9553703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:34,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.43766 samples/s/p 5:30:11 } +2024-07-25 19:37:37,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1161/ 1625], loss: 1.114, per_step_time: 1473ms, lr: 2.955217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:37,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.1% |████████ | 5.42925 samples/s/p 5:30:39 } +2024-07-25 19:37:40,862 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1163/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 2.9550632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:40,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.44204 samples/s/p 5:29:49 } +2024-07-25 19:37:43,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1165/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 2.954909e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:43,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.42896 samples/s/p 5:30:34 } +2024-07-25 19:37:46,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1167/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.954755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:46,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43390 samples/s/p 5:30:13 } +2024-07-25 19:37:49,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1169/ 1625], loss: 1.284, per_step_time: 1471ms, lr: 2.9546003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:49,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43540 samples/s/p 5:30:04 } +2024-07-25 19:37:52,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1171/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 2.9544455e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:52,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43430 samples/s/p 5:30:06 } +2024-07-25 19:37:55,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1173/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 2.9542905e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:37:55,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43447 samples/s/p 5:30:02 } +2024-07-25 19:37:58,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1175/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 2.954135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:37:58,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43456 samples/s/p 5:29:59 } +2024-07-25 19:37:58,573 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-25 19:38:34,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1177/ 1625], loss: 1.273, per_step_time: 1470ms, lr: 2.9539795e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:34,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.2% |████████ | 5.43894 samples/s/p 5:29:40 } +2024-07-25 19:38:37,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1179/ 1625], loss: 1.146, per_step_time: 1478ms, lr: 2.9538238e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:37,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.41155 samples/s/p 5:31:17 } +2024-07-25 19:38:40,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1181/ 1625], loss: 1.283, per_step_time: 1472ms, lr: 2.9536677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:40,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43237 samples/s/p 5:29:58 } +2024-07-25 19:38:43,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1183/ 1625], loss: 1.303, per_step_time: 1475ms, lr: 2.9535113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:43,063 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.42266 samples/s/p 5:30:30 } +2024-07-25 19:38:46,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1185/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 2.9533547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:46,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43236 samples/s/p 5:29:52 } +2024-07-25 19:38:48,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1187/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 2.9531979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:48,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43268 samples/s/p 5:29:48 } +2024-07-25 19:38:51,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1189/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.9530409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:51,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43811 samples/s/p 5:29:25 } +2024-07-25 19:38:54,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1191/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 2.9528832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:54,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.43707 samples/s/p 5:29:26 } +2024-07-25 19:38:57,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1193/ 1625], loss: 1.278, per_step_time: 1473ms, lr: 2.9527255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:38:57,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.3% |████████ | 5.42748 samples/s/p 5:29:58 } +2024-07-25 19:39:00,776 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 2/ 10], step:[ 1195/ 1625], loss: 1.164, per_step_time: 1473ms, lr: 2.952568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:00,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.42977 samples/s/p 5:29:47 } +2024-07-25 19:39:03,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1197/ 1625], loss: 1.303, per_step_time: 1472ms, lr: 2.9524095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:03,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.43275 samples/s/p 5:29:33 } +2024-07-25 19:39:06,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1199/ 1625], loss: 1.061, per_step_time: 1473ms, lr: 2.9522513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:06,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.43019 samples/s/p 5:29:39 } +2024-07-25 19:39:09,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1201/ 1625], loss: 1.146, per_step_time: 1475ms, lr: 2.9520925e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:09,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.42296 samples/s/p 5:30:03 } +2024-07-25 19:39:12,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1203/ 1625], loss: 1.131, per_step_time: 1470ms, lr: 2.9519335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:12,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.44113 samples/s/p 5:28:54 } +2024-07-25 19:39:15,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1205/ 1625], loss: 1.057, per_step_time: 1473ms, lr: 2.9517743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:15,542 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.42899 samples/s/p 5:29:35 } +2024-07-25 19:39:18,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1207/ 1625], loss: 1.056, per_step_time: 1473ms, lr: 2.951615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:18,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.42870 samples/s/p 5:29:33 } +2024-07-25 19:39:21,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1209/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 2.9514551e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:21,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.4% |████████ | 5.43011 samples/s/p 5:29:25 } +2024-07-25 19:39:24,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1211/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 2.9512954e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:24,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43461 samples/s/p 5:29:06 } +2024-07-25 19:39:27,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1213/ 1625], loss: 1.049, per_step_time: 1472ms, lr: 2.951135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:27,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43369 samples/s/p 5:29:06 } +2024-07-25 19:39:30,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1215/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 2.9509745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:30,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43715 samples/s/p 5:28:50 } +2024-07-25 19:39:33,254 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 1217/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.9508139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:33,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43453 samples/s/p 5:28:57 } +2024-07-25 19:39:36,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1219/ 1625], loss: 1.112, per_step_time: 1474ms, lr: 2.950653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:36,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.42604 samples/s/p 5:29:25 } +2024-07-25 19:39:39,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1221/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 2.9504916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:39,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.42935 samples/s/p 5:29:10 } +2024-07-25 19:39:42,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1223/ 1625], loss: 1.106, per_step_time: 1474ms, lr: 2.95033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:42,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.42551 samples/s/p 5:29:21 } +2024-07-25 19:39:45,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1225/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 2.9501683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:45,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.5% |████████ | 5.43403 samples/s/p 5:28:47 } +2024-07-25 19:39:48,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1227/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 2.9500063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:48,033 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.42757 samples/s/p 5:29:08 } +2024-07-25 19:39:50,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1229/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.9498437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:50,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.43279 samples/s/p 5:28:46 } +2024-07-25 19:39:53,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1231/ 1625], loss: 1.151, per_step_time: 1473ms, lr: 2.9496812e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:53,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.43029 samples/s/p 5:28:52 } +2024-07-25 19:39:56,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1233/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.9495186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:56,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.43363 samples/s/p 5:28:37 } +2024-07-25 19:39:59,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1235/ 1625], loss: 1.037, per_step_time: 1474ms, lr: 2.9493556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:39:59,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.42590 samples/s/p 5:29:02 } +2024-07-25 19:40:02,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1237/ 1625], loss: 1.073, per_step_time: 1474ms, lr: 2.9491921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:02,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.42715 samples/s/p 5:28:54 } +2024-07-25 19:40:05,784 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 2/ 10], step:[ 1239/ 1625], loss: 1.031, per_step_time: 1487ms, lr: 2.9490286e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:05,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.37949 samples/s/p 5:31:46 } +2024-07-25 19:40:08,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1241/ 1625], loss: 1.136, per_step_time: 1473ms, lr: 2.9488647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:08,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.42789 samples/s/p 5:28:46 } +2024-07-25 19:40:11,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1243/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 2.9487004e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:11,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.6% |████████ | 5.43621 samples/s/p 5:28:13 } +2024-07-25 19:40:14,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1245/ 1625], loss: 1.206, per_step_time: 1474ms, lr: 2.9485363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:14,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42534 samples/s/p 5:28:49 } +2024-07-25 19:40:17,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1247/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 2.9483715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:17,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42831 samples/s/p 5:28:35 } +2024-07-25 19:40:20,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1249/ 1625], loss: 1.202, per_step_time: 1474ms, lr: 2.9482066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:20,558 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42407 samples/s/p 5:28:48 } +2024-07-25 19:40:23,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1251/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 2.9480416e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:23,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.43331 samples/s/p 5:28:11 } +2024-07-25 19:40:26,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1253/ 1625], loss: 1.152, per_step_time: 1474ms, lr: 2.9478762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:26,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42618 samples/s/p 5:28:34 } +2024-07-25 19:40:29,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1255/ 1625], loss: 1.260, per_step_time: 1475ms, lr: 2.9477103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:29,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42339 samples/s/p 5:28:41 } +2024-07-25 19:40:32,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1257/ 1625], loss: 1.254, per_step_time: 1473ms, lr: 2.9475446e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:32,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.42765 samples/s/p 5:28:23 } +2024-07-25 19:40:35,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1259/ 1625], loss: 1.303, per_step_time: 1471ms, lr: 2.9473786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:35,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.7% |████████ | 5.43574 samples/s/p 5:27:51 } +2024-07-25 19:40:38,283 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 2/ 10], step:[ 1261/ 1625], loss: 1.050, per_step_time: 1473ms, lr: 2.947212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:38,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43030 samples/s/p 5:28:08 } +2024-07-25 19:40:41,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1263/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 2.9470451e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:41,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43658 samples/s/p 5:27:42 } +2024-07-25 19:40:44,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1265/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 2.9468785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:44,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43660 samples/s/p 5:27:39 } +2024-07-25 19:40:47,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1267/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.9467114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:47,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43425 samples/s/p 5:27:44 } +2024-07-25 19:40:50,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1269/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.9465436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:50,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43155 samples/s/p 5:27:51 } +2024-07-25 19:40:53,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1271/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.9463761e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:53,041 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43149 samples/s/p 5:27:49 } +2024-07-25 19:40:55,991 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1273/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.9462082e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:55,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.43687 samples/s/p 5:27:26 } +2024-07-25 19:40:58,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1275/ 1625], loss: 1.209, per_step_time: 1475ms, lr: 2.94604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:40:58,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.8% |████████ | 5.42354 samples/s/p 5:28:11 } +2024-07-25 19:41:01,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1277/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 2.9458712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:01,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43944 samples/s/p 5:27:11 } +2024-07-25 19:41:04,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1279/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.9457025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:04,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43139 samples/s/p 5:27:37 } +2024-07-25 19:41:07,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1281/ 1625], loss: 1.315, per_step_time: 1474ms, lr: 2.9455336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:07,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.42595 samples/s/p 5:27:54 } +2024-07-25 19:41:10,760 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 2/ 10], step:[ 1283/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 2.9453642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:10,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43166 samples/s/p 5:27:30 } +2024-07-25 19:41:13,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1285/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 2.9451949e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:13,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43973 samples/s/p 5:26:58 } +2024-07-25 19:41:16,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1287/ 1625], loss: 1.305, per_step_time: 1470ms, lr: 2.945025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:16,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43935 samples/s/p 5:26:57 } +2024-07-25 19:41:19,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1289/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 2.944855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:19,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.43122 samples/s/p 5:27:23 } +2024-07-25 19:41:22,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1291/ 1625], loss: 1.329, per_step_time: 1470ms, lr: 2.9446848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:22,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 17.9% |████████ | 5.44098 samples/s/p 5:26:45 } +2024-07-25 19:41:25,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1293/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 2.9445142e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:25,511 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.43138 samples/s/p 5:27:16 } +2024-07-25 19:41:28,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1295/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 2.9443434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:28,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.43349 samples/s/p 5:27:06 } +2024-07-25 19:41:31,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1297/ 1625], loss: 1.246, per_step_time: 1473ms, lr: 2.9441722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:31,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.42872 samples/s/p 5:27:20 } +2024-07-25 19:41:34,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1299/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 2.9440009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:34,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |████████ | 5.43354 samples/s/p 5:27:00 } +2024-07-25 19:41:37,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1301/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 2.9438293e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:37,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.43778 samples/s/p 5:26:42 } +2024-07-25 19:41:40,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1303/ 1625], loss: 1.264, per_step_time: 1474ms, lr: 2.9436576e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:40,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.42738 samples/s/p 5:27:16 } +2024-07-25 19:41:43,222 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1305/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.9434856e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:43,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.43718 samples/s/p 5:26:38 } +2024-07-25 19:41:46,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1307/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 2.943313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:46,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.0% |█████████ | 5.43572 samples/s/p 5:26:40 } +2024-07-25 19:41:49,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1309/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 2.9431405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:49,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.44116 samples/s/p 5:26:18 } +2024-07-25 19:41:52,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1311/ 1625], loss: 1.217, per_step_time: 1469ms, lr: 2.9429677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:52,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.44380 samples/s/p 5:26:05 } +2024-07-25 19:41:55,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1313/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 2.9427943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:41:55,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43486 samples/s/p 5:26:34 } +2024-07-25 19:41:57,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1315/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.9426212e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:41:57,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43483 samples/s/p 5:26:32 } +2024-07-25 19:42:00,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1317/ 1625], loss: 1.212, per_step_time: 1472ms, lr: 2.9424475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:00,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43127 samples/s/p 5:26:42 } +2024-07-25 19:42:03,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1319/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.9422736e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:03,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43838 samples/s/p 5:26:13 } +2024-07-25 19:42:06,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1321/ 1625], loss: 1.306, per_step_time: 1472ms, lr: 2.9420993e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:06,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43365 samples/s/p 5:26:27 } +2024-07-25 19:42:09,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1323/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 2.941925e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:09,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.1% |█████████ | 5.43045 samples/s/p 5:26:36 } +2024-07-25 19:42:12,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1325/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 2.9417504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:12,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43527 samples/s/p 5:26:15 } +2024-07-25 19:42:15,682 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1327/ 1625], loss: 1.301, per_step_time: 1473ms, lr: 2.9415754e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:15,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43085 samples/s/p 5:26:28 } +2024-07-25 19:42:18,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1329/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 2.9414003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:18,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43637 samples/s/p 5:26:06 } +2024-07-25 19:42:21,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1331/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 2.941225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:21,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43651 samples/s/p 5:26:02 } +2024-07-25 19:42:24,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1333/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.941049e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:24,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43159 samples/s/p 5:26:17 } +2024-07-25 19:42:27,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1335/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.9408731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:27,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43182 samples/s/p 5:26:13 } +2024-07-25 19:42:30,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1337/ 1625], loss: 1.186, per_step_time: 1480ms, lr: 2.940697e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:42:30,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.40244 samples/s/p 5:27:57 } +2024-07-25 19:42:33,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1339/ 1625], loss: 1.294, per_step_time: 1471ms, lr: 2.9405206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:33,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.2% |█████████ | 5.43489 samples/s/p 5:25:56 } +2024-07-25 19:42:36,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1341/ 1625], loss: 1.054, per_step_time: 1472ms, lr: 2.9403436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:36,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.43457 samples/s/p 5:25:54 } +2024-07-25 19:42:39,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1343/ 1625], loss: 1.110, per_step_time: 1474ms, lr: 2.9401668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:39,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.42640 samples/s/p 5:26:21 } +2024-07-25 19:42:42,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1345/ 1625], loss: 1.262, per_step_time: 1473ms, lr: 2.9399896e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:42,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.43015 samples/s/p 5:26:04 } +2024-07-25 19:42:45,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1347/ 1625], loss: 1.154, per_step_time: 1477ms, lr: 2.939812e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:45,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.41581 samples/s/p 5:26:53 } +2024-07-25 19:42:48,182 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1349/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 2.9396344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:48,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.43308 samples/s/p 5:25:48 } +2024-07-25 19:42:51,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1351/ 1625], loss: 1.387, per_step_time: 1474ms, lr: 2.9394563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:51,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.42579 samples/s/p 5:26:11 } +2024-07-25 19:42:54,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1353/ 1625], loss: 1.204, per_step_time: 1474ms, lr: 2.939278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:54,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.42634 samples/s/p 5:26:06 } +2024-07-25 19:42:57,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1355/ 1625], loss: 1.093, per_step_time: 1473ms, lr: 2.9390996e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:57,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.3% |█████████ | 5.43049 samples/s/p 5:25:48 } +2024-07-25 19:42:59,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1357/ 1625], loss: 1.159, per_step_time: 1469ms, lr: 2.9389208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:42:59,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.44260 samples/s/p 5:25:02 } +2024-07-25 19:43:02,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1359/ 1625], loss: 1.142, per_step_time: 1473ms, lr: 2.9387418e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:43:02,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.42864 samples/s/p 5:25:49 } +2024-07-25 19:43:05,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1361/ 1625], loss: 1.349, per_step_time: 1472ms, lr: 2.9385625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:05,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43279 samples/s/p 5:25:31 } +2024-07-25 19:43:08,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1363/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 2.938383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:08,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43390 samples/s/p 5:25:24 } +2024-07-25 19:43:11,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1365/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 2.938203e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:11,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43654 samples/s/p 5:25:12 } +2024-07-25 19:43:14,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1367/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.9380231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:14,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.42901 samples/s/p 5:25:36 } +2024-07-25 19:43:17,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1369/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 2.9378429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:17,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43360 samples/s/p 5:25:17 } +2024-07-25 19:43:20,663 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1371/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 2.9376622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:20,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43077 samples/s/p 5:25:24 } +2024-07-25 19:43:23,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1373/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 2.9374814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:23,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.4% |█████████ | 5.43347 samples/s/p 5:25:11 } +2024-07-25 19:43:26,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1375/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 2.9373005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:26,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43502 samples/s/p 5:25:03 } +2024-07-25 19:43:29,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1377/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.937119e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:29,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43218 samples/s/p 5:25:10 } +2024-07-25 19:43:32,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1379/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 2.9369374e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:32,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43272 samples/s/p 5:25:05 } +2024-07-25 19:43:35,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1381/ 1625], loss: 1.282, per_step_time: 1473ms, lr: 2.9367557e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:43:35,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.42792 samples/s/p 5:25:19 } +2024-07-25 19:43:38,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1383/ 1625], loss: 1.317, per_step_time: 1473ms, lr: 2.9365734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:38,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.42795 samples/s/p 5:25:16 } +2024-07-25 19:43:41,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1385/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 2.9363911e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:41,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43710 samples/s/p 5:24:40 } +2024-07-25 19:43:44,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1387/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.9362083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:44,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43146 samples/s/p 5:24:58 } +2024-07-25 19:43:47,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1389/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.9360255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:47,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.5% |█████████ | 5.43622 samples/s/p 5:24:38 } +2024-07-25 19:43:50,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1391/ 1625], loss: 1.398, per_step_time: 1473ms, lr: 2.9358425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:50,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.43100 samples/s/p 5:24:54 } +2024-07-25 19:43:53,149 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1393/ 1625], loss: 1.107, per_step_time: 1477ms, lr: 2.9356592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:53,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.41438 samples/s/p 5:25:50 } +2024-07-25 19:43:56,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1395/ 1625], loss: 1.090, per_step_time: 1473ms, lr: 2.9354755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:56,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.42898 samples/s/p 5:24:55 } +2024-07-25 19:43:59,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1397/ 1625], loss: 1.022, per_step_time: 1473ms, lr: 2.9352916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:43:59,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.43010 samples/s/p 5:24:48 } +2024-07-25 19:44:02,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1399/ 1625], loss: 1.191, per_step_time: 1477ms, lr: 2.9351077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:02,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.41612 samples/s/p 5:25:35 } +2024-07-25 19:44:04,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1401/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 2.934923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:04,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.43527 samples/s/p 5:24:23 } +2024-07-25 19:44:07,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1403/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.9347384e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:44:07,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.43610 samples/s/p 5:24:18 } +2024-07-25 19:44:10,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1405/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 2.9345534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:10,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.6% |█████████ | 5.42915 samples/s/p 5:24:40 } +2024-07-25 19:44:13,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1407/ 1625], loss: 1.194, per_step_time: 1474ms, lr: 2.9343682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:13,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.42680 samples/s/p 5:24:45 } +2024-07-25 19:44:16,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1409/ 1625], loss: 1.185, per_step_time: 1469ms, lr: 2.9341829e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:16,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.44364 samples/s/p 5:23:42 } +2024-07-25 19:44:19,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1411/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.9339972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:19,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.43310 samples/s/p 5:24:17 } +2024-07-25 19:44:22,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1413/ 1625], loss: 1.118, per_step_time: 1475ms, lr: 2.9338113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:22,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.42373 samples/s/p 5:24:47 } +2024-07-25 19:44:25,642 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1415/ 1625], loss: 1.077, per_step_time: 1474ms, lr: 2.9336252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:25,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.42564 samples/s/p 5:24:37 } +2024-07-25 19:44:28,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1417/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 2.9334386e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:28,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.43318 samples/s/p 5:24:07 } +2024-07-25 19:44:31,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1419/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.933252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:31,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.42961 samples/s/p 5:24:17 } +2024-07-25 19:44:34,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1421/ 1625], loss: 1.141, per_step_time: 1474ms, lr: 2.9330648e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:34,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.7% |█████████ | 5.42686 samples/s/p 5:24:24 } +2024-07-25 19:44:37,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1423/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.9328778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:37,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43284 samples/s/p 5:24:00 } +2024-07-25 19:44:40,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1425/ 1625], loss: 1.198, per_step_time: 1473ms, lr: 2.9326904e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:44:40,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43013 samples/s/p 5:24:07 } +2024-07-25 19:44:43,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1427/ 1625], loss: 0.987, per_step_time: 1471ms, lr: 2.9325025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:43,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43566 samples/s/p 5:23:44 } +2024-07-25 19:44:46,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1429/ 1625], loss: 1.048, per_step_time: 1474ms, lr: 2.9323146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:46,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.42451 samples/s/p 5:24:21 } +2024-07-25 19:44:49,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1431/ 1625], loss: 1.013, per_step_time: 1471ms, lr: 2.9321263e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:49,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43692 samples/s/p 5:23:33 } +2024-07-25 19:44:52,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1433/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 2.9319379e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:52,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43634 samples/s/p 5:23:33 } +2024-07-25 19:44:55,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1435/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.931749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:55,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43783 samples/s/p 5:23:24 } +2024-07-25 19:44:58,117 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1437/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 2.9315599e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:44:58,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.8% |█████████ | 5.43579 samples/s/p 5:23:29 } +2024-07-25 19:45:01,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1439/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.931371e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:01,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43635 samples/s/p 5:23:24 } +2024-07-25 19:45:04,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1441/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 2.9311814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:04,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43053 samples/s/p 5:23:42 } +2024-07-25 19:45:06,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1443/ 1625], loss: 1.247, per_step_time: 1475ms, lr: 2.9309916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:06,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.42015 samples/s/p 5:24:16 } +2024-07-25 19:45:09,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1445/ 1625], loss: 1.239, per_step_time: 1472ms, lr: 2.9308016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:09,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43383 samples/s/p 5:23:24 } +2024-07-25 19:45:12,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1447/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 2.9306113e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:45:12,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43495 samples/s/p 5:23:17 } +2024-07-25 19:45:15,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1449/ 1625], loss: 1.284, per_step_time: 1471ms, lr: 2.9304209e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:15,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43511 samples/s/p 5:23:13 } +2024-07-25 19:45:18,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1451/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.93023e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:18,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43615 samples/s/p 5:23:07 } +2024-07-25 19:45:21,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1453/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.930039e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:21,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 18.9% |█████████ | 5.43193 samples/s/p 5:23:19 } +2024-07-25 19:45:24,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1455/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 2.9298477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:24,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.43434 samples/s/p 5:23:07 } +2024-07-25 19:45:27,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1457/ 1625], loss: 1.217, per_step_time: 1474ms, lr: 2.9296561e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:27,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.42381 samples/s/p 5:23:42 } +2024-07-25 19:45:30,595 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1459/ 1625], loss: 1.265, per_step_time: 1470ms, lr: 2.9294642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:30,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.43975 samples/s/p 5:22:42 } +2024-07-25 19:45:33,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1461/ 1625], loss: 1.182, per_step_time: 1474ms, lr: 2.9292723e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:33,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.42609 samples/s/p 5:23:28 } +2024-07-25 19:45:36,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1463/ 1625], loss: 1.388, per_step_time: 1475ms, lr: 2.9290799e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:36,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.42222 samples/s/p 5:23:39 } +2024-07-25 19:45:39,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1465/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 2.9288873e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:39,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.43101 samples/s/p 5:23:04 } +2024-07-25 19:45:42,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1467/ 1625], loss: 1.293, per_step_time: 1471ms, lr: 2.9286944e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:42,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.43682 samples/s/p 5:22:41 } +2024-07-25 19:45:45,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1469/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.9285015e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:45:45,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.0% |█████████ | 5.43376 samples/s/p 5:22:49 } +2024-07-25 19:45:48,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1471/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 2.9283083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:48,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43428 samples/s/p 5:22:44 } +2024-07-25 19:45:51,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1473/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 2.9281146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:51,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43879 samples/s/p 5:22:25 } +2024-07-25 19:45:54,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1475/ 1625], loss: 1.410, per_step_time: 1472ms, lr: 2.9279207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:54,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43388 samples/s/p 5:22:40 } +2024-07-25 19:45:57,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1477/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 2.9277267e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:45:57,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43192 samples/s/p 5:22:44 } +2024-07-25 19:46:00,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1479/ 1625], loss: 1.365, per_step_time: 1473ms, lr: 2.9275321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:00,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43000 samples/s/p 5:22:47 } +2024-07-25 19:46:03,074 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1481/ 1625], loss: 1.300, per_step_time: 1472ms, lr: 2.9273377e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:03,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43247 samples/s/p 5:22:36 } +2024-07-25 19:46:06,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1483/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 2.9271429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:06,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43751 samples/s/p 5:22:15 } +2024-07-25 19:46:08,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1485/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.9269479e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:08,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.1% |█████████ | 5.43199 samples/s/p 5:22:32 } +2024-07-25 19:46:11,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1487/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 2.9267525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:11,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43721 samples/s/p 5:22:10 } +2024-07-25 19:46:14,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1489/ 1625], loss: 1.286, per_step_time: 1473ms, lr: 2.9265568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:14,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.42886 samples/s/p 5:22:37 } +2024-07-25 19:46:17,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1491/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 2.9263609e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:46:17,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43333 samples/s/p 5:22:18 } +2024-07-25 19:46:20,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1493/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 2.926165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:20,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43330 samples/s/p 5:22:15 } +2024-07-25 19:46:23,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1495/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 2.9259685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:23,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.42765 samples/s/p 5:22:32 } +2024-07-25 19:46:26,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1497/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.9257719e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:26,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.42949 samples/s/p 5:22:23 } +2024-07-25 19:46:29,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1499/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 2.9255749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:29,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43112 samples/s/p 5:22:14 } +2024-07-25 19:46:32,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1501/ 1625], loss: 1.293, per_step_time: 1472ms, lr: 2.9253777e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:32,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43446 samples/s/p 5:21:59 } +2024-07-25 19:46:35,548 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1503/ 1625], loss: 1.238, per_step_time: 1470ms, lr: 2.9251803e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:35,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.2% |█████████ | 5.43854 samples/s/p 5:21:42 } +2024-07-25 19:46:38,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1505/ 1625], loss: 1.197, per_step_time: 1475ms, lr: 2.9249826e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:38,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.42326 samples/s/p 5:22:33 } +2024-07-25 19:46:41,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1507/ 1625], loss: 0.925, per_step_time: 1474ms, lr: 2.9247849e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:41,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.42542 samples/s/p 5:22:23 } +2024-07-25 19:46:44,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1509/ 1625], loss: 1.270, per_step_time: 1470ms, lr: 2.9245868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:44,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.43960 samples/s/p 5:21:29 } +2024-07-25 19:46:47,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1511/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 2.9243884e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:47,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.42985 samples/s/p 5:22:01 } +2024-07-25 19:46:50,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1513/ 1625], loss: 1.069, per_step_time: 1473ms, lr: 2.9241895e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:46:50,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.42899 samples/s/p 5:22:01 } +2024-07-25 19:46:53,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1515/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 2.9239907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:53,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.43231 samples/s/p 5:21:46 } +2024-07-25 19:46:56,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1517/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 2.9237914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:56,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.43656 samples/s/p 5:21:28 } +2024-07-25 19:46:59,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1519/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 2.923592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:46:59,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.3% |█████████ | 5.43204 samples/s/p 5:21:41 } +2024-07-25 19:47:02,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1521/ 1625], loss: 1.269, per_step_time: 1471ms, lr: 2.9233923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:02,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43501 samples/s/p 5:21:28 } +2024-07-25 19:47:05,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1523/ 1625], loss: 1.392, per_step_time: 1471ms, lr: 2.9231926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:05,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43622 samples/s/p 5:21:21 } +2024-07-25 19:47:08,027 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1525/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.9229921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:08,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43255 samples/s/p 5:21:31 } +2024-07-25 19:47:10,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1527/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.9227918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:10,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43666 samples/s/p 5:21:13 } +2024-07-25 19:47:13,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1529/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 2.922591e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:13,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43559 samples/s/p 5:21:14 } +2024-07-25 19:47:16,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1531/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 2.92239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:16,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43628 samples/s/p 5:21:09 } +2024-07-25 19:47:19,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1533/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 2.922189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:19,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.43063 samples/s/p 5:21:26 } +2024-07-25 19:47:22,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1535/ 1625], loss: 1.117, per_step_time: 1473ms, lr: 2.9219877e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:47:22,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.4% |█████████ | 5.42846 samples/s/p 5:21:30 } +2024-07-25 19:47:25,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1537/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 2.9217857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:25,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.43171 samples/s/p 5:21:16 } +2024-07-25 19:47:28,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1539/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 2.9215838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:28,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.43530 samples/s/p 5:21:00 } +2024-07-25 19:47:31,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1541/ 1625], loss: 1.073, per_step_time: 1472ms, lr: 2.9213817e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:31,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.43174 samples/s/p 5:21:10 } +2024-07-25 19:47:34,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1543/ 1625], loss: 1.185, per_step_time: 1473ms, lr: 2.9211793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:34,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.42981 samples/s/p 5:21:14 } +2024-07-25 19:47:37,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1545/ 1625], loss: 1.310, per_step_time: 1472ms, lr: 2.9209765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:37,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.43340 samples/s/p 5:20:58 } +2024-07-25 19:47:40,504 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1547/ 1625], loss: 1.248, per_step_time: 1474ms, lr: 2.9207737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:40,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.42714 samples/s/p 5:21:17 } +2024-07-25 19:47:43,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1549/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 2.9205703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:43,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.43110 samples/s/p 5:21:00 } +2024-07-25 19:47:46,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1551/ 1625], loss: 1.156, per_step_time: 1474ms, lr: 2.9203668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:46,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.5% |█████████ | 5.42548 samples/s/p 5:21:17 } +2024-07-25 19:47:49,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1553/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 2.920163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:49,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.42831 samples/s/p 5:21:04 } +2024-07-25 19:47:52,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1555/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 2.9199591e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:52,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43020 samples/s/p 5:20:55 } +2024-07-25 19:47:55,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1557/ 1625], loss: 1.030, per_step_time: 1473ms, lr: 2.9197548e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:47:55,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43097 samples/s/p 5:20:49 } +2024-07-25 19:47:58,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1559/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 2.9195504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:47:58,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43200 samples/s/p 5:20:42 } +2024-07-25 19:48:01,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1561/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 2.9193456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:01,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43431 samples/s/p 5:20:31 } +2024-07-25 19:48:04,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1563/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 2.9191406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:04,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43656 samples/s/p 5:20:20 } +2024-07-25 19:48:07,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1565/ 1625], loss: 1.333, per_step_time: 1486ms, lr: 2.9189354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:07,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.38292 samples/s/p 5:23:29 } +2024-07-25 19:48:10,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1567/ 1625], loss: 1.139, per_step_time: 1470ms, lr: 2.9187298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:10,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.6% |█████████ | 5.43981 samples/s/p 5:20:03 } +2024-07-25 19:48:13,005 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1569/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 2.9185241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:13,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43953 samples/s/p 5:20:01 } +2024-07-25 19:48:15,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1571/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.9183184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:15,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43225 samples/s/p 5:20:24 } +2024-07-25 19:48:18,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1573/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 2.918112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:18,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43852 samples/s/p 5:19:59 } +2024-07-25 19:48:21,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1575/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 2.9179055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:21,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43399 samples/s/p 5:20:12 } +2024-07-25 19:48:24,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1577/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.9176985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:24,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43148 samples/s/p 5:20:18 } +2024-07-25 19:48:27,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1579/ 1625], loss: 1.100, per_step_time: 1478ms, lr: 2.9174918e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:48:27,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.41150 samples/s/p 5:21:26 } +2024-07-25 19:48:30,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1581/ 1625], loss: 1.237, per_step_time: 1475ms, lr: 2.9172843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:30,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.42280 samples/s/p 5:20:43 } +2024-07-25 19:48:33,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1583/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 2.917077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:33,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.7% |█████████ | 5.43359 samples/s/p 5:20:02 } +2024-07-25 19:48:36,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1585/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 2.9168692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:36,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.42839 samples/s/p 5:20:17 } +2024-07-25 19:48:39,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1587/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 2.9166611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:39,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43834 samples/s/p 5:19:39 } +2024-07-25 19:48:42,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1589/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 2.916453e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:42,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43314 samples/s/p 5:19:54 } +2024-07-25 19:48:45,493 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1591/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 2.9162444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:45,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43436 samples/s/p 5:19:47 } +2024-07-25 19:48:48,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1593/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 2.9160356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:48,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43402 samples/s/p 5:19:45 } +2024-07-25 19:48:51,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1595/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 2.9158266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:51,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.44112 samples/s/p 5:19:17 } +2024-07-25 19:48:54,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1597/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 2.915617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:54,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43436 samples/s/p 5:19:38 } +2024-07-25 19:48:57,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1599/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 2.9154075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:48:57,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.8% |█████████ | 5.43626 samples/s/p 5:19:29 } +2024-07-25 19:49:00,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1601/ 1625], loss: 1.158, per_step_time: 1474ms, lr: 2.9151977e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:49:00,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.42402 samples/s/p 5:20:09 } +2024-07-25 19:49:03,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1603/ 1625], loss: 1.130, per_step_time: 1473ms, lr: 2.9149878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:03,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43052 samples/s/p 5:19:43 } +2024-07-25 19:49:06,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1605/ 1625], loss: 1.285, per_step_time: 1472ms, lr: 2.9147775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:06,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43180 samples/s/p 5:19:35 } +2024-07-25 19:49:09,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1607/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 2.9145669e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:09,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43546 samples/s/p 5:19:20 } +2024-07-25 19:49:12,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1609/ 1625], loss: 1.233, per_step_time: 1474ms, lr: 2.914356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:12,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.42618 samples/s/p 5:19:49 } +2024-07-25 19:49:15,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1611/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 2.914145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:15,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43495 samples/s/p 5:19:16 } +2024-07-25 19:49:17,970 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1613/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 2.9139337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:17,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43099 samples/s/p 5:19:27 } +2024-07-25 19:49:20,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1615/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 2.9137222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:20,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 19.9% |█████████ | 5.43643 samples/s/p 5:19:04 } +2024-07-25 19:49:23,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1617/ 1625], loss: 1.109, per_step_time: 1469ms, lr: 2.9135103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:23,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.44226 samples/s/p 5:18:41 } +2024-07-25 19:49:26,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1619/ 1625], loss: 1.271, per_step_time: 1473ms, lr: 2.9132983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:26,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.42916 samples/s/p 5:19:24 } +2024-07-25 19:49:29,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1621/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 2.913086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:29,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.43943 samples/s/p 5:18:45 } +2024-07-25 19:49:32,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1623/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.9128734e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:49:32,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |█████████ | 5.43421 samples/s/p 5:19:00 } +2024-07-25 19:49:35,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 2/ 10], step:[ 1625/ 1625], loss: 1.216, per_step_time: 1474ms, lr: 2.9126608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:35,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.42627 samples/s/p 5:19:26 } +2024-07-25 19:49:38,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 2/ 1625], loss: 1.136, per_step_time: 1475ms, lr: 2.9124476e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:38,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.42119 samples/s/p 5:19:41 } +2024-07-25 19:49:41,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 4/ 1625], loss: 1.202, per_step_time: 1472ms, lr: 2.9122342e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:41,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.43156 samples/s/p 5:19:01 } +2024-07-25 19:49:44,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 6/ 1625], loss: 1.088, per_step_time: 1473ms, lr: 2.9120209e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:44,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.42870 samples/s/p 5:19:08 } +2024-07-25 19:49:47,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 8/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 2.911807e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:47,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.0% |██████████ | 5.43172 samples/s/p 5:18:55 } +2024-07-25 19:49:50,451 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 10/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 2.911593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:50,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.42975 samples/s/p 5:18:59 } +2024-07-25 19:49:53,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 12/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.9113786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:53,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43366 samples/s/p 5:18:42 } +2024-07-25 19:49:56,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 14/ 1625], loss: 1.333, per_step_time: 1471ms, lr: 2.911164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:56,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43841 samples/s/p 5:18:22 } +2024-07-25 19:49:59,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 16/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 2.9109493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:49:59,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.42945 samples/s/p 5:18:51 } +2024-07-25 19:50:02,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 18/ 1625], loss: 1.293, per_step_time: 1471ms, lr: 2.9107341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:02,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43813 samples/s/p 5:18:17 } +2024-07-25 19:50:05,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 20/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 2.910519e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:50:05,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43381 samples/s/p 5:18:29 } +2024-07-25 19:50:08,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 22/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.9103032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:08,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.42780 samples/s/p 5:18:48 } +2024-07-25 19:50:11,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 24/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 2.9100875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:11,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.1% |██████████ | 5.43455 samples/s/p 5:18:21 } +2024-07-25 19:50:14,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 26/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 2.9098714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:14,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43326 samples/s/p 5:18:23 } +2024-07-25 19:50:17,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 28/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.9096549e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:17,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43806 samples/s/p 5:18:03 } +2024-07-25 19:50:19,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 30/ 1625], loss: 1.035, per_step_time: 1472ms, lr: 2.9094384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:19,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43316 samples/s/p 5:18:17 } +2024-07-25 19:50:22,925 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 32/ 1625], loss: 1.245, per_step_time: 1474ms, lr: 2.9092214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:22,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.42400 samples/s/p 5:18:46 } +2024-07-25 19:50:25,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 34/ 1625], loss: 1.247, per_step_time: 1474ms, lr: 2.9090043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:25,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.42476 samples/s/p 5:18:41 } +2024-07-25 19:50:28,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 36/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 2.9087872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:28,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.44144 samples/s/p 5:17:39 } +2024-07-25 19:50:31,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 38/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 2.9085697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:31,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43366 samples/s/p 5:18:03 } +2024-07-25 19:50:34,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 40/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.9083518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:34,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.2% |██████████ | 5.43400 samples/s/p 5:17:59 } +2024-07-25 19:50:37,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 42/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 2.9081337e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:50:37,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43356 samples/s/p 5:17:58 } +2024-07-25 19:50:40,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 44/ 1625], loss: 1.047, per_step_time: 1472ms, lr: 2.9079154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:40,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43287 samples/s/p 5:17:57 } +2024-07-25 19:50:43,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 46/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 2.9076968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:43,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.44014 samples/s/p 5:17:29 } +2024-07-25 19:50:46,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 48/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.9074781e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:46,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43112 samples/s/p 5:17:58 } +2024-07-25 19:50:49,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 50/ 1625], loss: 1.345, per_step_time: 1469ms, lr: 2.907259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:49,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.44281 samples/s/p 5:17:14 } +2024-07-25 19:50:52,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 52/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 2.9070396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:52,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43076 samples/s/p 5:17:53 } +2024-07-25 19:50:55,388 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 54/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 2.9068198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:55,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43635 samples/s/p 5:17:31 } +2024-07-25 19:50:58,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 56/ 1625], loss: 1.067, per_step_time: 1473ms, lr: 2.9066001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:50:58,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.3% |██████████ | 5.43106 samples/s/p 5:17:46 } +2024-07-25 19:51:01,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 58/ 1625], loss: 1.227, per_step_time: 1474ms, lr: 2.9063798e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:01,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.42604 samples/s/p 5:18:01 } +2024-07-25 19:51:04,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 60/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 2.9061597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:04,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43295 samples/s/p 5:17:34 } +2024-07-25 19:51:07,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 62/ 1625], loss: 1.303, per_step_time: 1474ms, lr: 2.9059389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:07,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.42477 samples/s/p 5:17:59 } +2024-07-25 19:51:10,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 64/ 1625], loss: 1.251, per_step_time: 1473ms, lr: 2.9057182e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:51:10,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.42886 samples/s/p 5:17:42 } +2024-07-25 19:51:13,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 66/ 1625], loss: 1.296, per_step_time: 1473ms, lr: 2.905497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:13,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43054 samples/s/p 5:17:33 } +2024-07-25 19:51:16,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 68/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.9052757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:16,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43182 samples/s/p 5:17:26 } +2024-07-25 19:51:19,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 70/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.9050541e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:19,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43521 samples/s/p 5:17:11 } +2024-07-25 19:51:21,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 72/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 2.9048324e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:21,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.4% |██████████ | 5.43265 samples/s/p 5:17:17 } +2024-07-25 19:51:24,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 74/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 2.9046103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:24,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43139 samples/s/p 5:17:18 } +2024-07-25 19:51:27,874 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 76/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.9043878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:27,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43166 samples/s/p 5:17:15 } +2024-07-25 19:51:30,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 78/ 1625], loss: 1.312, per_step_time: 1471ms, lr: 2.9041654e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:30,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43493 samples/s/p 5:17:00 } +2024-07-25 19:51:33,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 80/ 1625], loss: 1.181, per_step_time: 1473ms, lr: 2.9039425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:33,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.42979 samples/s/p 5:17:15 } +2024-07-25 19:51:36,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 82/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 2.9037194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:36,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43326 samples/s/p 5:17:00 } +2024-07-25 19:51:39,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 84/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 2.903496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:39,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.42780 samples/s/p 5:17:16 } +2024-07-25 19:51:42,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 86/ 1625], loss: 1.120, per_step_time: 1475ms, lr: 2.9032724e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 19:51:42,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.42156 samples/s/p 5:17:35 } +2024-07-25 19:51:45,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 88/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 2.9030487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:45,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.5% |██████████ | 5.43844 samples/s/p 5:16:33 } +2024-07-25 19:51:48,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 90/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.9028244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:48,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43253 samples/s/p 5:16:51 } +2024-07-25 19:51:51,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 92/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 2.9026001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:51,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43687 samples/s/p 5:16:33 } +2024-07-25 19:51:54,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 94/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 2.9023757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:54,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43507 samples/s/p 5:16:36 } +2024-07-25 19:51:57,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 96/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 2.9021508e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:51:57,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43575 samples/s/p 5:16:31 } +2024-07-25 19:52:00,352 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 98/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 2.9019258e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:00,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43696 samples/s/p 5:16:24 } +2024-07-25 19:52:03,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 100/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 2.9017005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:03,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.42953 samples/s/p 5:16:47 } +2024-07-25 19:52:06,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 102/ 1625], loss: 1.056, per_step_time: 1471ms, lr: 2.9014749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:06,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43624 samples/s/p 5:16:20 } +2024-07-25 19:52:09,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 104/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 2.9012492e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:09,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.6% |██████████ | 5.43393 samples/s/p 5:16:25 } +2024-07-25 19:52:12,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 106/ 1625], loss: 1.025, per_step_time: 1472ms, lr: 2.901023e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:12,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.43371 samples/s/p 5:16:23 } +2024-07-25 19:52:15,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 108/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.9007966e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:52:15,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.43567 samples/s/p 5:16:13 } +2024-07-25 19:52:18,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 110/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 2.90057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:18,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.43568 samples/s/p 5:16:10 } +2024-07-25 19:52:21,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 112/ 1625], loss: 1.142, per_step_time: 1473ms, lr: 2.900343e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:21,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.42866 samples/s/p 5:16:32 } +2024-07-25 19:52:23,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 114/ 1625], loss: 1.314, per_step_time: 1473ms, lr: 2.900116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:23,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.42975 samples/s/p 5:16:25 } +2024-07-25 19:52:26,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 116/ 1625], loss: 1.367, per_step_time: 1470ms, lr: 2.8998888e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:26,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.44158 samples/s/p 5:15:41 } +2024-07-25 19:52:29,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 118/ 1625], loss: 1.239, per_step_time: 1472ms, lr: 2.899661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:29,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.43273 samples/s/p 5:16:09 } +2024-07-25 19:52:32,824 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 120/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 2.8994333e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:32,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.7% |██████████ | 5.42764 samples/s/p 5:16:24 } +2024-07-25 19:52:35,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 122/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 2.8992054e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:35,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43476 samples/s/p 5:15:56 } +2024-07-25 19:52:38,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 124/ 1625], loss: 1.321, per_step_time: 1471ms, lr: 2.898977e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:38,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43729 samples/s/p 5:15:44 } +2024-07-25 19:52:41,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 126/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.8987482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:41,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43207 samples/s/p 5:15:59 } +2024-07-25 19:52:44,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 128/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 2.8985194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:44,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43357 samples/s/p 5:15:51 } +2024-07-25 19:52:47,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 130/ 1625], loss: 1.372, per_step_time: 1473ms, lr: 2.8982906e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:52:47,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43002 samples/s/p 5:16:01 } +2024-07-25 19:52:50,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 132/ 1625], loss: 1.306, per_step_time: 1474ms, lr: 2.8980612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:50,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.42463 samples/s/p 5:16:17 } +2024-07-25 19:52:53,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 134/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 2.8978317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:53,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43037 samples/s/p 5:15:54 } +2024-07-25 19:52:56,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 136/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 2.8976017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:56,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.42968 samples/s/p 5:15:53 } +2024-07-25 19:52:59,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 138/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 2.8973716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:52:59,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.8% |██████████ | 5.43903 samples/s/p 5:15:18 } +2024-07-25 19:53:02,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 140/ 1625], loss: 1.080, per_step_time: 1473ms, lr: 2.8971413e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:02,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.42984 samples/s/p 5:15:47 } +2024-07-25 19:53:05,305 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 142/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 2.8969109e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:05,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43178 samples/s/p 5:15:37 } +2024-07-25 19:53:08,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 144/ 1625], loss: 1.292, per_step_time: 1473ms, lr: 2.89668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:08,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.42975 samples/s/p 5:15:41 } +2024-07-25 19:53:11,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 146/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.8964489e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:11,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43414 samples/s/p 5:15:23 } +2024-07-25 19:53:14,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 148/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 2.8962177e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:14,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43367 samples/s/p 5:15:22 } +2024-07-25 19:53:17,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 150/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.8959861e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:17,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.43153 samples/s/p 5:15:26 } +2024-07-25 19:53:20,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 152/ 1625], loss: 1.345, per_step_time: 1473ms, lr: 2.895754e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:53:20,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.42883 samples/s/p 5:15:33 } +2024-07-25 19:53:23,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 154/ 1625], loss: 1.245, per_step_time: 1475ms, lr: 2.895522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:23,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 20.9% |██████████ | 5.42174 samples/s/p 5:15:54 } +2024-07-25 19:53:25,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 156/ 1625], loss: 1.165, per_step_time: 1470ms, lr: 2.8952898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:25,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.44035 samples/s/p 5:14:47 } +2024-07-25 19:53:28,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 158/ 1625], loss: 1.305, per_step_time: 1473ms, lr: 2.8950573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:28,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.42876 samples/s/p 5:15:24 } +2024-07-25 19:53:31,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 160/ 1625], loss: 1.073, per_step_time: 1474ms, lr: 2.8948245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:31,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.42732 samples/s/p 5:15:26 } +2024-07-25 19:53:34,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 162/ 1625], loss: 1.076, per_step_time: 1470ms, lr: 2.8945915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:34,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43858 samples/s/p 5:14:44 } +2024-07-25 19:53:37,786 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 164/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 2.8943581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:37,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43186 samples/s/p 5:15:04 } +2024-07-25 19:53:40,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 166/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 2.8941244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:40,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43650 samples/s/p 5:14:45 } +2024-07-25 19:53:43,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 168/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 2.8938906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:43,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43676 samples/s/p 5:14:41 } +2024-07-25 19:53:46,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 170/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 2.8936567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:46,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.0% |██████████ | 5.43150 samples/s/p 5:14:57 } +2024-07-25 19:53:49,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 172/ 1625], loss: 1.230, per_step_time: 1475ms, lr: 2.8934224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:49,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.42311 samples/s/p 5:15:23 } +2024-07-25 19:53:52,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 174/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 2.893188e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:53:52,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43479 samples/s/p 5:14:39 } +2024-07-25 19:53:55,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 176/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.8929531e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:55,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43448 samples/s/p 5:14:37 } +2024-07-25 19:53:58,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 178/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 2.8927181e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:53:58,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43358 samples/s/p 5:14:38 } +2024-07-25 19:54:01,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 180/ 1625], loss: 1.014, per_step_time: 1473ms, lr: 2.892483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:01,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.42933 samples/s/p 5:14:49 } +2024-07-25 19:54:04,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 182/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.8922472e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:04,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43038 samples/s/p 5:14:43 } +2024-07-25 19:54:07,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 184/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.8920114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:07,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43282 samples/s/p 5:14:31 } +2024-07-25 19:54:10,265 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 186/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 2.8917755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:10,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.1% |██████████ | 5.43401 samples/s/p 5:14:24 } +2024-07-25 19:54:13,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 188/ 1625], loss: 0.979, per_step_time: 1471ms, lr: 2.8915392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:13,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43810 samples/s/p 5:14:07 } +2024-07-25 19:54:16,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 190/ 1625], loss: 1.189, per_step_time: 1470ms, lr: 2.8913028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:16,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.44200 samples/s/p 5:13:51 } +2024-07-25 19:54:19,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 192/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 2.891066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:19,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43188 samples/s/p 5:14:23 } +2024-07-25 19:54:22,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 194/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 2.890829e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:22,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43662 samples/s/p 5:14:04 } +2024-07-25 19:54:25,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 196/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 2.8905917e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:54:25,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43956 samples/s/p 5:13:50 } +2024-07-25 19:54:27,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 198/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 2.8903542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:27,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43733 samples/s/p 5:13:55 } +2024-07-25 19:54:30,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 200/ 1625], loss: 0.977, per_step_time: 1472ms, lr: 2.8901162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:30,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43450 samples/s/p 5:14:02 } +2024-07-25 19:54:33,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 202/ 1625], loss: 0.911, per_step_time: 1472ms, lr: 2.8898783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:33,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.2% |██████████ | 5.43217 samples/s/p 5:14:07 } +2024-07-25 19:54:36,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 204/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.8896402e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.43197 samples/s/p 5:14:05 } +2024-07-25 19:54:39,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 206/ 1625], loss: 1.158, per_step_time: 1474ms, lr: 2.8894017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:39,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.42648 samples/s/p 5:14:21 } +2024-07-25 19:54:42,723 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 208/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 2.8891629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:42,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.44029 samples/s/p 5:13:30 } +2024-07-25 19:54:45,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 210/ 1625], loss: 1.123, per_step_time: 1474ms, lr: 2.8889239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:45,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.42629 samples/s/p 5:14:16 } +2024-07-25 19:54:48,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 212/ 1625], loss: 1.042, per_step_time: 1471ms, lr: 2.8886847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:48,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.43561 samples/s/p 5:13:41 } +2024-07-25 19:54:51,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 214/ 1625], loss: 1.218, per_step_time: 1474ms, lr: 2.8884451e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:51,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.42644 samples/s/p 5:14:09 } +2024-07-25 19:54:54,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 216/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 2.8882056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:54:54,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.43666 samples/s/p 5:13:31 } +2024-07-25 19:54:57,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 218/ 1625], loss: 1.330, per_step_time: 1472ms, lr: 2.8879656e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:54:57,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.3% |██████████ | 5.43341 samples/s/p 5:13:39 } +2024-07-25 19:55:00,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 220/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.8877253e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:00,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.43668 samples/s/p 5:13:25 } +2024-07-25 19:55:03,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 222/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.8874847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:03,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.43463 samples/s/p 5:13:29 } +2024-07-25 19:55:06,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 224/ 1625], loss: 1.312, per_step_time: 1474ms, lr: 2.8872442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:06,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.42654 samples/s/p 5:13:54 } +2024-07-25 19:55:09,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 226/ 1625], loss: 1.336, per_step_time: 1474ms, lr: 2.8870032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:09,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.42567 samples/s/p 5:13:54 } +2024-07-25 19:55:12,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 228/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 2.8867618e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:12,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.43407 samples/s/p 5:13:22 } +2024-07-25 19:55:15,206 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 230/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.8865205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:15,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.43227 samples/s/p 5:13:26 } +2024-07-25 19:55:18,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 232/ 1625], loss: 1.200, per_step_time: 1473ms, lr: 2.8862785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:18,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.42817 samples/s/p 5:13:37 } +2024-07-25 19:55:21,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 234/ 1625], loss: 1.167, per_step_time: 1474ms, lr: 2.8860366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:21,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.4% |██████████ | 5.42685 samples/s/p 5:13:39 } +2024-07-25 19:55:24,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 236/ 1625], loss: 1.114, per_step_time: 1475ms, lr: 2.8857945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:24,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.42354 samples/s/p 5:13:47 } +2024-07-25 19:55:27,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 238/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.8855518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:27,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43291 samples/s/p 5:13:12 } +2024-07-25 19:55:29,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 240/ 1625], loss: 1.296, per_step_time: 1472ms, lr: 2.8853092e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:55:29,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43221 samples/s/p 5:13:11 } +2024-07-25 19:55:32,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 242/ 1625], loss: 1.211, per_step_time: 1470ms, lr: 2.8850664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:32,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43867 samples/s/p 5:12:46 } +2024-07-25 19:55:35,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 244/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 2.8848232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:35,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43527 samples/s/p 5:12:55 } +2024-07-25 19:55:38,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 246/ 1625], loss: 0.916, per_step_time: 1470ms, lr: 2.8845798e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:38,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43921 samples/s/p 5:12:38 } +2024-07-25 19:55:41,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 248/ 1625], loss: 1.535, per_step_time: 1470ms, lr: 2.884336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:41,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43878 samples/s/p 5:12:37 } +2024-07-25 19:55:44,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 250/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 2.884092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:44,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.5% |██████████ | 5.43392 samples/s/p 5:12:50 } +2024-07-25 19:55:47,680 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 252/ 1625], loss: 1.169, per_step_time: 1472ms, lr: 2.883848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:47,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43447 samples/s/p 5:12:46 } +2024-07-25 19:55:50,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 254/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 2.8836035e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:50,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43716 samples/s/p 5:12:33 } +2024-07-25 19:55:53,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 256/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 2.8833589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:53,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43827 samples/s/p 5:12:27 } +2024-07-25 19:55:56,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 258/ 1625], loss: 1.371, per_step_time: 1472ms, lr: 2.883114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:56,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43351 samples/s/p 5:12:40 } +2024-07-25 19:55:59,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 260/ 1625], loss: 1.411, per_step_time: 1474ms, lr: 2.8828688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:55:59,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.42717 samples/s/p 5:12:59 } +2024-07-25 19:56:02,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 262/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 2.8826234e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:56:02,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43100 samples/s/p 5:12:43 } +2024-07-25 19:56:05,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 264/ 1625], loss: 1.197, per_step_time: 1474ms, lr: 2.8823779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:05,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.42670 samples/s/p 5:12:55 } +2024-07-25 19:56:08,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 266/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.8821318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:08,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.42944 samples/s/p 5:12:42 } +2024-07-25 19:56:11,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 268/ 1625], loss: 1.161, per_step_time: 1470ms, lr: 2.8818857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:11,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.6% |██████████ | 5.43974 samples/s/p 5:12:04 } +2024-07-25 19:56:14,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 270/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 2.8816394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:14,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43761 samples/s/p 5:12:08 } +2024-07-25 19:56:17,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 272/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 2.8813927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:17,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43447 samples/s/p 5:12:16 } +2024-07-25 19:56:20,150 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 274/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.8811459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:20,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43406 samples/s/p 5:12:15 } +2024-07-25 19:56:23,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 276/ 1625], loss: 1.230, per_step_time: 1474ms, lr: 2.8808987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:23,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.42539 samples/s/p 5:12:42 } +2024-07-25 19:56:26,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 278/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 2.8806513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:26,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.42807 samples/s/p 5:12:29 } +2024-07-25 19:56:29,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 280/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 2.8804037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:29,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43611 samples/s/p 5:11:59 } +2024-07-25 19:56:31,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 282/ 1625], loss: 1.205, per_step_time: 1473ms, lr: 2.8801558e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:31,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.42942 samples/s/p 5:12:19 } +2024-07-25 19:56:34,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 284/ 1625], loss: 1.280, per_step_time: 1471ms, lr: 2.8799077e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:56:34,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.7% |██████████ | 5.43753 samples/s/p 5:11:48 } +2024-07-25 19:56:37,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 286/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 2.8796594e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:37,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43682 samples/s/p 5:11:48 } +2024-07-25 19:56:40,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 288/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 2.8794107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:40,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43798 samples/s/p 5:11:41 } +2024-07-25 19:56:43,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 290/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 2.879162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:43,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43482 samples/s/p 5:11:48 } +2024-07-25 19:56:46,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 292/ 1625], loss: 0.990, per_step_time: 1471ms, lr: 2.8789127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:46,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43516 samples/s/p 5:11:44 } +2024-07-25 19:56:49,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 294/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 2.8786633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:49,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43645 samples/s/p 5:11:37 } +2024-07-25 19:56:52,619 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 296/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.8784138e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:52,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43521 samples/s/p 5:11:38 } +2024-07-25 19:56:55,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 298/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 2.8781642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:55,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43232 samples/s/p 5:11:45 } +2024-07-25 19:56:58,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 300/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 2.8779139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:56:58,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.8% |██████████ | 5.43892 samples/s/p 5:11:20 } +2024-07-25 19:57:01,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 302/ 1625], loss: 1.402, per_step_time: 1470ms, lr: 2.8776638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:01,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.43888 samples/s/p 5:11:17 } +2024-07-25 19:57:04,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 304/ 1625], loss: 1.081, per_step_time: 1473ms, lr: 2.8774133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:04,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.42777 samples/s/p 5:11:52 } +2024-07-25 19:57:07,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 306/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 2.8771623e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:57:07,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.43157 samples/s/p 5:11:36 } +2024-07-25 19:57:10,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 308/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.8769113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:10,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.43817 samples/s/p 5:11:10 } +2024-07-25 19:57:13,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 310/ 1625], loss: 1.234, per_step_time: 1473ms, lr: 2.87666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:13,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.42765 samples/s/p 5:11:44 } +2024-07-25 19:57:16,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 312/ 1625], loss: 1.311, per_step_time: 1473ms, lr: 2.8764085e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:16,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.43059 samples/s/p 5:11:31 } +2024-07-25 19:57:19,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 314/ 1625], loss: 1.183, per_step_time: 1474ms, lr: 2.8761566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:19,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.42396 samples/s/p 5:11:51 } +2024-07-25 19:57:22,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 316/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.8759046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:22,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 21.9% |██████████ | 5.43418 samples/s/p 5:11:12 } +2024-07-25 19:57:25,095 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 318/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 2.8756524e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:25,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.43293 samples/s/p 5:11:14 } +2024-07-25 19:57:28,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 320/ 1625], loss: 1.310, per_step_time: 1471ms, lr: 2.8753999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:28,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.43571 samples/s/p 5:11:01 } +2024-07-25 19:57:30,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 322/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 2.875147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:30,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.43196 samples/s/p 5:11:11 } +2024-07-25 19:57:33,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 324/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.8748942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:33,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |██████████ | 5.42765 samples/s/p 5:11:23 } +2024-07-25 19:57:36,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 326/ 1625], loss: 1.234, per_step_time: 1470ms, lr: 2.8746406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:36,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.43927 samples/s/p 5:10:40 } +2024-07-25 19:57:39,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 328/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 2.8743872e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 19:57:39,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.43268 samples/s/p 5:11:00 } +2024-07-25 19:57:42,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 330/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 2.8741335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:42,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.43241 samples/s/p 5:10:58 } +2024-07-25 19:57:45,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 332/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 2.8738794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:45,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.0% |███████████ | 5.43779 samples/s/p 5:10:36 } +2024-07-25 19:57:48,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 334/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.8736255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:48,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43383 samples/s/p 5:10:47 } +2024-07-25 19:57:51,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 336/ 1625], loss: 1.295, per_step_time: 1473ms, lr: 2.8733708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:51,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43062 samples/s/p 5:10:55 } +2024-07-25 19:57:54,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 338/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 2.8731161e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:54,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43225 samples/s/p 5:10:47 } +2024-07-25 19:57:57,566 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 340/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.8728611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:57:57,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43157 samples/s/p 5:10:46 } +2024-07-25 19:58:00,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 342/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.872606e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:00,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43705 samples/s/p 5:10:24 } +2024-07-25 19:58:03,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 344/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.8723503e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:03,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43020 samples/s/p 5:10:45 } +2024-07-25 19:58:06,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 346/ 1625], loss: 1.129, per_step_time: 1473ms, lr: 2.8720948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:06,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.43036 samples/s/p 5:10:41 } +2024-07-25 19:58:09,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 348/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 2.871839e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:09,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.1% |███████████ | 5.42995 samples/s/p 5:10:40 } +2024-07-25 19:58:12,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 350/ 1625], loss: 1.091, per_step_time: 1470ms, lr: 2.8715825e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:58:12,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.44026 samples/s/p 5:10:02 } +2024-07-25 19:58:15,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 352/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.8713264e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:15,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43190 samples/s/p 5:10:27 } +2024-07-25 19:58:18,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 354/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 2.8710696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:18,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43670 samples/s/p 5:10:08 } +2024-07-25 19:58:21,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 356/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 2.8708128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:21,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43213 samples/s/p 5:10:21 } +2024-07-25 19:58:24,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 358/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 2.8705555e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:24,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43308 samples/s/p 5:10:14 } +2024-07-25 19:58:27,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 360/ 1625], loss: 1.061, per_step_time: 1470ms, lr: 2.8702983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:27,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43942 samples/s/p 5:09:50 } +2024-07-25 19:58:30,030 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 362/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.8700404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:30,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43816 samples/s/p 5:09:51 } +2024-07-25 19:58:32,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 364/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 2.8697825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:32,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.2% |███████████ | 5.43982 samples/s/p 5:09:42 } +2024-07-25 19:58:35,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 366/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 2.8695245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:35,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43813 samples/s/p 5:09:45 } +2024-07-25 19:58:38,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 368/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.869266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:38,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43594 samples/s/p 5:09:50 } +2024-07-25 19:58:41,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 370/ 1625], loss: 1.045, per_step_time: 1473ms, lr: 2.8690074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:41,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.42827 samples/s/p 5:10:13 } +2024-07-25 19:58:44,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 372/ 1625], loss: 1.169, per_step_time: 1472ms, lr: 2.8687486e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:58:44,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43310 samples/s/p 5:09:54 } +2024-07-25 19:58:47,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 374/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.8684895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:47,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43742 samples/s/p 5:09:36 } +2024-07-25 19:58:50,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 376/ 1625], loss: 1.363, per_step_time: 1471ms, lr: 2.8682301e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:50,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43602 samples/s/p 5:09:38 } +2024-07-25 19:58:53,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 378/ 1625], loss: 1.099, per_step_time: 1475ms, lr: 2.8679706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:53,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.42208 samples/s/p 5:10:23 } +2024-07-25 19:58:56,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 380/ 1625], loss: 1.299, per_step_time: 1472ms, lr: 2.8677106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:56,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.3% |███████████ | 5.43236 samples/s/p 5:09:44 } +2024-07-25 19:58:59,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 382/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 2.8674505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:58:59,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43374 samples/s/p 5:09:37 } +2024-07-25 19:59:02,500 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 384/ 1625], loss: 1.025, per_step_time: 1473ms, lr: 2.8671904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:02,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43073 samples/s/p 5:09:44 } +2024-07-25 19:59:05,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 386/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.8669298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:05,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43328 samples/s/p 5:09:32 } +2024-07-25 19:59:08,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 388/ 1625], loss: 1.387, per_step_time: 1473ms, lr: 2.8666691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:08,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43020 samples/s/p 5:09:40 } +2024-07-25 19:59:11,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 390/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.866408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:11,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43390 samples/s/p 5:09:24 } +2024-07-25 19:59:14,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 392/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 2.8661465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:14,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.44099 samples/s/p 5:08:57 } +2024-07-25 19:59:17,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 394/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.865885e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:59:17,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43174 samples/s/p 5:09:26 } +2024-07-25 19:59:20,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 396/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.8656234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:20,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43507 samples/s/p 5:09:12 } +2024-07-25 19:59:23,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 398/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 2.8653612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:23,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.4% |███████████ | 5.43255 samples/s/p 5:09:17 } +2024-07-25 19:59:26,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 400/ 1625], loss: 1.107, per_step_time: 1473ms, lr: 2.865099e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:26,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.42967 samples/s/p 5:09:24 } +2024-07-25 19:59:29,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 402/ 1625], loss: 0.941, per_step_time: 1470ms, lr: 2.8648365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:29,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43991 samples/s/p 5:08:46 } +2024-07-25 19:59:32,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 404/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.8645738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:32,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43793 samples/s/p 5:08:50 } +2024-07-25 19:59:34,963 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 406/ 1625], loss: 0.998, per_step_time: 1472ms, lr: 2.8643106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:34,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43203 samples/s/p 5:09:07 } +2024-07-25 19:59:37,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 408/ 1625], loss: 1.095, per_step_time: 1474ms, lr: 2.8640474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:37,919 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.42657 samples/s/p 5:09:23 } +2024-07-25 19:59:40,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 410/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.863784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:40,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43442 samples/s/p 5:08:53 } +2024-07-25 19:59:43,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 412/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.8635202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:43,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43501 samples/s/p 5:08:48 } +2024-07-25 19:59:46,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 414/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 2.8632563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:46,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.5% |███████████ | 5.43088 samples/s/p 5:08:59 } +2024-07-25 19:59:49,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 416/ 1625], loss: 1.040, per_step_time: 1470ms, lr: 2.8629922e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 19:59:49,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43935 samples/s/p 5:08:28 } +2024-07-25 19:59:52,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 418/ 1625], loss: 1.035, per_step_time: 1472ms, lr: 2.8627277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:52,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43362 samples/s/p 5:08:44 } +2024-07-25 19:59:55,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 420/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 2.8624629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:55,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43798 samples/s/p 5:08:26 } +2024-07-25 19:59:58,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 422/ 1625], loss: 1.160, per_step_time: 1470ms, lr: 2.862198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 19:59:58,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.44009 samples/s/p 5:08:16 } +2024-07-25 20:00:01,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 424/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 2.8619328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:01,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.44152 samples/s/p 5:08:08 } +2024-07-25 20:00:04,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 426/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.8616674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:04,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43421 samples/s/p 5:08:30 } +2024-07-25 20:00:07,419 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 428/ 1625], loss: 1.231, per_step_time: 1470ms, lr: 2.8614015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:07,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.44107 samples/s/p 5:08:04 } +2024-07-25 20:00:10,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 430/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 2.8611357e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:10,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.6% |███████████ | 5.43415 samples/s/p 5:08:25 } +2024-07-25 20:00:13,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 432/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.8608694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:13,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43738 samples/s/p 5:08:11 } +2024-07-25 20:00:16,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 434/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 2.8606033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:16,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.44001 samples/s/p 5:07:59 } +2024-07-25 20:00:19,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 436/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.8603366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:19,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43366 samples/s/p 5:08:18 } +2024-07-25 20:00:22,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 438/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 2.8600698e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:00:22,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43160 samples/s/p 5:08:22 } +2024-07-25 20:00:25,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 440/ 1625], loss: 1.231, per_step_time: 1470ms, lr: 2.8598026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:25,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43921 samples/s/p 5:07:53 } +2024-07-25 20:00:28,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 442/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 2.8595354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:28,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43164 samples/s/p 5:08:16 } +2024-07-25 20:00:31,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 444/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 2.8592678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:31,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.43434 samples/s/p 5:08:03 } +2024-07-25 20:00:33,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 446/ 1625], loss: 1.317, per_step_time: 1473ms, lr: 2.8589999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:33,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.7% |███████████ | 5.42897 samples/s/p 5:08:19 } +2024-07-25 20:00:36,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 448/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.858732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:36,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.43410 samples/s/p 5:07:58 } +2024-07-25 20:00:39,883 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 450/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 2.8584634e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:39,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.43396 samples/s/p 5:07:56 } +2024-07-25 20:00:42,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 452/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 2.858195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:42,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.43027 samples/s/p 5:08:06 } +2024-07-25 20:00:45,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 454/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 2.8579261e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:45,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.43879 samples/s/p 5:07:34 } +2024-07-25 20:00:48,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 456/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 2.857657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:48,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.42888 samples/s/p 5:08:04 } +2024-07-25 20:00:51,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 458/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 2.8573877e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:51,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.42972 samples/s/p 5:07:59 } +2024-07-25 20:00:54,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 460/ 1625], loss: 1.174, per_step_time: 1473ms, lr: 2.8571181e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:00:54,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.42833 samples/s/p 5:08:00 } +2024-07-25 20:00:57,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 462/ 1625], loss: 1.415, per_step_time: 1471ms, lr: 2.8568486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:00:57,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.8% |███████████ | 5.43499 samples/s/p 5:07:35 } +2024-07-25 20:01:00,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 464/ 1625], loss: 1.383, per_step_time: 1473ms, lr: 2.8565784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:00,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.43002 samples/s/p 5:07:49 } +2024-07-25 20:01:03,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 466/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 2.8563083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:03,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.44076 samples/s/p 5:07:09 } +2024-07-25 20:01:06,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 468/ 1625], loss: 1.058, per_step_time: 1471ms, lr: 2.8560375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:06,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.43652 samples/s/p 5:07:21 } +2024-07-25 20:01:09,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 470/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 2.8557668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:09,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.42883 samples/s/p 5:07:44 } +2024-07-25 20:01:12,357 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 472/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 2.855496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:12,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.43198 samples/s/p 5:07:30 } +2024-07-25 20:01:15,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 474/ 1625], loss: 1.054, per_step_time: 1470ms, lr: 2.8552247e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:15,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.43857 samples/s/p 5:07:05 } +2024-07-25 20:01:18,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 476/ 1625], loss: 1.055, per_step_time: 1474ms, lr: 2.8549533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:18,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.42416 samples/s/p 5:07:51 } +2024-07-25 20:01:21,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 478/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.8546816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:21,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 22.9% |███████████ | 5.43272 samples/s/p 5:07:19 } +2024-07-25 20:01:24,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 480/ 1625], loss: 0.999, per_step_time: 1472ms, lr: 2.8544096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:24,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43450 samples/s/p 5:07:10 } +2024-07-25 20:01:27,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 482/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 2.8541375e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:01:27,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43418 samples/s/p 5:07:08 } +2024-07-25 20:01:30,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 484/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 2.853865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:30,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43664 samples/s/p 5:06:57 } +2024-07-25 20:01:33,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 486/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.8535924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:33,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43540 samples/s/p 5:06:58 } +2024-07-25 20:01:35,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 488/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.8533195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:35,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43535 samples/s/p 5:06:55 } +2024-07-25 20:01:38,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 490/ 1625], loss: 1.221, per_step_time: 1473ms, lr: 2.8530465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:38,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43010 samples/s/p 5:07:10 } +2024-07-25 20:01:41,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 492/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 2.8527731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:41,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43424 samples/s/p 5:06:53 } +2024-07-25 20:01:44,824 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 494/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 2.8524992e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:44,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.0% |███████████ | 5.43590 samples/s/p 5:06:45 } +2024-07-25 20:01:47,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 496/ 1625], loss: 1.042, per_step_time: 1472ms, lr: 2.8522254e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:47,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43362 samples/s/p 5:06:49 } +2024-07-25 20:01:50,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 498/ 1625], loss: 1.339, per_step_time: 1471ms, lr: 2.8519513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:50,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43668 samples/s/p 5:06:36 } +2024-07-25 20:01:53,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 500/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 2.8516772e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:53,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43705 samples/s/p 5:06:32 } +2024-07-25 20:01:56,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 502/ 1625], loss: 1.412, per_step_time: 1474ms, lr: 2.8514025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:01:56,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.42615 samples/s/p 5:07:06 } +2024-07-25 20:01:59,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 504/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 2.8511276e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:01:59,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43612 samples/s/p 5:06:29 } +2024-07-25 20:02:02,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 506/ 1625], loss: 1.091, per_step_time: 1473ms, lr: 2.8508526e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:02,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43106 samples/s/p 5:06:43 } +2024-07-25 20:02:05,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 508/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.8505772e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:05,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.44213 samples/s/p 5:06:03 } +2024-07-25 20:02:08,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 510/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.8503016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:08,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.1% |███████████ | 5.43192 samples/s/p 5:06:34 } +2024-07-25 20:02:11,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 512/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 2.8500259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:11,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43651 samples/s/p 5:06:16 } +2024-07-25 20:02:14,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 514/ 1625], loss: 1.138, per_step_time: 1473ms, lr: 2.8497498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:14,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.42774 samples/s/p 5:06:43 } +2024-07-25 20:02:17,289 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 516/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 2.8494736e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:17,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43740 samples/s/p 5:06:07 } +2024-07-25 20:02:20,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 518/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 2.849197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:20,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43111 samples/s/p 5:06:25 } +2024-07-25 20:02:23,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 520/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 2.8489203e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:23,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43668 samples/s/p 5:06:04 } +2024-07-25 20:02:26,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 522/ 1625], loss: 1.090, per_step_time: 1473ms, lr: 2.8486435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:26,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43012 samples/s/p 5:06:23 } +2024-07-25 20:02:29,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 524/ 1625], loss: 1.129, per_step_time: 1470ms, lr: 2.848366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:29,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.44004 samples/s/p 5:05:46 } +2024-07-25 20:02:32,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 526/ 1625], loss: 1.340, per_step_time: 1471ms, lr: 2.8480888e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:02:32,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43534 samples/s/p 5:05:59 } +2024-07-25 20:02:34,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 528/ 1625], loss: 1.487, per_step_time: 1470ms, lr: 2.8478109e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:34,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.2% |███████████ | 5.43965 samples/s/p 5:05:42 } +2024-07-25 20:02:37,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 530/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 2.8475331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:37,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43128 samples/s/p 5:06:07 } +2024-07-25 20:02:40,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 532/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 2.8472548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:40,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43955 samples/s/p 5:05:36 } +2024-07-25 20:02:43,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 534/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.8469765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:43,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43319 samples/s/p 5:05:55 } +2024-07-25 20:02:46,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 536/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 2.8466979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:46,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43578 samples/s/p 5:05:43 } +2024-07-25 20:02:49,745 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 538/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 2.846419e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:49,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43891 samples/s/p 5:05:30 } +2024-07-25 20:02:52,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 540/ 1625], loss: 1.051, per_step_time: 1470ms, lr: 2.84614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:52,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43942 samples/s/p 5:05:25 } +2024-07-25 20:02:55,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 542/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.8458602e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:55,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43759 samples/s/p 5:05:28 } +2024-07-25 20:02:58,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 544/ 1625], loss: 1.299, per_step_time: 1471ms, lr: 2.845581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:02:58,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.3% |███████████ | 5.43680 samples/s/p 5:05:28 } +2024-07-25 20:03:01,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 546/ 1625], loss: 1.136, per_step_time: 1473ms, lr: 2.8453009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:01,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.42826 samples/s/p 5:05:54 } +2024-07-25 20:03:04,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 548/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 2.845021e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 20:03:04,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43862 samples/s/p 5:05:16 } +2024-07-25 20:03:07,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 550/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 2.8447404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:07,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43533 samples/s/p 5:05:24 } +2024-07-25 20:03:10,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 552/ 1625], loss: 1.030, per_step_time: 1472ms, lr: 2.8444598e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:10,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43269 samples/s/p 5:05:30 } +2024-07-25 20:03:13,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 554/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 2.8441791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:13,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43576 samples/s/p 5:05:17 } +2024-07-25 20:03:16,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 556/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 2.843898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:16,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43854 samples/s/p 5:05:04 } +2024-07-25 20:03:19,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 558/ 1625], loss: 1.013, per_step_time: 1469ms, lr: 2.8436167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:19,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.44302 samples/s/p 5:04:46 } +2024-07-25 20:03:22,198 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 560/ 1625], loss: 1.144, per_step_time: 1473ms, lr: 2.8433353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:22,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.4% |███████████ | 5.43046 samples/s/p 5:05:26 } +2024-07-25 20:03:25,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 562/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 2.8430537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:25,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43087 samples/s/p 5:05:21 } +2024-07-25 20:03:28,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 564/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 2.8427714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:28,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43855 samples/s/p 5:04:53 } +2024-07-25 20:03:31,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 566/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 2.8424893e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:31,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43883 samples/s/p 5:04:49 } +2024-07-25 20:03:34,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 568/ 1625], loss: 1.203, per_step_time: 1476ms, lr: 2.8422068e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:34,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.41766 samples/s/p 5:05:57 } +2024-07-25 20:03:36,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 570/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 2.8419241e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:03:36,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43610 samples/s/p 5:04:52 } +2024-07-25 20:03:39,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 572/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 2.841641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:39,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43833 samples/s/p 5:04:42 } +2024-07-25 20:03:42,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 574/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 2.8413579e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:42,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43273 samples/s/p 5:04:57 } +2024-07-25 20:03:45,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 576/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 2.8410743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:45,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.5% |███████████ | 5.43516 samples/s/p 5:04:46 } +2024-07-25 20:03:48,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 578/ 1625], loss: 1.349, per_step_time: 1472ms, lr: 2.8407909e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:48,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43422 samples/s/p 5:04:47 } +2024-07-25 20:03:51,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 580/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.8405067e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:51,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43505 samples/s/p 5:04:41 } +2024-07-25 20:03:54,666 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 582/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 2.8402226e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:54,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43199 samples/s/p 5:04:48 } +2024-07-25 20:03:57,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 584/ 1625], loss: 1.113, per_step_time: 1474ms, lr: 2.8399383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:03:57,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.42557 samples/s/p 5:05:07 } +2024-07-25 20:04:00,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 586/ 1625], loss: 1.062, per_step_time: 1472ms, lr: 2.8396536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:00,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43132 samples/s/p 5:04:45 } +2024-07-25 20:04:03,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 588/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 2.8393688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:03,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43633 samples/s/p 5:04:25 } +2024-07-25 20:04:06,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 590/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 2.8390838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:06,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.44198 samples/s/p 5:04:03 } +2024-07-25 20:04:09,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 592/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 2.8387982e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:04:09,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.6% |███████████ | 5.43769 samples/s/p 5:04:14 } +2024-07-25 20:04:12,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 594/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 2.8385126e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:12,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43771 samples/s/p 5:04:11 } +2024-07-25 20:04:15,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 596/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 2.8382266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:15,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43360 samples/s/p 5:04:22 } +2024-07-25 20:04:18,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 598/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 2.8379409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:18,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43243 samples/s/p 5:04:23 } +2024-07-25 20:04:21,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 600/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 2.8376546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:21,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43530 samples/s/p 5:04:11 } +2024-07-25 20:04:24,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 602/ 1625], loss: 1.389, per_step_time: 1471ms, lr: 2.8373679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:24,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43508 samples/s/p 5:04:08 } +2024-07-25 20:04:27,126 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 604/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 2.8370812e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:27,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43852 samples/s/p 5:03:54 } +2024-07-25 20:04:30,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 606/ 1625], loss: 1.035, per_step_time: 1470ms, lr: 2.8367942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:30,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.44091 samples/s/p 5:03:43 } +2024-07-25 20:04:33,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 608/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 2.836507e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:33,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.7% |███████████ | 5.43754 samples/s/p 5:03:51 } +2024-07-25 20:04:35,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 610/ 1625], loss: 1.061, per_step_time: 1470ms, lr: 2.8362196e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:35,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43870 samples/s/p 5:03:44 } +2024-07-25 20:04:38,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 612/ 1625], loss: 1.135, per_step_time: 1474ms, lr: 2.835932e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:38,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.42594 samples/s/p 5:04:24 } +2024-07-25 20:04:41,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 614/ 1625], loss: 1.297, per_step_time: 1474ms, lr: 2.8356437e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:04:41,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.42680 samples/s/p 5:04:19 } +2024-07-25 20:04:44,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 616/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 2.8353556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:44,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43486 samples/s/p 5:03:48 } +2024-07-25 20:04:47,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 618/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 2.8350672e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:47,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43745 samples/s/p 5:03:37 } +2024-07-25 20:04:50,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 620/ 1625], loss: 1.351, per_step_time: 1471ms, lr: 2.8347786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:50,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43763 samples/s/p 5:03:33 } +2024-07-25 20:04:53,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 622/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.8344895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:53,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.43746 samples/s/p 5:03:31 } +2024-07-25 20:04:56,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 624/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 2.8342007e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:56,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.8% |███████████ | 5.44069 samples/s/p 5:03:17 } +2024-07-25 20:04:59,583 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 626/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 2.8339113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:04:59,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.43066 samples/s/p 5:03:48 } +2024-07-25 20:05:02,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 628/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 2.8336215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:02,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.43220 samples/s/p 5:03:40 } +2024-07-25 20:05:05,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 630/ 1625], loss: 1.062, per_step_time: 1473ms, lr: 2.8333317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:05,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.42884 samples/s/p 5:03:48 } +2024-07-25 20:05:08,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 632/ 1625], loss: 1.066, per_step_time: 1473ms, lr: 2.8330414e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:08,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.42766 samples/s/p 5:03:49 } +2024-07-25 20:05:11,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 634/ 1625], loss: 1.235, per_step_time: 1473ms, lr: 2.8327513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:11,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.42887 samples/s/p 5:03:42 } +2024-07-25 20:05:14,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 636/ 1625], loss: 1.156, per_step_time: 1473ms, lr: 2.8324606e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:05:14,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.42937 samples/s/p 5:03:37 } +2024-07-25 20:05:17,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 638/ 1625], loss: 0.975, per_step_time: 1471ms, lr: 2.83217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:17,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.43548 samples/s/p 5:03:14 } +2024-07-25 20:05:20,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 640/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 2.831879e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:20,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 23.9% |███████████ | 5.43470 samples/s/p 5:03:14 } +2024-07-25 20:05:23,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 642/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 2.8315875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:23,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.43852 samples/s/p 5:02:58 } +2024-07-25 20:05:26,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 644/ 1625], loss: 1.260, per_step_time: 1473ms, lr: 2.831296e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:26,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.42843 samples/s/p 5:03:29 } +2024-07-25 20:05:29,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 646/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 2.8310042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:29,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.43702 samples/s/p 5:02:57 } +2024-07-25 20:05:32,063 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 648/ 1625], loss: 1.377, per_step_time: 1474ms, lr: 2.8307122e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:32,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |███████████ | 5.42662 samples/s/p 5:03:29 } +2024-07-25 20:05:35,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 650/ 1625], loss: 1.391, per_step_time: 1470ms, lr: 2.8304199e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:35,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.44107 samples/s/p 5:02:38 } +2024-07-25 20:05:37,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 652/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 2.8301274e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:37,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.43767 samples/s/p 5:02:46 } +2024-07-25 20:05:40,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 654/ 1625], loss: 1.057, per_step_time: 1473ms, lr: 2.8298351e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:40,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.42823 samples/s/p 5:03:15 } +2024-07-25 20:05:43,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 656/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 2.829542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:43,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.43788 samples/s/p 5:02:40 } +2024-07-25 20:05:46,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 658/ 1625], loss: 1.197, per_step_time: 1470ms, lr: 2.829249e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:05:46,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.0% |████████████ | 5.43969 samples/s/p 5:02:31 } +2024-07-25 20:05:49,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 660/ 1625], loss: 1.343, per_step_time: 1471ms, lr: 2.8289556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:49,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43659 samples/s/p 5:02:38 } +2024-07-25 20:05:52,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 662/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 2.828662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:52,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43547 samples/s/p 5:02:39 } +2024-07-25 20:05:55,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 664/ 1625], loss: 1.308, per_step_time: 1472ms, lr: 2.8283679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:55,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43114 samples/s/p 5:02:50 } +2024-07-25 20:05:58,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 666/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 2.8280738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:05:58,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43294 samples/s/p 5:02:41 } +2024-07-25 20:06:01,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 668/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 2.8277795e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:01,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43431 samples/s/p 5:02:34 } +2024-07-25 
20:06:04,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 670/ 1625], loss: 1.256, per_step_time: 1470ms, lr: 2.827485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:04,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43956 samples/s/p 5:02:13 } +2024-07-25 20:06:07,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 672/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 2.8271901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:07,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43667 samples/s/p 5:02:20 } +2024-07-25 20:06:10,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 674/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 2.826895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:10,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.1% |████████████ | 5.43495 samples/s/p 5:02:23 } +2024-07-25 20:06:13,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 676/ 1625], loss: 1.134, per_step_time: 1470ms, lr: 2.8265997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:13,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43898 samples/s/p 5:02:06 } +2024-07-25 20:06:16,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 678/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 2.826304e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:16,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43149 samples/s/p 5:02:28 } +2024-07-25 20:06:19,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 680/ 1625], loss: 1.368, per_step_time: 1473ms, lr: 2.8260083e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:06:19,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43023 samples/s/p 5:02:30 } +2024-07-25 20:06:22,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 682/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 2.8257125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:22,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43383 samples/s/p 5:02:15 } +2024-07-25 20:06:25,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 684/ 1625], loss: 1.144, per_step_time: 1472ms, lr: 2.8254162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:25,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43475 samples/s/p 5:02:09 } +2024-07-25 20:06:28,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 686/ 1625], loss: 0.980, per_step_time: 1470ms, lr: 2.8251197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:28,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.44170 samples/s/p 5:01:43 } +2024-07-25 20:06:31,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 688/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 2.8248229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:31,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.43164 samples/s/p 5:02:13 } +2024-07-25 20:06:34,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 690/ 1625], loss: 1.326, per_step_time: 1473ms, lr: 2.824526e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:34,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.2% |████████████ | 5.42769 samples/s/p 5:02:24 } 
+2024-07-25 20:06:36,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 692/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.8242288e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:36,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43357 samples/s/p 5:02:01 } +2024-07-25 20:06:39,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 694/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.8239314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:39,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43129 samples/s/p 5:02:06 } +2024-07-25 20:06:42,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 696/ 1625], loss: 1.245, per_step_time: 1471ms, lr: 2.8236338e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:42,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43622 samples/s/p 5:01:46 } +2024-07-25 20:06:45,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 698/ 1625], loss: 1.226, per_step_time: 1473ms, lr: 2.823336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:45,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43056 samples/s/p 5:02:02 } +2024-07-25 20:06:48,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 700/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 2.8230377e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:48,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43268 samples/s/p 5:01:52 } +2024-07-25 20:06:51,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 702/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 
2.8227394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:51,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43264 samples/s/p 5:01:49 } +2024-07-25 20:06:54,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 704/ 1625], loss: 1.274, per_step_time: 1473ms, lr: 2.8224411e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:54,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.42985 samples/s/p 5:01:56 } +2024-07-25 20:06:57,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 706/ 1625], loss: 1.317, per_step_time: 1471ms, lr: 2.822142e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:06:57,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.3% |████████████ | 5.43609 samples/s/p 5:01:32 } +2024-07-25 20:07:00,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 708/ 1625], loss: 1.182, per_step_time: 1474ms, lr: 2.8218434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:00,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.42556 samples/s/p 5:02:04 } +2024-07-25 20:07:03,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 710/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 2.821544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:03,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.42995 samples/s/p 5:01:46 } +2024-07-25 20:07:06,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 712/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 2.8212444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:06,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43452 
samples/s/p 5:01:28 } +2024-07-25 20:07:09,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 714/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.8209444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:09,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43522 samples/s/p 5:01:23 } +2024-07-25 20:07:12,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 716/ 1625], loss: 1.227, per_step_time: 1470ms, lr: 2.8206448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:12,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43996 samples/s/p 5:01:04 } +2024-07-25 20:07:15,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 718/ 1625], loss: 1.190, per_step_time: 1474ms, lr: 2.8203443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:15,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.42590 samples/s/p 5:01:48 } +2024-07-25 20:07:18,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 720/ 1625], loss: 1.027, per_step_time: 1473ms, lr: 2.8200438e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:18,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43070 samples/s/p 5:01:29 } +2024-07-25 20:07:21,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 722/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 2.8197432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:21,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.4% |████████████ | 5.43763 samples/s/p 5:01:03 } +2024-07-25 20:07:24,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 724/ 1625], loss: 1.173, per_step_time: 
1470ms, lr: 2.8194423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:24,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43948 samples/s/p 5:00:54 } +2024-07-25 20:07:27,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 726/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.819141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:27,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43553 samples/s/p 5:01:04 } +2024-07-25 20:07:30,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 728/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 2.8188399e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:30,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.42995 samples/s/p 5:01:20 } +2024-07-25 20:07:33,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 730/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.818538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:33,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43123 samples/s/p 5:01:13 } +2024-07-25 20:07:36,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 732/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.8182361e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:36,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43613 samples/s/p 5:00:54 } +2024-07-25 20:07:38,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 734/ 1625], loss: 1.320, per_step_time: 1472ms, lr: 2.817934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:38,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 
5.43411 samples/s/p 5:00:57 } +2024-07-25 20:07:41,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 736/ 1625], loss: 1.435, per_step_time: 1471ms, lr: 2.8176317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:41,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43524 samples/s/p 5:00:51 } +2024-07-25 20:07:44,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 738/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 2.817329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:44,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.5% |████████████ | 5.43301 samples/s/p 5:00:55 } +2024-07-25 20:07:47,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 740/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 2.8170265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:47,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.44003 samples/s/p 5:00:29 } +2024-07-25 20:07:50,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 742/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 2.8167233e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:50,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43603 samples/s/p 5:00:39 } +2024-07-25 20:07:53,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 744/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 2.8164202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:53,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43324 samples/s/p 5:00:45 } +2024-07-25 20:07:56,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 746/ 1625], loss: 1.239, 
per_step_time: 1471ms, lr: 2.8161166e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:56,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43634 samples/s/p 5:00:32 } +2024-07-25 20:07:59,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 748/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 2.8158129e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:07:59,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43221 samples/s/p 5:00:43 } +2024-07-25 20:08:02,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 750/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.815509e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:02,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43827 samples/s/p 5:00:20 } +2024-07-25 20:08:05,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 752/ 1625], loss: 1.284, per_step_time: 1473ms, lr: 2.8152048e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:05,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43003 samples/s/p 5:00:44 } +2024-07-25 20:08:08,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 754/ 1625], loss: 1.219, per_step_time: 1470ms, lr: 2.8149003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:08,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.6% |████████████ | 5.43919 samples/s/p 5:00:11 } +2024-07-25 20:08:11,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 756/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.8145956e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:11,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% 
|████████████ | 5.43507 samples/s/p 5:00:22 } +2024-07-25 20:08:14,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 758/ 1625], loss: 1.360, per_step_time: 1471ms, lr: 2.8142907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:14,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43743 samples/s/p 5:00:11 } +2024-07-25 20:08:17,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 760/ 1625], loss: 1.331, per_step_time: 1473ms, lr: 2.8139855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:17,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43053 samples/s/p 5:00:31 } +2024-07-25 20:08:20,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 762/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.8136801e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:20,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43613 samples/s/p 5:00:09 } +2024-07-25 20:08:23,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 764/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 2.8133745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:23,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43257 samples/s/p 5:00:18 } +2024-07-25 20:08:26,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 766/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.8130687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:26,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43665 samples/s/p 5:00:02 } +2024-07-25 20:08:29,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 768/ 1625], loss: 
1.185, per_step_time: 1472ms, lr: 2.8127626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:29,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43238 samples/s/p 5:00:13 } +2024-07-25 20:08:32,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 770/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.8124563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:32,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.7% |████████████ | 5.43168 samples/s/p 5:00:12 } +2024-07-25 20:08:35,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 772/ 1625], loss: 1.004, per_step_time: 1470ms, lr: 2.8121498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:35,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43856 samples/s/p 4:59:47 } +2024-07-25 20:08:37,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 774/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 2.8118431e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:37,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.44205 samples/s/p 4:59:32 } +2024-07-25 20:08:40,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 776/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 2.811536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:40,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43989 samples/s/p 4:59:36 } +2024-07-25 20:08:43,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 778/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 2.8112287e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:43,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
24.8% |████████████ | 5.43875 samples/s/p 4:59:37 } +2024-07-25 20:08:46,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 780/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 2.8109214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:46,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43972 samples/s/p 4:59:31 } +2024-07-25 20:08:49,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 782/ 1625], loss: 1.063, per_step_time: 1473ms, lr: 2.8106135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:49,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43007 samples/s/p 5:00:00 } +2024-07-25 20:08:52,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 784/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 2.8103057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:52,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43257 samples/s/p 4:59:49 } +2024-07-25 20:08:55,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 786/ 1625], loss: 1.206, per_step_time: 1469ms, lr: 2.8099974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:55,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.44467 samples/s/p 4:59:06 } +2024-07-25 20:08:58,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 788/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 2.8096889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:08:58,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.8% |████████████ | 5.43456 samples/s/p 4:59:36 } +2024-07-25 20:09:01,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 790/ 1625], 
loss: 1.223, per_step_time: 1470ms, lr: 2.8093804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:01,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43868 samples/s/p 4:59:20 } +2024-07-25 20:09:04,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 792/ 1625], loss: 1.290, per_step_time: 1471ms, lr: 2.8090715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:04,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43609 samples/s/p 4:59:25 } +2024-07-25 20:09:07,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 794/ 1625], loss: 1.017, per_step_time: 1471ms, lr: 2.8087625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:07,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43783 samples/s/p 4:59:17 } +2024-07-25 20:09:10,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 796/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.8084534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:10,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43193 samples/s/p 4:59:33 } +2024-07-25 20:09:13,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 798/ 1625], loss: 1.312, per_step_time: 1473ms, lr: 2.8081437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:13,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.42980 samples/s/p 4:59:37 } +2024-07-25 20:09:16,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 800/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 2.8078339e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:16,337 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 24.9% |████████████ | 5.43866 samples/s/p 4:59:05 } +2024-07-25 20:09:19,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 802/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 2.8075237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:19,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43121 samples/s/p 4:59:27 } +2024-07-25 20:09:22,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 804/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 2.8072136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:22,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 24.9% |████████████ | 5.43057 samples/s/p 4:59:26 } +2024-07-25 20:09:25,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 806/ 1625], loss: 1.049, per_step_time: 1472ms, lr: 2.8069033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:25,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43309 samples/s/p 4:59:15 } +2024-07-25 20:09:28,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 808/ 1625], loss: 1.130, per_step_time: 1469ms, lr: 2.8065924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:28,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.44285 samples/s/p 4:58:40 } +2024-07-25 20:09:31,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 810/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 2.8062814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:31,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43258 samples/s/p 4:59:10 } +2024-07-25 20:09:34,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 812/ 
1625], loss: 1.173, per_step_time: 1470ms, lr: 2.8059701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:34,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43859 samples/s/p 4:58:48 } +2024-07-25 20:09:36,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 814/ 1625], loss: 1.341, per_step_time: 1471ms, lr: 2.8056587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:36,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43601 samples/s/p 4:58:53 } +2024-07-25 20:09:39,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 816/ 1625], loss: 1.202, per_step_time: 1470ms, lr: 2.8053471e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:39,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.43938 samples/s/p 4:58:39 } +2024-07-25 20:09:42,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 818/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 2.8050354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:42,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.42973 samples/s/p 4:59:08 } +2024-07-25 20:09:45,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 820/ 1625], loss: 1.054, per_step_time: 1470ms, lr: 2.8047232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:45,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.0% |████████████ | 5.44120 samples/s/p 4:58:27 } +2024-07-25 20:09:48,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 822/ 1625], loss: 1.267, per_step_time: 1474ms, lr: 2.8044109e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:48,798 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.42674 samples/s/p 4:59:12 } +2024-07-25 20:09:51,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 824/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 2.8040982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:51,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43389 samples/s/p 4:58:46 } +2024-07-25 20:09:54,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 826/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.8037857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:54,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43457 samples/s/p 4:58:40 } +2024-07-25 20:09:57,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 828/ 1625], loss: 1.145, per_step_time: 1470ms, lr: 2.8034725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:09:57,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43981 samples/s/p 4:58:20 } +2024-07-25 20:10:00,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 830/ 1625], loss: 1.069, per_step_time: 1473ms, lr: 2.8031593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:00,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.42790 samples/s/p 4:58:56 } +2024-07-25 20:10:03,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 832/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 2.8028457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:03,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43787 samples/s/p 4:58:21 } +2024-07-25 20:10:06,500 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 834/ 1625], loss: 1.221, per_step_time: 1470ms, lr: 2.802532e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:06,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43983 samples/s/p 4:58:11 } +2024-07-25 20:10:09,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 836/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.8022181e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:09,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.1% |████████████ | 5.43163 samples/s/p 4:58:35 } +2024-07-25 20:10:12,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 838/ 1625], loss: 1.223, per_step_time: 1474ms, lr: 2.8019038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:12,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.42725 samples/s/p 4:58:47 } +2024-07-25 20:10:15,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 840/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.8015895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:15,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.43778 samples/s/p 4:58:09 } +2024-07-25 20:10:18,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 842/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 2.8012748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:18,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.43444 samples/s/p 4:58:17 } +2024-07-25 20:10:21,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 844/ 1625], loss: 1.199, per_step_time: 1469ms, lr: 2.80096e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 20:10:21,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.44467 samples/s/p 4:57:41 } +2024-07-25 20:10:24,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 846/ 1625], loss: 1.312, per_step_time: 1470ms, lr: 2.8006447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:24,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.43946 samples/s/p 4:57:55 } +2024-07-25 20:10:27,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 848/ 1625], loss: 1.213, per_step_time: 1474ms, lr: 2.8003293e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:27,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.42721 samples/s/p 4:58:32 } +2024-07-25 20:10:30,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 850/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.8000139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:30,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.43248 samples/s/p 4:58:12 } +2024-07-25 20:10:33,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 852/ 1625], loss: 1.193, per_step_time: 1469ms, lr: 2.799698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:33,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.2% |████████████ | 5.44384 samples/s/p 4:57:32 } +2024-07-25 20:10:36,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 854/ 1625], loss: 1.300, per_step_time: 1470ms, lr: 2.7993821e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:36,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43960 samples/s/p 4:57:43 } +2024-07-25 
20:10:38,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 856/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 2.7990658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:38,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43378 samples/s/p 4:57:59 } +2024-07-25 20:10:41,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 858/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 2.7987491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:41,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43378 samples/s/p 4:57:56 } +2024-07-25 20:10:44,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 860/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.7984324e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:44,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43330 samples/s/p 4:57:54 } +2024-07-25 20:10:47,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 862/ 1625], loss: 1.279, per_step_time: 1470ms, lr: 2.7981154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:47,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.44203 samples/s/p 4:57:23 } +2024-07-25 20:10:50,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 864/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 2.7977982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:50,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43331 samples/s/p 4:57:49 } +2024-07-25 20:10:53,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 866/ 1625], loss: 0.923, per_step_time: 1470ms, lr: 2.7974807e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:10:53,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.43998 samples/s/p 4:57:24 } +2024-07-25 20:10:56,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 868/ 1625], loss: 1.200, per_step_time: 1473ms, lr: 2.7971631e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:56,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.3% |████████████ | 5.42778 samples/s/p 4:58:01 } +2024-07-25 20:10:59,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 870/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 2.7968452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:10:59,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.42990 samples/s/p 4:57:51 } +2024-07-25 20:11:02,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 872/ 1625], loss: 1.453, per_step_time: 1472ms, lr: 2.7965272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:02,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43464 samples/s/p 4:57:32 } +2024-07-25 20:11:05,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 874/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.7962087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:05,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43201 samples/s/p 4:57:38 } +2024-07-25 20:11:08,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 876/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.7958902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:08,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43411 samples/s/p 4:57:28 } 
+2024-07-25 20:11:11,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 878/ 1625], loss: 1.262, per_step_time: 1473ms, lr: 2.7955713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:11,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43085 samples/s/p 4:57:36 } +2024-07-25 20:11:14,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 880/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 2.7952523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:14,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43588 samples/s/p 4:57:17 } +2024-07-25 20:11:17,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 882/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 2.794933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:17,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.43618 samples/s/p 4:57:13 } +2024-07-25 20:11:20,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 884/ 1625], loss: 1.304, per_step_time: 1477ms, lr: 2.7946136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:20,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.4% |████████████ | 5.41634 samples/s/p 4:58:15 } +2024-07-25 20:11:23,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 886/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 2.7942939e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:23,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43762 samples/s/p 4:57:02 } +2024-07-25 20:11:26,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 888/ 1625], loss: 1.280, per_step_time: 1473ms, lr: 
2.7939739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:26,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.42942 samples/s/p 4:57:26 } +2024-07-25 20:11:29,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 890/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.7936538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:29,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43389 samples/s/p 4:57:08 } +2024-07-25 20:11:32,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 892/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.7933336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:32,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43326 samples/s/p 4:57:07 } +2024-07-25 20:11:35,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 894/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.7930128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:35,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.44209 samples/s/p 4:56:36 } +2024-07-25 20:11:37,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 896/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.7926919e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:37,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43296 samples/s/p 4:57:03 } +2024-07-25 20:11:40,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 898/ 1625], loss: 1.071, per_step_time: 1473ms, lr: 2.7923708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:40,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43089 
samples/s/p 4:57:06 } +2024-07-25 20:11:43,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 900/ 1625], loss: 1.450, per_step_time: 1472ms, lr: 2.7920494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:43,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.5% |████████████ | 5.43437 samples/s/p 4:56:52 } +2024-07-25 20:11:46,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 902/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.7917278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:46,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43631 samples/s/p 4:56:43 } +2024-07-25 20:11:49,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 904/ 1625], loss: 1.411, per_step_time: 1472ms, lr: 2.791406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:49,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43367 samples/s/p 4:56:48 } +2024-07-25 20:11:52,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 906/ 1625], loss: 1.151, per_step_time: 1470ms, lr: 2.791084e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:52,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43996 samples/s/p 4:56:25 } +2024-07-25 20:11:55,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 908/ 1625], loss: 1.329, per_step_time: 1471ms, lr: 2.7907618e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:55,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43799 samples/s/p 4:56:28 } +2024-07-25 20:11:58,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 910/ 1625], loss: 1.191, per_step_time: 
1470ms, lr: 2.7904392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:11:58,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43909 samples/s/p 4:56:22 } +2024-07-25 20:12:01,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 912/ 1625], loss: 1.255, per_step_time: 1473ms, lr: 2.7901167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:01,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.42816 samples/s/p 4:56:55 } +2024-07-25 20:12:04,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 914/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.7897937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:04,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43662 samples/s/p 4:56:24 } +2024-07-25 20:12:07,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 916/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.7894706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:07,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43192 samples/s/p 4:56:37 } +2024-07-25 20:12:10,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 918/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 2.7891474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:10,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.6% |████████████ | 5.43201 samples/s/p 4:56:33 } +2024-07-25 20:12:13,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 920/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 2.7888234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:13,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 
5.44069 samples/s/p 4:56:02 } +2024-07-25 20:12:16,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 922/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 2.7884998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:16,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43146 samples/s/p 4:56:29 } +2024-07-25 20:12:19,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 924/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 2.7881757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:19,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43847 samples/s/p 4:56:03 } +2024-07-25 20:12:22,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 926/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.7878514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:22,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43601 samples/s/p 4:56:08 } +2024-07-25 20:12:25,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 928/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 2.7875269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:25,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43629 samples/s/p 4:56:05 } +2024-07-25 20:12:28,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 930/ 1625], loss: 1.020, per_step_time: 1471ms, lr: 2.7872022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:28,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43583 samples/s/p 4:56:03 } +2024-07-25 20:12:31,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 932/ 1625], loss: 1.220, 
per_step_time: 1471ms, lr: 2.7868771e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:31,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43701 samples/s/p 4:55:56 } +2024-07-25 20:12:34,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 934/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 2.7865519e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:34,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.7% |████████████ | 5.43926 samples/s/p 4:55:46 } +2024-07-25 20:12:36,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 936/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 2.7862265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:36,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43863 samples/s/p 4:55:45 } +2024-07-25 20:12:39,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 938/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 2.7859009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:39,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43311 samples/s/p 4:56:00 } +2024-07-25 20:12:42,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 940/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.7855749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:42,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43719 samples/s/p 4:55:44 } +2024-07-25 20:12:45,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 942/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 2.7852488e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:45,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% 
|████████████ | 5.43560 samples/s/p 4:55:46 } +2024-07-25 20:12:48,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 944/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 2.7849223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:48,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43667 samples/s/p 4:55:40 } +2024-07-25 20:12:51,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 946/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 2.7845957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:51,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43897 samples/s/p 4:55:29 } +2024-07-25 20:12:54,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 948/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 2.7842689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:54,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43184 samples/s/p 4:55:50 } +2024-07-25 20:12:57,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 950/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.7839418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:12:57,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.8% |████████████ | 5.43721 samples/s/p 4:55:29 } +2024-07-25 20:12:57,652 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 20:13:33,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 952/ 1625], loss: 1.211, per_step_time: 1570ms, lr: 2.7836148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:33,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.09265 samples/s/p 5:15:26 } +2024-07-25 20:13:35,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 954/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.783287e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:35,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43339 samples/s/p 4:55:36 } +2024-07-25 20:13:38,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 956/ 1625], loss: 1.364, per_step_time: 1472ms, lr: 2.7829592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:38,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43348 samples/s/p 4:55:33 } +2024-07-25 20:13:41,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 958/ 1625], loss: 1.083, per_step_time: 1470ms, lr: 2.7826314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:41,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43964 samples/s/p 4:55:10 } +2024-07-25 20:13:44,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 960/ 1625], loss: 1.353, per_step_time: 1472ms, lr: 2.7823033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:44,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43436 samples/s/p 4:55:24 } +2024-07-25 20:13:47,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 962/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 
2.7819746e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:47,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43847 samples/s/p 4:55:07 } +2024-07-25 20:13:50,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 964/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 2.7816463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:50,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43237 samples/s/p 4:55:24 } +2024-07-25 20:13:53,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 966/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 2.7813174e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:53,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 25.9% |████████████ | 5.43601 samples/s/p 4:55:10 } +2024-07-25 20:13:56,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 968/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 2.780988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:56,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.43976 samples/s/p 4:54:54 } +2024-07-25 20:13:59,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 970/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.7806589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:13:59,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.43602 samples/s/p 4:55:04 } +2024-07-25 20:14:02,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 972/ 1625], loss: 1.335, per_step_time: 1472ms, lr: 2.7803293e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:02,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.43241 
samples/s/p 4:55:12 } +2024-07-25 20:14:05,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 974/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 2.7799997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:05,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |████████████ | 5.43179 samples/s/p 4:55:12 } +2024-07-25 20:14:08,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 976/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 2.7796697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:08,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.43285 samples/s/p 4:55:05 } +2024-07-25 20:14:11,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 978/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.7793394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:11,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.43397 samples/s/p 4:54:59 } +2024-07-25 20:14:14,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 980/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 2.7790089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:14,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.43700 samples/s/p 4:54:46 } +2024-07-25 20:14:17,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 982/ 1625], loss: 0.806, per_step_time: 1471ms, lr: 2.7786784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:17,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.0% |█████████████ | 5.43515 samples/s/p 4:54:49 } +2024-07-25 20:14:20,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 984/ 1625], loss: 1.072, 
per_step_time: 1471ms, lr: 2.7783473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:20,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43705 samples/s/p 4:54:40 } +2024-07-25 20:14:23,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 986/ 1625], loss: 1.046, per_step_time: 1470ms, lr: 2.7780163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:23,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43911 samples/s/p 4:54:30 } +2024-07-25 20:14:26,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 988/ 1625], loss: 1.323, per_step_time: 1471ms, lr: 2.7776849e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:26,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43786 samples/s/p 4:54:31 } +2024-07-25 20:14:29,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 990/ 1625], loss: 1.321, per_step_time: 1471ms, lr: 2.7773533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:29,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43832 samples/s/p 4:54:27 } +2024-07-25 20:14:32,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 992/ 1625], loss: 1.147, per_step_time: 1473ms, lr: 2.7770213e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:32,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43079 samples/s/p 4:54:48 } +2024-07-25 20:14:35,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 994/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.7766893e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:35,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
26.1% |█████████████ | 5.43352 samples/s/p 4:54:36 } +2024-07-25 20:14:37,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 996/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 2.7763572e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:37,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43520 samples/s/p 4:54:28 } +2024-07-25 20:14:40,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 998/ 1625], loss: 0.991, per_step_time: 1471ms, lr: 2.7760247e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:40,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.1% |█████████████ | 5.43823 samples/s/p 4:54:15 } +2024-07-25 20:14:43,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1000/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.7756918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:43,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43248 samples/s/p 4:54:31 } +2024-07-25 20:14:46,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1002/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 2.775359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:46,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43992 samples/s/p 4:54:04 } +2024-07-25 20:14:49,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1004/ 1625], loss: 1.410, per_step_time: 1470ms, lr: 2.775026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:49,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.44074 samples/s/p 4:53:58 } +2024-07-25 20:14:52,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 
1006/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 2.7746924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:52,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43964 samples/s/p 4:53:59 } +2024-07-25 20:14:55,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1008/ 1625], loss: 1.236, per_step_time: 1473ms, lr: 2.7743588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:55,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.42741 samples/s/p 4:54:36 } +2024-07-25 20:14:58,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1010/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 2.774025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:14:58,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43876 samples/s/p 4:53:56 } +2024-07-25 20:15:01,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1012/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 2.7736909e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:01,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43325 samples/s/p 4:54:11 } +2024-07-25 20:15:04,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1014/ 1625], loss: 1.027, per_step_time: 1471ms, lr: 2.7733566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:04,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.2% |█████████████ | 5.43831 samples/s/p 4:53:51 } +2024-07-25 20:15:07,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1016/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 2.7730222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:07,459 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43244 samples/s/p 4:54:08 } +2024-07-25 20:15:10,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1018/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 2.7726874e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:10,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43333 samples/s/p 4:54:02 } +2024-07-25 20:15:13,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1020/ 1625], loss: 0.972, per_step_time: 1470ms, lr: 2.7723525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:13,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43940 samples/s/p 4:53:39 } +2024-07-25 20:15:16,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1022/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.7720173e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:16,310 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43406 samples/s/p 4:53:53 } +2024-07-25 20:15:19,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1024/ 1625], loss: 1.382, per_step_time: 1474ms, lr: 2.7716818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:19,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.42624 samples/s/p 4:54:16 } +2024-07-25 20:15:22,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1026/ 1625], loss: 1.045, per_step_time: 1473ms, lr: 2.771346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:22,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43067 samples/s/p 4:53:59 } +2024-07-25 20:15:25,169 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1028/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 2.7710103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:25,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.43528 samples/s/p 4:53:41 } +2024-07-25 20:15:28,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1030/ 1625], loss: 1.203, per_step_time: 1473ms, lr: 2.7706741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:28,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.3% |█████████████ | 5.42797 samples/s/p 4:54:01 } +2024-07-25 20:15:31,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1032/ 1625], loss: 1.200, per_step_time: 1469ms, lr: 2.7703378e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:31,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.44222 samples/s/p 4:53:12 } +2024-07-25 20:15:34,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1034/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.7700013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:34,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43529 samples/s/p 4:53:32 } +2024-07-25 20:15:36,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1036/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 2.7696644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:36,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43962 samples/s/p 4:53:15 } +2024-07-25 20:15:39,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1038/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 2.7693275e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:15:39,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43501 samples/s/p 4:53:27 } +2024-07-25 20:15:42,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1040/ 1625], loss: 1.193, per_step_time: 1474ms, lr: 2.7689903e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:42,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.42491 samples/s/p 4:53:57 } +2024-07-25 20:15:45,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1042/ 1625], loss: 0.997, per_step_time: 1471ms, lr: 2.7686527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:45,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43742 samples/s/p 4:53:13 } +2024-07-25 20:15:48,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1044/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 2.768315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:48,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.42964 samples/s/p 4:53:35 } +2024-07-25 20:15:51,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1046/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.7679771e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:51,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43545 samples/s/p 4:53:14 } +2024-07-25 20:15:54,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1048/ 1625], loss: 1.017, per_step_time: 1471ms, lr: 2.7676391e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:54,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.4% |█████████████ | 5.43724 samples/s/p 4:53:05 
} +2024-07-25 20:15:57,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1050/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.7673008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:15:57,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43587 samples/s/p 4:53:06 } +2024-07-25 20:16:00,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1052/ 1625], loss: 1.420, per_step_time: 1472ms, lr: 2.766962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:00,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43226 samples/s/p 4:53:15 } +2024-07-25 20:16:03,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1054/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 2.7666232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:03,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.44091 samples/s/p 4:52:44 } +2024-07-25 20:16:06,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1056/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.766284e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:06,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.42960 samples/s/p 4:53:18 } +2024-07-25 20:16:09,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1058/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.765945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:09,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43827 samples/s/p 4:52:47 } +2024-07-25 20:16:12,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1060/ 1625], loss: 1.163, per_step_time: 1473ms, lr: 
2.7656057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:12,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.42993 samples/s/p 4:53:11 } +2024-07-25 20:16:15,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1062/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 2.7652659e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:15,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43147 samples/s/p 4:53:03 } +2024-07-25 20:16:18,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1064/ 1625], loss: 1.122, per_step_time: 1473ms, lr: 2.764926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:18,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.5% |█████████████ | 5.43067 samples/s/p 4:53:03 } +2024-07-25 20:16:21,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1066/ 1625], loss: 1.355, per_step_time: 1471ms, lr: 2.764586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:21,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43658 samples/s/p 4:52:41 } +2024-07-25 20:16:24,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1068/ 1625], loss: 1.314, per_step_time: 1473ms, lr: 2.7642454e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:24,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.42778 samples/s/p 4:53:06 } +2024-07-25 20:16:27,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1070/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 2.763905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:27,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 
5.43622 samples/s/p 4:52:36 } +2024-07-25 20:16:30,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1072/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.763564e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:30,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43222 samples/s/p 4:52:46 } +2024-07-25 20:16:33,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1074/ 1625], loss: 1.086, per_step_time: 1482ms, lr: 2.7632228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:33,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.39698 samples/s/p 4:54:38 } +2024-07-25 20:16:36,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1076/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.7628816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:36,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43479 samples/s/p 4:52:32 } +2024-07-25 20:16:38,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1078/ 1625], loss: 1.014, per_step_time: 1471ms, lr: 2.7625401e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:38,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43717 samples/s/p 4:52:21 } +2024-07-25 20:16:41,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1080/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 2.7621985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:41,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.6% |█████████████ | 5.43885 samples/s/p 4:52:13 } +2024-07-25 20:16:44,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1082/ 1625], loss: 
1.135, per_step_time: 1472ms, lr: 2.7618566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:44,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.43455 samples/s/p 4:52:24 } +2024-07-25 20:16:47,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1084/ 1625], loss: 1.050, per_step_time: 1473ms, lr: 2.7615144e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:47,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.42983 samples/s/p 4:52:36 } +2024-07-25 20:16:50,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1086/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 2.7611719e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:50,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.43304 samples/s/p 4:52:23 } +2024-07-25 20:16:53,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1088/ 1625], loss: 1.078, per_step_time: 1474ms, lr: 2.7608294e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:53,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.42615 samples/s/p 4:52:42 } +2024-07-25 20:16:56,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1090/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 2.7604865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:56,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.43786 samples/s/p 4:52:01 } +2024-07-25 20:16:59,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1092/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 2.7601433e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:16:59,639 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 26.7% |█████████████ | 5.43462 samples/s/p 4:52:09 } +2024-07-25 20:17:02,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1094/ 1625], loss: 1.117, per_step_time: 1475ms, lr: 2.7598004e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:02,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.42181 samples/s/p 4:52:47 } +2024-07-25 20:17:05,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1096/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 2.7594568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:05,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.7% |█████████████ | 5.43403 samples/s/p 4:52:05 } +2024-07-25 20:17:08,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1098/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 2.759113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:08,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43397 samples/s/p 4:52:02 } +2024-07-25 20:17:11,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1100/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 2.758769e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:11,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43805 samples/s/p 4:51:46 } +2024-07-25 20:17:14,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1102/ 1625], loss: 1.244, per_step_time: 1473ms, lr: 2.7584249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:14,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43028 samples/s/p 4:52:08 } +2024-07-25 20:17:17,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], 
step:[ 1104/ 1625], loss: 1.382, per_step_time: 1471ms, lr: 2.7580805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:17,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43582 samples/s/p 4:51:47 } +2024-07-25 20:17:20,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1106/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 2.7577358e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:20,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43857 samples/s/p 4:51:35 } +2024-07-25 20:17:23,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1108/ 1625], loss: 1.325, per_step_time: 1473ms, lr: 2.7573911e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:23,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.42958 samples/s/p 4:52:01 } +2024-07-25 20:17:26,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1110/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 2.7570459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:26,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43456 samples/s/p 4:51:42 } +2024-07-25 20:17:29,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1112/ 1625], loss: 1.153, per_step_time: 1470ms, lr: 2.7567006e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:29,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.8% |█████████████ | 5.43887 samples/s/p 4:51:25 } +2024-07-25 20:17:32,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1114/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 2.756355e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:32,131 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.43659 samples/s/p 4:51:30 } +2024-07-25 20:17:35,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1116/ 1625], loss: 1.316, per_step_time: 1470ms, lr: 2.7560092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:35,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.44099 samples/s/p 4:51:13 } +2024-07-25 20:17:38,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1118/ 1625], loss: 1.126, per_step_time: 1473ms, lr: 2.7556633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:38,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.43008 samples/s/p 4:51:45 } +2024-07-25 20:17:40,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1120/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 2.7553173e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:40,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.43322 samples/s/p 4:51:32 } +2024-07-25 20:17:43,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1122/ 1625], loss: 1.196, per_step_time: 1474ms, lr: 2.7549708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:43,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.42693 samples/s/p 4:51:49 } +2024-07-25 20:17:46,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1124/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.754624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:46,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.43033 samples/s/p 4:51:35 } +2024-07-25 20:17:49,847 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1126/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 2.7542774e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:49,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.42905 samples/s/p 4:51:36 } +2024-07-25 20:17:52,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1128/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.7539303e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:52,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 26.9% |█████████████ | 5.43414 samples/s/p 4:51:17 } +2024-07-25 20:17:55,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1130/ 1625], loss: 1.198, per_step_time: 1470ms, lr: 2.7535827e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:55,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43941 samples/s/p 4:50:57 } +2024-07-25 20:17:58,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1132/ 1625], loss: 1.112, per_step_time: 1469ms, lr: 2.7532353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:17:58,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.44271 samples/s/p 4:50:44 } +2024-07-25 20:18:01,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1134/ 1625], loss: 1.421, per_step_time: 1471ms, lr: 2.7528875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:01,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43720 samples/s/p 4:50:58 } +2024-07-25 20:18:04,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1136/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.7525399e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:18:04,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43448 samples/s/p 4:51:04 } +2024-07-25 20:18:07,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1138/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 2.7521915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:07,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43153 samples/s/p 4:51:11 } +2024-07-25 20:18:10,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1140/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.751843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:10,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43627 samples/s/p 4:50:53 } +2024-07-25 20:18:13,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1142/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 2.7514943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:13,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43588 samples/s/p 4:50:51 } +2024-07-25 20:18:16,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1144/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.7511456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:16,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.0% |█████████████ | 5.43316 samples/s/p 4:50:57 } +2024-07-25 20:18:19,348 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1146/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 2.7507964e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:19,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43961 samples/s/p 4:50:33 
} +2024-07-25 20:18:22,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1148/ 1625], loss: 1.348, per_step_time: 1471ms, lr: 2.7504475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:22,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43516 samples/s/p 4:50:44 } +2024-07-25 20:18:25,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1150/ 1625], loss: 1.358, per_step_time: 1473ms, lr: 2.7500977e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:25,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43029 samples/s/p 4:50:57 } +2024-07-25 20:18:28,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1152/ 1625], loss: 1.253, per_step_time: 1470ms, lr: 2.7497483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:28,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43992 samples/s/p 4:50:23 } +2024-07-25 20:18:31,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1154/ 1625], loss: 1.227, per_step_time: 1470ms, lr: 2.749398e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:31,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.44043 samples/s/p 4:50:19 } +2024-07-25 20:18:34,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1156/ 1625], loss: 1.280, per_step_time: 1470ms, lr: 2.7490478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:34,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43933 samples/s/p 4:50:19 } +2024-07-25 20:18:37,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1158/ 1625], loss: 1.337, per_step_time: 1473ms, lr: 
2.7486976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:37,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43032 samples/s/p 4:50:45 } +2024-07-25 20:18:39,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1160/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 2.7483471e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:40,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.1% |█████████████ | 5.43780 samples/s/p 4:50:18 } +2024-07-25 20:18:42,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1162/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.7479962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:42,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43303 samples/s/p 4:50:31 } +2024-07-25 20:18:45,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1164/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 2.747645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:45,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43006 samples/s/p 4:50:37 } +2024-07-25 20:18:48,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1166/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.7472937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:48,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43590 samples/s/p 4:50:16 } +2024-07-25 20:18:51,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1168/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 2.7469421e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:51,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 
5.42774 samples/s/p 4:50:39 } +2024-07-25 20:18:54,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1170/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 2.7465905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:54,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43554 samples/s/p 4:50:11 } +2024-07-25 20:18:57,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1172/ 1625], loss: 1.286, per_step_time: 1475ms, lr: 2.7462385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:18:57,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.42360 samples/s/p 4:50:46 } +2024-07-25 20:19:00,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1174/ 1625], loss: 1.341, per_step_time: 1473ms, lr: 2.7458864e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:00,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.43008 samples/s/p 4:50:22 } +2024-07-25 20:19:03,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1176/ 1625], loss: 1.062, per_step_time: 1473ms, lr: 2.745534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:03,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.42855 samples/s/p 4:50:24 } +2024-07-25 20:19:06,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1178/ 1625], loss: 1.042, per_step_time: 1473ms, lr: 2.7451813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:06,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.2% |█████████████ | 5.42860 samples/s/p 4:50:21 } +2024-07-25 20:19:09,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1180/ 1625], loss: 
1.292, per_step_time: 1472ms, lr: 2.7448285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:09,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43267 samples/s/p 4:50:05 } +2024-07-25 20:19:12,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1182/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.7444756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:12,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43179 samples/s/p 4:50:05 } +2024-07-25 20:19:15,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1184/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 2.7441221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:15,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43541 samples/s/p 4:49:51 } +2024-07-25 20:19:18,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1186/ 1625], loss: 1.384, per_step_time: 1471ms, lr: 2.7437689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:18,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43626 samples/s/p 4:49:45 } +2024-07-25 20:19:21,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1188/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 2.7434153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:21,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43662 samples/s/p 4:49:41 } +2024-07-25 20:19:24,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1190/ 1625], loss: 1.260, per_step_time: 1470ms, lr: 2.7430611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:24,284 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 27.3% |█████████████ | 5.44036 samples/s/p 4:49:26 } +2024-07-25 20:19:27,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1192/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.742707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:27,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.43168 samples/s/p 4:49:51 } +2024-07-25 20:19:30,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1194/ 1625], loss: 1.374, per_step_time: 1473ms, lr: 2.7423526e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:30,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.3% |█████████████ | 5.42927 samples/s/p 4:49:56 } +2024-07-25 20:19:33,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1196/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.7419981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:33,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43244 samples/s/p 4:49:42 } +2024-07-25 20:19:36,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1198/ 1625], loss: 1.360, per_step_time: 1474ms, lr: 2.7416432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:36,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.42733 samples/s/p 4:49:56 } +2024-07-25 20:19:39,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1200/ 1625], loss: 1.175, per_step_time: 1473ms, lr: 2.7412882e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:39,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43028 samples/s/p 4:49:43 } +2024-07-25 20:19:42,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], 
step:[ 1202/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.740933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:42,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43453 samples/s/p 4:49:27 } +2024-07-25 20:19:44,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1204/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.7405775e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:44,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43638 samples/s/p 4:49:18 } +2024-07-25 20:19:47,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1206/ 1625], loss: 1.005, per_step_time: 1472ms, lr: 2.7402219e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:47,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43233 samples/s/p 4:49:28 } +2024-07-25 20:19:50,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1208/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 2.7398659e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:50,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.43379 samples/s/p 4:49:21 } +2024-07-25 20:19:53,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1210/ 1625], loss: 1.316, per_step_time: 1473ms, lr: 2.7395097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:53,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.4% |█████████████ | 5.42872 samples/s/p 4:49:34 } +2024-07-25 20:19:56,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1212/ 1625], loss: 0.947, per_step_time: 1471ms, lr: 2.7391534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:56,761 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43792 samples/s/p 4:49:01 } +2024-07-25 20:19:59,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1214/ 1625], loss: 1.312, per_step_time: 1473ms, lr: 2.7387967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:19:59,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.42860 samples/s/p 4:49:28 } +2024-07-25 20:20:02,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1216/ 1625], loss: 0.958, per_step_time: 1469ms, lr: 2.73844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:02,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.44478 samples/s/p 4:48:34 } +2024-07-25 20:20:05,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1218/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.7380831e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:05,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43353 samples/s/p 4:49:07 } +2024-07-25 20:20:08,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1220/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.7377257e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:08,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43747 samples/s/p 4:48:51 } +2024-07-25 20:20:11,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1222/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 2.7373682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:11,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43321 samples/s/p 4:49:02 } +2024-07-25 20:20:14,465 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1224/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 2.7370106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:14,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43637 samples/s/p 4:48:49 } +2024-07-25 20:20:17,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1226/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 2.7366526e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:17,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.5% |█████████████ | 5.43205 samples/s/p 4:49:00 } +2024-07-25 20:20:20,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1228/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 2.7362947e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:20,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43557 samples/s/p 4:48:45 } +2024-07-25 20:20:23,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1230/ 1625], loss: 1.338, per_step_time: 1469ms, lr: 2.7359361e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:23,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.44285 samples/s/p 4:48:19 } +2024-07-25 20:20:26,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1232/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 2.7355776e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:26,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43118 samples/s/p 4:48:53 } +2024-07-25 20:20:29,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1234/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 2.735219e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:20:29,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43847 samples/s/p 4:48:27 } +2024-07-25 20:20:32,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1236/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 2.73486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:32,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43544 samples/s/p 4:48:34 } +2024-07-25 20:20:35,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1238/ 1625], loss: 1.128, per_step_time: 1474ms, lr: 2.734501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:35,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.42659 samples/s/p 4:48:59 } +2024-07-25 20:20:38,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1240/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 2.7341417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:38,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43296 samples/s/p 4:48:36 } +2024-07-25 20:20:41,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1242/ 1625], loss: 1.274, per_step_time: 1471ms, lr: 2.733782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:41,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.6% |█████████████ | 5.43694 samples/s/p 4:48:20 } +2024-07-25 20:20:43,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1244/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 2.7334221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:43,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43130 samples/s/p 4:48:35 } 
+2024-07-25 20:20:46,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1246/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.733062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:46,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43621 samples/s/p 4:48:17 } +2024-07-25 20:20:49,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1248/ 1625], loss: 1.307, per_step_time: 1472ms, lr: 2.7327018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:49,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43290 samples/s/p 4:48:24 } +2024-07-25 20:20:52,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1250/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.732341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:52,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43170 samples/s/p 4:48:25 } +2024-07-25 20:20:55,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1252/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.7319802e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:55,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43800 samples/s/p 4:48:02 } +2024-07-25 20:20:58,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1254/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 2.7316195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:20:58,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43364 samples/s/p 4:48:13 } +2024-07-25 20:21:01,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1256/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 
2.7312582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:01,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43648 samples/s/p 4:48:01 } +2024-07-25 20:21:04,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1258/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 2.7308968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:04,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.7% |█████████████ | 5.43856 samples/s/p 4:47:52 } +2024-07-25 20:21:07,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1260/ 1625], loss: 1.322, per_step_time: 1470ms, lr: 2.7305352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:07,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.44032 samples/s/p 4:47:43 } +2024-07-25 20:21:10,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1262/ 1625], loss: 0.940, per_step_time: 1470ms, lr: 2.7301734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:10,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.43934 samples/s/p 4:47:43 } +2024-07-25 20:21:13,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1264/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 2.7298112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:13,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.43936 samples/s/p 4:47:40 } +2024-07-25 20:21:16,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1266/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.729449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:16,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 
5.43523 samples/s/p 4:47:51 } +2024-07-25 20:21:19,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1268/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 2.729087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:19,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.43793 samples/s/p 4:47:39 } +2024-07-25 20:21:22,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1270/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.728724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:22,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.43310 samples/s/p 4:47:51 } +2024-07-25 20:21:25,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1272/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 2.7283611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:25,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.43617 samples/s/p 4:47:39 } +2024-07-25 20:21:28,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1274/ 1625], loss: 1.105, per_step_time: 1482ms, lr: 2.727998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:28,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.8% |█████████████ | 5.39454 samples/s/p 4:49:49 } +2024-07-25 20:21:31,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1276/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 2.7276346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:31,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43540 samples/s/p 4:47:35 } +2024-07-25 20:21:34,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1278/ 1625], loss: 1.097, 
per_step_time: 1472ms, lr: 2.7272712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:34,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43448 samples/s/p 4:47:35 } +2024-07-25 20:21:37,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1280/ 1625], loss: 1.093, per_step_time: 1472ms, lr: 2.7269074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:37,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43363 samples/s/p 4:47:35 } +2024-07-25 20:21:40,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1282/ 1625], loss: 0.872, per_step_time: 1471ms, lr: 2.7265432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:40,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43726 samples/s/p 4:47:21 } +2024-07-25 20:21:43,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1284/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 2.7261793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:43,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43668 samples/s/p 4:47:19 } +2024-07-25 20:21:45,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1286/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.725815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:45,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.43203 samples/s/p 4:47:31 } +2024-07-25 20:21:48,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1288/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 2.7254502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:48,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
27.9% |█████████████ | 5.42949 samples/s/p 4:47:36 } +2024-07-25 20:21:51,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1290/ 1625], loss: 1.158, per_step_time: 1470ms, lr: 2.7250853e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:51,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 27.9% |█████████████ | 5.44069 samples/s/p 4:46:58 } +2024-07-25 20:21:54,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1292/ 1625], loss: 1.108, per_step_time: 1474ms, lr: 2.72472e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:54,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.42736 samples/s/p 4:47:37 } +2024-07-25 20:21:57,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1294/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 2.7243548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:21:57,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.42984 samples/s/p 4:47:26 } +2024-07-25 20:22:00,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1296/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.7239892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:00,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.43636 samples/s/p 4:47:03 } +2024-07-25 20:22:03,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1298/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 2.7236234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:03,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |█████████████ | 5.43886 samples/s/p 4:46:52 } +2024-07-25 20:22:06,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 
1300/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 2.7232578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:06,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.43430 samples/s/p 4:47:03 } +2024-07-25 20:22:09,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1302/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 2.7228914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:09,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.43773 samples/s/p 4:46:50 } +2024-07-25 20:22:12,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1304/ 1625], loss: 1.342, per_step_time: 1477ms, lr: 2.7225251e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:12,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.41595 samples/s/p 4:47:56 } +2024-07-25 20:22:15,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1306/ 1625], loss: 1.361, per_step_time: 1472ms, lr: 2.7221586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:15,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.43439 samples/s/p 4:46:54 } +2024-07-25 20:22:18,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1308/ 1625], loss: 1.193, per_step_time: 1471ms, lr: 2.7217915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:18,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.0% |██████████████ | 5.43540 samples/s/p 4:46:48 } +2024-07-25 20:22:21,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1310/ 1625], loss: 1.328, per_step_time: 1471ms, lr: 2.7214248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:21,384 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43485 samples/s/p 4:46:47 } +2024-07-25 20:22:24,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1312/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 2.7210575e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:24,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43343 samples/s/p 4:46:49 } +2024-07-25 20:22:27,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1314/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 2.7206897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:27,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43930 samples/s/p 4:46:27 } +2024-07-25 20:22:30,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1316/ 1625], loss: 1.173, per_step_time: 1474ms, lr: 2.7203223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:30,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.42492 samples/s/p 4:47:10 } +2024-07-25 20:22:33,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1318/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 2.7199543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:33,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43730 samples/s/p 4:46:27 } +2024-07-25 20:22:36,140 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1320/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 2.7195862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:36,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43727 samples/s/p 4:46:25 } +2024-07-25 20:22:39,092 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1322/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 2.7192178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:39,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.43268 samples/s/p 4:46:36 } +2024-07-25 20:22:42,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1324/ 1625], loss: 1.350, per_step_time: 1474ms, lr: 2.7188493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:42,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.1% |██████████████ | 5.42728 samples/s/p 4:46:50 } +2024-07-25 20:22:44,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1326/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 2.7184808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:44,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43734 samples/s/p 4:46:16 } +2024-07-25 20:22:47,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1328/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 2.7181119e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:47,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43844 samples/s/p 4:46:09 } +2024-07-25 20:22:50,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1330/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 2.7177426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:50,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43391 samples/s/p 4:46:20 } +2024-07-25 20:22:53,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1332/ 1625], loss: 1.136, per_step_time: 1470ms, lr: 2.7173732e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:53,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.44115 samples/s/p 4:45:55 } +2024-07-25 20:22:56,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1334/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 2.7170036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:56,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43581 samples/s/p 4:46:09 } +2024-07-25 20:22:59,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1336/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 2.7166338e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:22:59,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43564 samples/s/p 4:46:06 } +2024-07-25 20:23:02,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1338/ 1625], loss: 1.249, per_step_time: 1474ms, lr: 2.7162638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:02,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.42702 samples/s/p 4:46:31 } +2024-07-25 20:23:05,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1340/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 2.7158934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:05,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.2% |██████████████ | 5.43731 samples/s/p 4:45:55 } +2024-07-25 20:23:08,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1342/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.7155229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:08,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43591 
samples/s/p 4:45:57 } +2024-07-25 20:23:11,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1344/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 2.7151524e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:11,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43814 samples/s/p 4:45:47 } +2024-07-25 20:23:14,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1346/ 1625], loss: 0.929, per_step_time: 1472ms, lr: 2.7147813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:14,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43478 samples/s/p 4:45:54 } +2024-07-25 20:23:17,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1348/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 2.7144102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:17,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43504 samples/s/p 4:45:50 } +2024-07-25 20:23:20,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1350/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.7140388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:20,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43388 samples/s/p 4:45:51 } +2024-07-25 20:23:23,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1352/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 2.7136673e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:23,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43361 samples/s/p 4:45:49 } +2024-07-25 20:23:26,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1354/ 1625], loss: 1.323, 
per_step_time: 1471ms, lr: 2.7132955e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:26,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43572 samples/s/p 4:45:39 } +2024-07-25 20:23:29,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1356/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 2.7129236e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:29,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.3% |██████████████ | 5.43288 samples/s/p 4:45:45 } +2024-07-25 20:23:32,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1358/ 1625], loss: 1.182, per_step_time: 1470ms, lr: 2.7125512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:32,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.44037 samples/s/p 4:45:19 } +2024-07-25 20:23:35,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1360/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 2.712179e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:35,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.43219 samples/s/p 4:45:42 } +2024-07-25 20:23:38,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1362/ 1625], loss: 1.262, per_step_time: 1473ms, lr: 2.7118065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:38,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.42878 samples/s/p 4:45:50 } +2024-07-25 20:23:41,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1364/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 2.7114334e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:41,070 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 28.4% |██████████████ | 5.43143 samples/s/p 4:45:38 } +2024-07-25 20:23:44,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1366/ 1625], loss: 1.283, per_step_time: 1473ms, lr: 2.7110606e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:44,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.42811 samples/s/p 4:45:46 } +2024-07-25 20:23:46,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1368/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.7106873e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:46,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.43234 samples/s/p 4:45:29 } +2024-07-25 20:23:49,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1370/ 1625], loss: 1.202, per_step_time: 1481ms, lr: 2.7103139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:49,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.40099 samples/s/p 4:47:06 } +2024-07-25 20:23:52,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1372/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 2.70994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:52,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.4% |██████████████ | 5.43650 samples/s/p 4:45:10 } +2024-07-25 20:23:55,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1374/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.709566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:55,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43620 samples/s/p 4:45:09 } +2024-07-25 20:23:58,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 
10], step:[ 1376/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 2.7091919e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:23:58,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.42980 samples/s/p 4:45:26 } +2024-07-25 20:24:01,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1378/ 1625], loss: 1.026, per_step_time: 1472ms, lr: 2.7088177e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:01,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43436 samples/s/p 4:45:08 } +2024-07-25 20:24:04,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1380/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 2.7084432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:04,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.42951 samples/s/p 4:45:21 } +2024-07-25 20:24:07,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1382/ 1625], loss: 1.086, per_step_time: 1483ms, lr: 2.7080683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:07,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.39209 samples/s/p 4:47:17 } +2024-07-25 20:24:10,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1384/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.7076932e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:10,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43503 samples/s/p 4:44:57 } +2024-07-25 20:24:13,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1386/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.7073182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:13,582 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43629 samples/s/p 4:44:51 } +2024-07-25 20:24:16,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1388/ 1625], loss: 1.118, per_step_time: 1473ms, lr: 2.7069427e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:16,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.5% |██████████████ | 5.43039 samples/s/p 4:45:06 } +2024-07-25 20:24:19,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1390/ 1625], loss: 1.202, per_step_time: 1473ms, lr: 2.706567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:19,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43094 samples/s/p 4:45:02 } +2024-07-25 20:24:22,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1392/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 2.7061913e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:22,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.42886 samples/s/p 4:45:05 } +2024-07-25 20:24:25,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1394/ 1625], loss: 1.308, per_step_time: 1474ms, lr: 2.7058151e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:25,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.42544 samples/s/p 4:45:13 } +2024-07-25 20:24:28,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1396/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 2.705439e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:28,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43445 samples/s/p 4:44:42 } +2024-07-25 20:24:31,304 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1398/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 2.7050624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:31,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.42934 samples/s/p 4:44:55 } +2024-07-25 20:24:34,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1400/ 1625], loss: 1.187, per_step_time: 1470ms, lr: 2.7046857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:34,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43927 samples/s/p 4:44:21 } +2024-07-25 20:24:37,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1402/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 2.7043088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:37,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43558 samples/s/p 4:44:29 } +2024-07-25 20:24:40,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1404/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 2.7039318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:40,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.6% |██████████████ | 5.43690 samples/s/p 4:44:22 } +2024-07-25 20:24:43,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1406/ 1625], loss: 1.244, per_step_time: 1473ms, lr: 2.7035543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:43,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.42810 samples/s/p 4:44:47 } +2024-07-25 20:24:46,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1408/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 2.703177e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:24:46,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43204 samples/s/p 4:44:32 } +2024-07-25 20:24:49,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1410/ 1625], loss: 1.049, per_step_time: 1474ms, lr: 2.702799e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:49,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.42625 samples/s/p 4:44:47 } +2024-07-25 20:24:51,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1412/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 2.7024213e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:51,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43386 samples/s/p 4:44:20 } +2024-07-25 20:24:54,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1414/ 1625], loss: 1.319, per_step_time: 1471ms, lr: 2.702043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:54,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43730 samples/s/p 4:44:06 } +2024-07-25 20:24:57,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1416/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 2.7016647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:24:57,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43762 samples/s/p 4:44:02 } +2024-07-25 20:25:00,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1418/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.7012862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:00,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43660 samples/s/p 
4:44:03 } +2024-07-25 20:25:03,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1420/ 1625], loss: 1.196, per_step_time: 1473ms, lr: 2.7009073e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:03,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.7% |██████████████ | 5.43017 samples/s/p 4:44:20 } +2024-07-25 20:25:06,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1422/ 1625], loss: 1.319, per_step_time: 1472ms, lr: 2.7005282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:06,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43368 samples/s/p 4:44:06 } +2024-07-25 20:25:09,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1424/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 2.700149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:09,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43361 samples/s/p 4:44:03 } +2024-07-25 20:25:12,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1426/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.6997694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:12,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43697 samples/s/p 4:43:50 } +2024-07-25 20:25:15,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1428/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 2.6993897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:15,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43214 samples/s/p 4:44:02 } +2024-07-25 20:25:18,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1430/ 1625], loss: 1.155, 
per_step_time: 1471ms, lr: 2.69901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:18,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43527 samples/s/p 4:43:49 } +2024-07-25 20:25:21,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1432/ 1625], loss: 1.159, per_step_time: 1475ms, lr: 2.69863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:21,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.42368 samples/s/p 4:44:22 } +2024-07-25 20:25:24,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1434/ 1625], loss: 1.324, per_step_time: 1472ms, lr: 2.6982496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:24,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.43292 samples/s/p 4:43:50 } +2024-07-25 20:25:27,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1436/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 2.697869e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:27,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.42790 samples/s/p 4:44:03 } +2024-07-25 20:25:30,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1438/ 1625], loss: 1.206, per_step_time: 1470ms, lr: 2.6974883e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:30,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.8% |██████████████ | 5.44038 samples/s/p 4:43:21 } +2024-07-25 20:25:33,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1440/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 2.6971074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:33,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 28.9% |██████████████ | 5.43340 samples/s/p 4:43:40 } +2024-07-25 20:25:36,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1442/ 1625], loss: 1.039, per_step_time: 1471ms, lr: 2.6967262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:36,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43765 samples/s/p 4:43:24 } +2024-07-25 20:25:39,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1444/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 2.6963447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:39,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43201 samples/s/p 4:43:39 } +2024-07-25 20:25:42,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1446/ 1625], loss: 1.299, per_step_time: 1472ms, lr: 2.6959635e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:42,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43287 samples/s/p 4:43:33 } +2024-07-25 20:25:45,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1448/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 2.6955817e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:45,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43410 samples/s/p 4:43:26 } +2024-07-25 20:25:48,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1450/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.6951997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:48,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43727 samples/s/p 4:43:13 } +2024-07-25 20:25:50,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], 
step:[ 1452/ 1625], loss: 1.267, per_step_time: 1470ms, lr: 2.6948175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:50,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.44024 samples/s/p 4:43:01 } +2024-07-25 20:25:53,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1454/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 2.6944352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:53,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 28.9% |██████████████ | 5.43603 samples/s/p 4:43:11 } +2024-07-25 20:25:56,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1456/ 1625], loss: 1.285, per_step_time: 1469ms, lr: 2.6940525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:56,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.44326 samples/s/p 4:42:46 } +2024-07-25 20:25:59,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1458/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 2.6936696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:25:59,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43200 samples/s/p 4:43:18 } +2024-07-25 20:26:02,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1460/ 1625], loss: 1.337, per_step_time: 1471ms, lr: 2.6932865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:02,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43573 samples/s/p 4:43:03 } +2024-07-25 20:26:05,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1462/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 2.6929032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:05,745 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43850 samples/s/p 4:42:52 } +2024-07-25 20:26:08,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1464/ 1625], loss: 1.191, per_step_time: 1474ms, lr: 2.69252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:08,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.42712 samples/s/p 4:43:24 } +2024-07-25 20:26:11,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1466/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 2.6921361e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:11,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.42902 samples/s/p 4:43:16 } +2024-07-25 20:26:14,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1468/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 2.6917522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:14,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43471 samples/s/p 4:42:55 } +2024-07-25 20:26:17,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1470/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 2.691368e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:17,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.0% |██████████████ | 5.43390 samples/s/p 4:42:54 } +2024-07-25 20:26:20,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1472/ 1625], loss: 1.258, per_step_time: 1473ms, lr: 2.6909836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:20,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.42971 samples/s/p 4:43:05 } +2024-07-25 20:26:23,460 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1474/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 2.6905991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:23,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43579 samples/s/p 4:42:43 } +2024-07-25 20:26:26,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1476/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 2.6902144e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:26,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43468 samples/s/p 4:42:43 } +2024-07-25 20:26:29,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1478/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 2.6898295e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:29,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43023 samples/s/p 4:42:54 } +2024-07-25 20:26:32,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1480/ 1625], loss: 1.109, per_step_time: 1469ms, lr: 2.6894442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:32,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.44323 samples/s/p 4:42:11 } +2024-07-25 20:26:35,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1482/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.689059e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:35,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43467 samples/s/p 4:42:34 } +2024-07-25 20:26:38,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1484/ 1625], loss: 1.334, per_step_time: 1472ms, lr: 2.6886732e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:26:38,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43475 samples/s/p 4:42:31 } +2024-07-25 20:26:41,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1486/ 1625], loss: 1.278, per_step_time: 1470ms, lr: 2.6882875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:41,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.1% |██████████████ | 5.43890 samples/s/p 4:42:15 } +2024-07-25 20:26:44,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1488/ 1625], loss: 1.294, per_step_time: 1471ms, lr: 2.6879015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:44,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43521 samples/s/p 4:42:24 } +2024-07-25 20:26:47,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1490/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 2.6875154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:47,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43344 samples/s/p 4:42:26 } +2024-07-25 20:26:50,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1492/ 1625], loss: 1.266, per_step_time: 1473ms, lr: 2.687129e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:50,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.42975 samples/s/p 4:42:35 } +2024-07-25 20:26:52,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1494/ 1625], loss: 1.088, per_step_time: 1471ms, lr: 2.6867421e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:52,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43627 samples/s/p 
4:42:12 } +2024-07-25 20:26:55,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1496/ 1625], loss: 1.056, per_step_time: 1470ms, lr: 2.6863554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:55,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43970 samples/s/p 4:41:58 } +2024-07-25 20:26:58,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1498/ 1625], loss: 1.029, per_step_time: 1472ms, lr: 2.6859683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:26:58,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43358 samples/s/p 4:42:14 } +2024-07-25 20:27:01,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1500/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 2.685581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:01,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43715 samples/s/p 4:42:00 } +2024-07-25 20:27:04,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1502/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 2.6851938e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:04,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.2% |██████████████ | 5.43709 samples/s/p 4:41:57 } +2024-07-25 20:27:07,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1504/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 2.6848062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:07,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43348 samples/s/p 4:42:06 } +2024-07-25 20:27:10,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1506/ 1625], loss: 1.120, 
per_step_time: 1471ms, lr: 2.6844182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:10,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43508 samples/s/p 4:41:58 } +2024-07-25 20:27:13,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1508/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 2.68403e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:13,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43701 samples/s/p 4:41:49 } +2024-07-25 20:27:16,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1510/ 1625], loss: 1.010, per_step_time: 1473ms, lr: 2.6836418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:16,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.42965 samples/s/p 4:42:09 } +2024-07-25 20:27:19,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1512/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 2.6832533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:19,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43031 samples/s/p 4:42:04 } +2024-07-25 20:27:22,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1514/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 2.6828646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:22,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43502 samples/s/p 4:41:46 } +2024-07-25 20:27:25,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1516/ 1625], loss: 1.383, per_step_time: 1469ms, lr: 2.6824755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:25,425 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 29.3% |██████████████ | 5.44286 samples/s/p 4:41:19 } +2024-07-25 20:27:28,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1518/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.6820864e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:28,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.3% |██████████████ | 5.43735 samples/s/p 4:41:33 } +2024-07-25 20:27:31,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1520/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 2.6816972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:31,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.43144 samples/s/p 4:41:48 } +2024-07-25 20:27:34,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1522/ 1625], loss: 1.282, per_step_time: 1474ms, lr: 2.6813075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:34,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.42541 samples/s/p 4:42:04 } +2024-07-25 20:27:37,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1524/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 2.6809177e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:37,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.42800 samples/s/p 4:41:53 } +2024-07-25 20:27:40,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1526/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.6805277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:40,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.43306 samples/s/p 4:41:35 } +2024-07-25 20:27:43,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 
10], step:[ 1528/ 1625], loss: 1.012, per_step_time: 1470ms, lr: 2.6801375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:43,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.43871 samples/s/p 4:41:14 } +2024-07-25 20:27:46,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1530/ 1625], loss: 1.238, per_step_time: 1473ms, lr: 2.679747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:46,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.42847 samples/s/p 4:41:43 } +2024-07-25 20:27:49,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1532/ 1625], loss: 1.245, per_step_time: 1471ms, lr: 2.6793565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:49,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.43492 samples/s/p 4:41:20 } +2024-07-25 20:27:51,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1534/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 2.6789658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:51,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.4% |██████████████ | 5.43436 samples/s/p 4:41:19 } +2024-07-25 20:27:54,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1536/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 2.6785747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:54,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43225 samples/s/p 4:41:22 } +2024-07-25 20:27:57,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1538/ 1625], loss: 1.277, per_step_time: 1474ms, lr: 2.6781836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:27:57,904 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.42478 samples/s/p 4:41:43 } +2024-07-25 20:28:00,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1540/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.6777923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:00,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43710 samples/s/p 4:41:01 } +2024-07-25 20:28:03,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1542/ 1625], loss: 1.245, per_step_time: 1470ms, lr: 2.6774005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:03,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43899 samples/s/p 4:40:53 } +2024-07-25 20:28:06,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1544/ 1625], loss: 1.035, per_step_time: 1471ms, lr: 2.6770087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:06,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43820 samples/s/p 4:40:52 } +2024-07-25 20:28:09,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1546/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 2.6766167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:09,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43302 samples/s/p 4:41:05 } +2024-07-25 20:28:12,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1548/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 2.6762244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:12,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43344 samples/s/p 4:41:01 } +2024-07-25 20:28:15,606 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1550/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 2.675832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:15,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.5% |██████████████ | 5.43243 samples/s/p 4:41:01 } +2024-07-25 20:28:18,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1552/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 2.6754393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:18,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43812 samples/s/p 4:40:41 } +2024-07-25 20:28:21,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1554/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 2.6750464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:21,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.42826 samples/s/p 4:41:08 } +2024-07-25 20:28:24,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1556/ 1625], loss: 1.202, per_step_time: 1470ms, lr: 2.6746531e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:24,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43912 samples/s/p 4:40:32 } +2024-07-25 20:28:27,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1558/ 1625], loss: 1.379, per_step_time: 1471ms, lr: 2.67426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:27,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43518 samples/s/p 4:40:41 } +2024-07-25 20:28:30,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1560/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 2.6738662e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:28:30,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43900 samples/s/p 4:40:26 } +2024-07-25 20:28:33,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1562/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 2.6734724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:33,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43883 samples/s/p 4:40:24 } +2024-07-25 20:28:36,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1564/ 1625], loss: 1.164, per_step_time: 1470ms, lr: 2.6730788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:36,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43955 samples/s/p 4:40:19 } +2024-07-25 20:28:39,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1566/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 2.6726846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:39,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43546 samples/s/p 4:40:28 } +2024-07-25 20:28:42,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1568/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 2.67229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:42,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.6% |██████████████ | 5.43795 samples/s/p 4:40:18 } +2024-07-25 20:28:45,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1570/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 2.6718957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:45,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43392 samples/s/p 
4:40:27 } +2024-07-25 20:28:48,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1572/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.671501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:48,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43184 samples/s/p 4:40:31 } +2024-07-25 20:28:51,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1574/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 2.6711057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:51,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43627 samples/s/p 4:40:14 } +2024-07-25 20:28:53,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1576/ 1625], loss: 1.196, per_step_time: 1474ms, lr: 2.6707106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:53,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.42734 samples/s/p 4:40:39 } +2024-07-25 20:28:56,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1578/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.6703154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:56,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43783 samples/s/p 4:40:03 } +2024-07-25 20:28:59,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1580/ 1625], loss: 1.318, per_step_time: 1471ms, lr: 2.6699196e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:28:59,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.43547 samples/s/p 4:40:08 } +2024-07-25 20:29:02,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1582/ 1625], loss: 1.154, 
per_step_time: 1470ms, lr: 2.6695237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:02,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.44094 samples/s/p 4:39:48 } +2024-07-25 20:29:05,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1584/ 1625], loss: 1.021, per_step_time: 1470ms, lr: 2.669128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:05,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.7% |██████████████ | 5.44025 samples/s/p 4:39:47 } +2024-07-25 20:29:08,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1586/ 1625], loss: 1.047, per_step_time: 1471ms, lr: 2.6687318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:08,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43486 samples/s/p 4:40:01 } +2024-07-25 20:29:11,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1588/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 2.6683352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:11,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43429 samples/s/p 4:39:59 } +2024-07-25 20:29:14,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1590/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.6679389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:14,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43779 samples/s/p 4:39:46 } +2024-07-25 20:29:17,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1592/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.667542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:17,563 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 29.8% |██████████████ | 5.43412 samples/s/p 4:39:54 } +2024-07-25 20:29:20,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1594/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 2.667145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:20,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43143 samples/s/p 4:40:00 } +2024-07-25 20:29:23,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1596/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 2.6667478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:23,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43313 samples/s/p 4:39:51 } +2024-07-25 20:29:26,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1598/ 1625], loss: 1.318, per_step_time: 1472ms, lr: 2.6663502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:26,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43477 samples/s/p 4:39:43 } +2024-07-25 20:29:29,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1600/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 2.6659527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:29,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.8% |██████████████ | 5.43824 samples/s/p 4:39:30 } +2024-07-25 20:29:32,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1602/ 1625], loss: 1.137, per_step_time: 1473ms, lr: 2.6655547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:32,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.42987 samples/s/p 4:39:53 } +2024-07-25 20:29:35,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 
10], step:[ 1604/ 1625], loss: 1.150, per_step_time: 1481ms, lr: 2.6651567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:35,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.39898 samples/s/p 4:41:26 } +2024-07-25 20:29:38,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1606/ 1625], loss: 1.109, per_step_time: 1474ms, lr: 2.6647582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:38,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.42736 samples/s/p 4:39:54 } +2024-07-25 20:29:41,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1608/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.66436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:41,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43325 samples/s/p 4:39:33 } +2024-07-25 20:29:44,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1610/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 2.6639615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:44,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43507 samples/s/p 4:39:25 } +2024-07-25 20:29:47,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1612/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 2.6635624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:47,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43837 samples/s/p 4:39:12 } +2024-07-25 20:29:50,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1614/ 1625], loss: 1.079, per_step_time: 1472ms, lr: 2.6631631e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:50,051 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43164 samples/s/p 4:39:29 } +2024-07-25 20:29:53,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1616/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 2.6627638e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:53,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 29.9% |██████████████ | 5.43272 samples/s/p 4:39:23 } +2024-07-25 20:29:55,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1618/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 2.6623644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:55,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.43815 samples/s/p 4:39:03 } +2024-07-25 20:29:58,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1620/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 2.6619646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:29:58,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.43308 samples/s/p 4:39:16 } +2024-07-25 20:30:01,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1622/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 2.6615648e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:01,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.43353 samples/s/p 4:39:12 } +2024-07-25 20:30:04,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 3/ 10], step:[ 1624/ 1625], loss: 1.268, per_step_time: 1471ms, lr: 2.661165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:04,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |██████████████ | 5.43779 samples/s/p 4:38:56 } +2024-07-25 20:30:07,757 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 2.6607646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:07,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.43424 samples/s/p 4:39:04 } +2024-07-25 20:30:10,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 3/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.660364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:10,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.43745 samples/s/p 4:38:51 } +2024-07-25 20:30:13,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 5/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 2.6599633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:13,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.43699 samples/s/p 4:38:49 } +2024-07-25 20:30:16,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 7/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 2.6595622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:16,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.0% |███████████████ | 5.44031 samples/s/p 4:38:36 } +2024-07-25 20:30:19,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 9/ 1625], loss: 1.033, per_step_time: 1472ms, lr: 2.6591613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:19,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43445 samples/s/p 4:38:51 } +2024-07-25 20:30:22,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 11/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 2.6587599e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 20:30:22,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43969 samples/s/p 4:38:32 } +2024-07-25 20:30:25,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 13/ 1625], loss: 1.118, per_step_time: 1473ms, lr: 2.6583582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:25,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.42838 samples/s/p 4:39:04 } +2024-07-25 20:30:28,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 15/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 2.6579564e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:28,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43810 samples/s/p 4:38:31 } +2024-07-25 20:30:31,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 17/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 2.6575546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:31,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43385 samples/s/p 4:38:41 } +2024-07-25 20:30:34,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 19/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.6571523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:34,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43304 samples/s/p 4:38:41 } +2024-07-25 20:30:37,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 21/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.6567499e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:37,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43801 samples/s/p 4:38:23 } 
+2024-07-25 20:30:40,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 23/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 2.6563475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:40,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.1% |███████████████ | 5.43378 samples/s/p 4:38:33 } +2024-07-25 20:30:43,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 25/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 2.6559446e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:43,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43263 samples/s/p 4:38:33 } +2024-07-25 20:30:46,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 27/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 2.6555417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:46,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43621 samples/s/p 4:38:19 } +2024-07-25 20:30:49,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 29/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 2.6551385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:49,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43539 samples/s/p 4:38:19 } +2024-07-25 20:30:52,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 31/ 1625], loss: 1.000, per_step_time: 1471ms, lr: 2.654735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:52,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43791 samples/s/p 4:38:08 } +2024-07-25 20:30:54,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 33/ 1625], loss: 0.991, per_step_time: 1471ms, lr: 
2.6543314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:54,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43678 samples/s/p 4:38:09 } +2024-07-25 20:30:57,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 35/ 1625], loss: 1.309, per_step_time: 1471ms, lr: 2.6539275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:30:57,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43497 samples/s/p 4:38:11 } +2024-07-25 20:31:00,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 37/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.6535236e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:00,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43424 samples/s/p 4:38:11 } +2024-07-25 20:31:03,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 39/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 2.6531194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:03,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.2% |███████████████ | 5.43504 samples/s/p 4:38:05 } +2024-07-25 20:31:06,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 41/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.652715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:06,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43175 samples/s/p 4:38:12 } +2024-07-25 20:31:09,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 43/ 1625], loss: 1.054, per_step_time: 1473ms, lr: 2.6523103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:09,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 
5.43007 samples/s/p 4:38:15 } +2024-07-25 20:31:12,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 45/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.6519056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:12,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43533 samples/s/p 4:37:56 } +2024-07-25 20:31:15,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 47/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 2.6515005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:15,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43546 samples/s/p 4:37:52 } +2024-07-25 20:31:18,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 49/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 2.6510952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:18,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43122 samples/s/p 4:38:02 } +2024-07-25 20:31:21,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 51/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 2.6506901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:21,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43558 samples/s/p 4:37:46 } +2024-07-25 20:31:24,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 53/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 2.6502841e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:24,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43920 samples/s/p 4:37:32 } +2024-07-25 20:31:27,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 55/ 1625], loss: 1.330, 
per_step_time: 1473ms, lr: 2.6498787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:27,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.3% |███████████████ | 5.43105 samples/s/p 4:37:54 } +2024-07-25 20:31:30,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 57/ 1625], loss: 1.054, per_step_time: 1472ms, lr: 2.6494725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:30,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43248 samples/s/p 4:37:47 } +2024-07-25 20:31:33,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 59/ 1625], loss: 1.363, per_step_time: 1472ms, lr: 2.6490663e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:33,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43277 samples/s/p 4:37:43 } +2024-07-25 20:31:36,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 61/ 1625], loss: 1.154, per_step_time: 1470ms, lr: 2.64866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:36,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.44011 samples/s/p 4:37:17 } +2024-07-25 20:31:39,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 63/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.6482532e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:39,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43291 samples/s/p 4:37:37 } +2024-07-25 20:31:42,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 65/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 2.6478463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:42,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
30.4% |███████████████ | 5.43547 samples/s/p 4:37:26 } +2024-07-25 20:31:45,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 67/ 1625], loss: 1.040, per_step_time: 1473ms, lr: 2.6474394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:45,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43109 samples/s/p 4:37:36 } +2024-07-25 20:31:48,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 69/ 1625], loss: 0.995, per_step_time: 1471ms, lr: 2.6470321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:48,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43826 samples/s/p 4:37:11 } +2024-07-25 20:31:51,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 71/ 1625], loss: 1.243, per_step_time: 1469ms, lr: 2.6466245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:51,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.44256 samples/s/p 4:36:55 } +2024-07-25 20:31:53,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 73/ 1625], loss: 0.988, per_step_time: 1470ms, lr: 2.6462169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:53,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.4% |███████████████ | 5.43872 samples/s/p 4:37:04 } +2024-07-25 20:31:56,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 75/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 2.645809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:56,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43844 samples/s/p 4:37:02 } +2024-07-25 20:31:59,880 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 
77/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 2.645401e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:31:59,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43542 samples/s/p 4:37:08 } +2024-07-25 20:32:02,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 79/ 1625], loss: 1.144, per_step_time: 1472ms, lr: 2.6449929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:02,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43329 samples/s/p 4:37:12 } +2024-07-25 20:32:05,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 81/ 1625], loss: 1.022, per_step_time: 1472ms, lr: 2.6445841e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:05,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43174 samples/s/p 4:37:14 } +2024-07-25 20:32:08,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 83/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 2.6441756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:08,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43923 samples/s/p 4:36:48 } +2024-07-25 20:32:11,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 85/ 1625], loss: 0.944, per_step_time: 1472ms, lr: 2.6437665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:11,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43449 samples/s/p 4:36:59 } +2024-07-25 20:32:14,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 87/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 2.6433578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:14,635 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43478 samples/s/p 4:36:55 } +2024-07-25 20:32:17,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 89/ 1625], loss: 0.988, per_step_time: 1472ms, lr: 2.6429483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:17,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.5% |███████████████ | 5.43321 samples/s/p 4:36:57 } +2024-07-25 20:32:20,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 91/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 2.642539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:20,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43665 samples/s/p 4:36:44 } +2024-07-25 20:32:23,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 93/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 2.6421292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:23,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43327 samples/s/p 4:36:51 } +2024-07-25 20:32:26,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 95/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.6417194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:26,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43810 samples/s/p 4:36:34 } +2024-07-25 20:32:29,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 97/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 2.6413092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:29,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43355 samples/s/p 4:36:44 } +2024-07-25 20:32:32,339 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 99/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 2.640899e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:32,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43651 samples/s/p 4:36:33 } +2024-07-25 20:32:35,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 101/ 1625], loss: 1.247, per_step_time: 1470ms, lr: 2.6404885e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:35,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.44023 samples/s/p 4:36:18 } +2024-07-25 20:32:38,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 103/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.640078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:38,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43449 samples/s/p 4:36:33 } +2024-07-25 20:32:41,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 105/ 1625], loss: 1.221, per_step_time: 1473ms, lr: 2.639667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:41,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.6% |███████████████ | 5.43105 samples/s/p 4:36:40 } +2024-07-25 20:32:44,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 107/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 2.639256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:44,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43792 samples/s/p 4:36:16 } +2024-07-25 20:32:47,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 109/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.6388447e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:32:47,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43630 samples/s/p 4:36:18 } +2024-07-25 20:32:50,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 111/ 1625], loss: 1.150, per_step_time: 1469ms, lr: 2.6384332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:50,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.44304 samples/s/p 4:35:55 } +2024-07-25 20:32:52,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 113/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 2.6380214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:52,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43724 samples/s/p 4:36:10 } +2024-07-25 20:32:55,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 115/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.6376096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:55,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43169 samples/s/p 4:36:24 } +2024-07-25 20:32:58,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 117/ 1625], loss: 1.172, per_step_time: 1474ms, lr: 2.6371974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:32:58,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.42526 samples/s/p 4:36:40 } +2024-07-25 20:33:01,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 119/ 1625], loss: 1.298, per_step_time: 1474ms, lr: 2.6367852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:01,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.42580 samples/s/p 
4:36:36 } +2024-07-25 20:33:04,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 121/ 1625], loss: 1.315, per_step_time: 1472ms, lr: 2.6363727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:04,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.7% |███████████████ | 5.43376 samples/s/p 4:36:09 } +2024-07-25 20:33:07,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 123/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 2.63596e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:07,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43791 samples/s/p 4:35:53 } +2024-07-25 20:33:10,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 125/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 2.635547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:10,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43584 samples/s/p 4:35:56 } +2024-07-25 20:33:13,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 127/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 2.635134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:13,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43180 samples/s/p 4:36:06 } +2024-07-25 20:33:16,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 129/ 1625], loss: 1.027, per_step_time: 1470ms, lr: 2.6347207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:16,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43975 samples/s/p 4:35:38 } +2024-07-25 20:33:19,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 131/ 1625], loss: 1.065, per_step_time: 
1471ms, lr: 2.6343072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:19,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43621 samples/s/p 4:35:46 } +2024-07-25 20:33:22,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 133/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.6338936e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:22,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43710 samples/s/p 4:35:41 } +2024-07-25 20:33:25,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 135/ 1625], loss: 1.212, per_step_time: 1473ms, lr: 2.6334796e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:25,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43049 samples/s/p 4:35:58 } +2024-07-25 20:33:28,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 137/ 1625], loss: 1.146, per_step_time: 1470ms, lr: 2.6330656e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:28,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.8% |███████████████ | 5.43860 samples/s/p 4:35:30 } +2024-07-25 20:33:31,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 139/ 1625], loss: 1.209, per_step_time: 1474ms, lr: 2.632651e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:31,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.42518 samples/s/p 4:36:08 } +2024-07-25 20:33:34,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 141/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 2.6322365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:34,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% 
|███████████████ | 5.43760 samples/s/p 4:35:27 } +2024-07-25 20:33:37,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 143/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 2.6318221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:37,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43716 samples/s/p 4:35:26 } +2024-07-25 20:33:40,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 145/ 1625], loss: 1.305, per_step_time: 1473ms, lr: 2.631407e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:40,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43080 samples/s/p 4:35:42 } +2024-07-25 20:33:43,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 147/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 2.6309921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:43,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43342 samples/s/p 4:35:31 } +2024-07-25 20:33:46,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 149/ 1625], loss: 1.344, per_step_time: 1471ms, lr: 2.6305768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:46,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43555 samples/s/p 4:35:22 } +2024-07-25 20:33:49,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 151/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 2.6301614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:49,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.43875 samples/s/p 4:35:09 } +2024-07-25 20:33:52,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 
153/ 1625], loss: 1.080, per_step_time: 1469ms, lr: 2.6297457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:52,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 30.9% |███████████████ | 5.44285 samples/s/p 4:34:54 } +2024-07-25 20:33:54,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 155/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 2.6293299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:54,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.43936 samples/s/p 4:35:01 } +2024-07-25 20:33:57,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 157/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 2.6289135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:33:57,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.43760 samples/s/p 4:35:04 } +2024-07-25 20:34:00,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 159/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.6284974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:00,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.43698 samples/s/p 4:35:03 } +2024-07-25 20:34:03,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 161/ 1625], loss: 1.036, per_step_time: 1472ms, lr: 2.6280808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:03,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.43119 samples/s/p 4:35:17 } +2024-07-25 20:34:06,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 163/ 1625], loss: 1.125, per_step_time: 1474ms, lr: 2.6276643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:06,770 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.42451 samples/s/p 4:35:35 } +2024-07-25 20:34:09,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 165/ 1625], loss: 1.003, per_step_time: 1470ms, lr: 2.6272473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:09,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.44013 samples/s/p 4:34:44 } +2024-07-25 20:34:12,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 167/ 1625], loss: 1.246, per_step_time: 1474ms, lr: 2.6268302e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:12,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.42598 samples/s/p 4:35:24 } +2024-07-25 20:34:15,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 169/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 2.6264128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:15,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.0% |███████████████ | 5.42805 samples/s/p 4:35:15 } +2024-07-25 20:34:18,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 171/ 1625], loss: 1.268, per_step_time: 1471ms, lr: 2.6259953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:18,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43569 samples/s/p 4:34:49 } +2024-07-25 20:34:21,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 173/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.6255777e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:21,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43419 samples/s/p 4:34:51 } +2024-07-25 20:34:24,484 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 175/ 1625], loss: 1.049, per_step_time: 1473ms, lr: 2.6251599e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:24,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43073 samples/s/p 4:34:58 } +2024-07-25 20:34:27,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 177/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 2.624742e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:27,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43599 samples/s/p 4:34:39 } +2024-07-25 20:34:30,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 179/ 1625], loss: 1.231, per_step_time: 1473ms, lr: 2.6243237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:30,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43022 samples/s/p 4:34:54 } +2024-07-25 20:34:33,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 181/ 1625], loss: 1.385, per_step_time: 1471ms, lr: 2.6239051e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:33,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43572 samples/s/p 4:34:34 } +2024-07-25 20:34:36,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 183/ 1625], loss: 1.328, per_step_time: 1471ms, lr: 2.6234866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:36,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43789 samples/s/p 4:34:25 } +2024-07-25 20:34:39,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 185/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 2.6230677e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:34:39,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.1% |███████████████ | 5.43079 samples/s/p 4:34:43 } +2024-07-25 20:34:42,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 187/ 1625], loss: 1.128, per_step_time: 1474ms, lr: 2.6226486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:42,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.42661 samples/s/p 4:34:53 } +2024-07-25 20:34:45,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 189/ 1625], loss: 1.125, per_step_time: 1469ms, lr: 2.6222293e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:45,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.44436 samples/s/p 4:33:56 } +2024-07-25 20:34:48,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 191/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 2.6218097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:48,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.43187 samples/s/p 4:34:31 } +2024-07-25 20:34:51,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 193/ 1625], loss: 1.006, per_step_time: 1472ms, lr: 2.6213902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:51,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.43168 samples/s/p 4:34:29 } +2024-07-25 20:34:54,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 195/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 2.6209704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:54,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.43346 samples/s/p 
4:34:20 } +2024-07-25 20:34:56,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 197/ 1625], loss: 1.094, per_step_time: 1473ms, lr: 2.6205502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:56,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.42826 samples/s/p 4:34:33 } +2024-07-25 20:34:59,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 199/ 1625], loss: 1.157, per_step_time: 1474ms, lr: 2.6201298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:34:59,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.42391 samples/s/p 4:34:44 } +2024-07-25 20:35:02,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 201/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 2.6197094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:02,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.42962 samples/s/p 4:34:23 } +2024-07-25 20:35:05,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 203/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 2.6192887e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:05,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.2% |███████████████ | 5.42817 samples/s/p 4:34:25 } +2024-07-25 20:35:08,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 205/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 2.618868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:08,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43567 samples/s/p 4:33:59 } +2024-07-25 20:35:11,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 207/ 1625], loss: 1.182, per_step_time: 
1471ms, lr: 2.618447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:11,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43589 samples/s/p 4:33:55 } +2024-07-25 20:35:14,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 209/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.6180256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:14,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43727 samples/s/p 4:33:48 } +2024-07-25 20:35:17,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 211/ 1625], loss: 1.353, per_step_time: 1471ms, lr: 2.6176042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:17,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43668 samples/s/p 4:33:47 } +2024-07-25 20:35:20,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 213/ 1625], loss: 1.308, per_step_time: 1470ms, lr: 2.6171825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:20,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43951 samples/s/p 4:33:36 } +2024-07-25 20:35:23,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 215/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 2.6167607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:23,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43542 samples/s/p 4:33:45 } +2024-07-25 20:35:26,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 217/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.6163387e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:26,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% 
|███████████████ | 5.43225 samples/s/p 4:33:52 } +2024-07-25 20:35:29,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 219/ 1625], loss: 1.017, per_step_time: 1471ms, lr: 2.6159165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:29,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.3% |███████████████ | 5.43650 samples/s/p 4:33:36 } +2024-07-25 20:35:32,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 221/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 2.615494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:32,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43679 samples/s/p 4:33:32 } +2024-07-25 20:35:35,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 223/ 1625], loss: 0.978, per_step_time: 1471ms, lr: 2.6150716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:35,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43820 samples/s/p 4:33:25 } +2024-07-25 20:35:38,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 225/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 2.6146485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:38,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.42895 samples/s/p 4:33:50 } +2024-07-25 20:35:41,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 227/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 2.6142256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:41,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43838 samples/s/p 4:33:18 } +2024-07-25 20:35:44,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 
229/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 2.6138026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:44,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43684 samples/s/p 4:33:20 } +2024-07-25 20:35:47,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 231/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.613379e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:47,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43785 samples/s/p 4:33:14 } +2024-07-25 20:35:50,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 233/ 1625], loss: 1.043, per_step_time: 1472ms, lr: 2.6129554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:50,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43206 samples/s/p 4:33:29 } +2024-07-25 20:35:53,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 235/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.6125317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:53,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.4% |███████████████ | 5.43672 samples/s/p 4:33:12 } +2024-07-25 20:35:55,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 237/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 2.6121077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:55,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43585 samples/s/p 4:33:11 } +2024-07-25 20:35:58,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 239/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.6116835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:35:58,928 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43521 samples/s/p 4:33:10 } +2024-07-25 20:36:01,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 241/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.611259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:01,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43530 samples/s/p 4:33:07 } +2024-07-25 20:36:04,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 243/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 2.6108346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:04,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43139 samples/s/p 4:33:16 } +2024-07-25 20:36:07,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 245/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 2.6104097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:07,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43596 samples/s/p 4:32:59 } +2024-07-25 20:36:10,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 247/ 1625], loss: 1.326, per_step_time: 1473ms, lr: 2.6099848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:10,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43069 samples/s/p 4:33:12 } +2024-07-25 20:36:13,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 249/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 2.6095595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:13,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.44011 samples/s/p 4:32:41 } +2024-07-25 20:36:16,633 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 251/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 2.6091344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:16,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.5% |███████████████ | 5.43597 samples/s/p 4:32:50 } +2024-07-25 20:36:19,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 253/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 2.6087086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:19,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43679 samples/s/p 4:32:45 } +2024-07-25 20:36:22,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 255/ 1625], loss: 1.192, per_step_time: 1474ms, lr: 2.608283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:22,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.42391 samples/s/p 4:33:21 } +2024-07-25 20:36:25,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 257/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 2.607857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:25,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43710 samples/s/p 4:32:38 } +2024-07-25 20:36:28,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 259/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 2.6074307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:28,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.44215 samples/s/p 4:32:20 } +2024-07-25 20:36:31,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 261/ 1625], loss: 1.327, per_step_time: 1473ms, lr: 2.6070044e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 20:36:31,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43053 samples/s/p 4:32:52 } +2024-07-25 20:36:34,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 263/ 1625], loss: 1.043, per_step_time: 1473ms, lr: 2.6065778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:34,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.42801 samples/s/p 4:32:57 } +2024-07-25 20:36:37,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 265/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 2.6061514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:37,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43629 samples/s/p 4:32:29 } +2024-07-25 20:36:40,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 267/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 2.6057243e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:40,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.6% |███████████████ | 5.43667 samples/s/p 4:32:25 } +2024-07-25 20:36:43,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 269/ 1625], loss: 1.081, per_step_time: 1470ms, lr: 2.6052974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:43,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.44143 samples/s/p 4:32:08 } +2024-07-25 20:36:46,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 271/ 1625], loss: 1.017, per_step_time: 1472ms, lr: 2.6048701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:46,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43141 samples/s/p 
4:32:35 } +2024-07-25 20:36:49,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 273/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.6044425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:49,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43644 samples/s/p 4:32:17 } +2024-07-25 20:36:52,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 275/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 2.6040148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:52,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43668 samples/s/p 4:32:13 } +2024-07-25 20:36:54,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 277/ 1625], loss: 1.050, per_step_time: 1470ms, lr: 2.6035868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:54,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.44161 samples/s/p 4:31:55 } +2024-07-25 20:36:57,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 279/ 1625], loss: 1.148, per_step_time: 1474ms, lr: 2.6031588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:36:57,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.42686 samples/s/p 4:32:37 } +2024-07-25 20:37:00,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 281/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.6027305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:00,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43365 samples/s/p 4:32:13 } +2024-07-25 20:37:03,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 283/ 1625], loss: 1.271, 
per_step_time: 1472ms, lr: 2.6023019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:03,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.7% |███████████████ | 5.43476 samples/s/p 4:32:07 } +2024-07-25 20:37:06,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 285/ 1625], loss: 1.024, per_step_time: 1472ms, lr: 2.6018733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:06,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43292 samples/s/p 4:32:10 } +2024-07-25 20:37:09,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 287/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 2.6014444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:09,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43089 samples/s/p 4:32:13 } +2024-07-25 20:37:12,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 289/ 1625], loss: 1.329, per_step_time: 1470ms, lr: 2.6010153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:12,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43929 samples/s/p 4:31:45 } +2024-07-25 20:37:15,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 291/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 2.600586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:15,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43093 samples/s/p 4:32:07 } +2024-07-25 20:37:18,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 293/ 1625], loss: 1.119, per_step_time: 1473ms, lr: 2.6001566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:18,610 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 31.8% |███████████████ | 5.43074 samples/s/p 4:32:04 } +2024-07-25 20:37:21,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 295/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 2.599727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:21,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43537 samples/s/p 4:31:48 } +2024-07-25 20:37:24,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 297/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 2.5992971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:24,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43498 samples/s/p 4:31:46 } +2024-07-25 20:37:27,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 299/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.5988671e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:27,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.8% |███████████████ | 5.43784 samples/s/p 4:31:34 } +2024-07-25 20:37:30,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 301/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.5984367e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:30,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43415 samples/s/p 4:31:42 } +2024-07-25 20:37:33,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 303/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 2.5980064e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:33,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43260 samples/s/p 4:31:44 } +2024-07-25 20:37:36,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 
10], step:[ 305/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 2.5975756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:36,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43577 samples/s/p 4:31:32 } +2024-07-25 20:37:39,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 307/ 1625], loss: 1.409, per_step_time: 1473ms, lr: 2.5971449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:39,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43005 samples/s/p 4:31:46 } +2024-07-25 20:37:42,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 309/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.596714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:42,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43586 samples/s/p 4:31:25 } +2024-07-25 20:37:45,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 311/ 1625], loss: 1.245, per_step_time: 1470ms, lr: 2.5962827e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:45,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.44032 samples/s/p 4:31:09 } +2024-07-25 20:37:48,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 313/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 2.5958512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:48,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43492 samples/s/p 4:31:22 } +2024-07-25 20:37:51,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 315/ 1625], loss: 1.389, per_step_time: 1472ms, lr: 2.5954198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:51,068 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 31.9% |███████████████ | 5.43415 samples/s/p 4:31:22 } +2024-07-25 20:37:54,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 317/ 1625], loss: 0.957, per_step_time: 1471ms, lr: 2.594988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:54,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.43595 samples/s/p 4:31:13 } +2024-07-25 20:37:56,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 319/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 2.594556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:56,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.43708 samples/s/p 4:31:07 } +2024-07-25 20:37:59,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 321/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 2.594124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:37:59,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.42961 samples/s/p 4:31:26 } +2024-07-25 20:38:02,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 323/ 1625], loss: 1.226, per_step_time: 1470ms, lr: 2.5936914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:02,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |███████████████ | 5.44067 samples/s/p 4:30:50 } +2024-07-25 20:38:05,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 325/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 2.5932592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:05,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.43667 samples/s/p 4:30:59 } +2024-07-25 20:38:08,767 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 327/ 1625], loss: 1.130, per_step_time: 1470ms, lr: 2.5928262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:08,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.44166 samples/s/p 4:30:42 } +2024-07-25 20:38:11,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 329/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 2.5923935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:11,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.43402 samples/s/p 4:31:02 } +2024-07-25 20:38:14,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 331/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 2.5919602e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:14,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.43801 samples/s/p 4:30:47 } +2024-07-25 20:38:17,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 333/ 1625], loss: 1.221, per_step_time: 1469ms, lr: 2.591527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:17,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.0% |████████████████ | 5.44452 samples/s/p 4:30:24 } +2024-07-25 20:38:20,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 335/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 2.5910935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:20,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43268 samples/s/p 4:30:57 } +2024-07-25 20:38:23,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 337/ 1625], loss: 1.077, per_step_time: 1471ms, lr: 2.5906598e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:23,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43577 samples/s/p 4:30:44 } +2024-07-25 20:38:26,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 339/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 2.5902258e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:26,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43649 samples/s/p 4:30:39 } +2024-07-25 20:38:29,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 341/ 1625], loss: 1.068, per_step_time: 1473ms, lr: 2.5897916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:29,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43088 samples/s/p 4:30:53 } +2024-07-25 20:38:32,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 343/ 1625], loss: 0.974, per_step_time: 1470ms, lr: 2.5893574e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:32,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.44009 samples/s/p 4:30:23 } +2024-07-25 20:38:35,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 345/ 1625], loss: 1.065, per_step_time: 1472ms, lr: 2.5889229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:35,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.43376 samples/s/p 4:30:39 } +2024-07-25 20:38:38,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 347/ 1625], loss: 1.033, per_step_time: 1472ms, lr: 2.5884883e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:38,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 
5.43288 samples/s/p 4:30:38 } +2024-07-25 20:38:41,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 349/ 1625], loss: 1.139, per_step_time: 1473ms, lr: 2.5880534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:41,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.1% |████████████████ | 5.42973 samples/s/p 4:30:45 } +2024-07-25 20:38:44,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 351/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.5876187e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:44,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43529 samples/s/p 4:30:25 } +2024-07-25 20:38:47,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 353/ 1625], loss: 1.186, per_step_time: 1475ms, lr: 2.5871832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:47,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.42188 samples/s/p 4:31:03 } +2024-07-25 20:38:50,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 355/ 1625], loss: 1.323, per_step_time: 1472ms, lr: 2.5867479e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:50,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43322 samples/s/p 4:30:26 } +2024-07-25 20:38:53,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 357/ 1625], loss: 1.193, per_step_time: 1470ms, lr: 2.5863124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:53,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.44020 samples/s/p 4:30:02 } +2024-07-25 20:38:55,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 359/ 1625], 
loss: 1.200, per_step_time: 1471ms, lr: 2.5858766e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:55,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43591 samples/s/p 4:30:12 } +2024-07-25 20:38:58,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 361/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 2.5854404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:38:58,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43594 samples/s/p 4:30:09 } +2024-07-25 20:39:01,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 363/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.5850044e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:01,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43514 samples/s/p 4:30:08 } +2024-07-25 20:39:04,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 365/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 2.5845678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:04,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.2% |████████████████ | 5.43671 samples/s/p 4:30:00 } +2024-07-25 20:39:07,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 367/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 2.5841315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:07,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43644 samples/s/p 4:29:58 } +2024-07-25 20:39:10,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 369/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 2.5836945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:10,732 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.44209 samples/s/p 4:29:39 } +2024-07-25 20:39:13,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 371/ 1625], loss: 1.035, per_step_time: 1472ms, lr: 2.5832576e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:13,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43229 samples/s/p 4:30:05 } +2024-07-25 20:39:16,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 373/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.5828205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:16,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43340 samples/s/p 4:29:59 } +2024-07-25 20:39:19,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 375/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.5823832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:19,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43304 samples/s/p 4:29:57 } +2024-07-25 20:39:22,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 377/ 1625], loss: 0.949, per_step_time: 1469ms, lr: 2.5819456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:22,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.44558 samples/s/p 4:29:16 } +2024-07-25 20:39:25,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 379/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 2.581508e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:25,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43055 samples/s/p 4:29:58 } +2024-07-25 20:39:28,436 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 381/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 2.58107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:28,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.3% |████████████████ | 5.43496 samples/s/p 4:29:42 } +2024-07-25 20:39:31,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 383/ 1625], loss: 1.367, per_step_time: 1471ms, lr: 2.580632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:31,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43496 samples/s/p 4:29:39 } +2024-07-25 20:39:34,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 385/ 1625], loss: 1.238, per_step_time: 1470ms, lr: 2.5801935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:34,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.44015 samples/s/p 4:29:21 } +2024-07-25 20:39:37,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 387/ 1625], loss: 1.083, per_step_time: 1470ms, lr: 2.5797552e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:37,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.44210 samples/s/p 4:29:12 } +2024-07-25 20:39:40,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 389/ 1625], loss: 1.197, per_step_time: 1475ms, lr: 2.5793164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:40,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.42213 samples/s/p 4:30:09 } +2024-07-25 20:39:43,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 391/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 2.5788773e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:43,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43439 samples/s/p 4:29:29 } +2024-07-25 20:39:46,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 393/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 2.5784384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:46,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43463 samples/s/p 4:29:25 } +2024-07-25 20:39:49,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 395/ 1625], loss: 1.324, per_step_time: 1472ms, lr: 2.5779993e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:49,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43276 samples/s/p 4:29:28 } +2024-07-25 20:39:52,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 397/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 2.5775596e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:52,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.4% |████████████████ | 5.43181 samples/s/p 4:29:28 } +2024-07-25 20:39:55,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 399/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 2.5771202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:55,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43357 samples/s/p 4:29:20 } +2024-07-25 20:39:57,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 401/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.5766803e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:39:57,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 
5.43151 samples/s/p 4:29:23 } +2024-07-25 20:40:00,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 403/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.5762403e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:00,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43307 samples/s/p 4:29:15 } +2024-07-25 20:40:03,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 405/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 2.5758001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:03,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43633 samples/s/p 4:29:03 } +2024-07-25 20:40:06,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 407/ 1625], loss: 1.285, per_step_time: 1473ms, lr: 2.57536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:06,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.42949 samples/s/p 4:29:20 } +2024-07-25 20:40:09,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 409/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 2.5749192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:09,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43643 samples/s/p 4:28:57 } +2024-07-25 20:40:12,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 411/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.5744786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:12,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.43823 samples/s/p 4:28:48 } +2024-07-25 20:40:15,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 413/ 1625], 
loss: 1.131, per_step_time: 1473ms, lr: 2.5740377e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:15,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.5% |████████████████ | 5.42812 samples/s/p 4:29:15 } +2024-07-25 20:40:18,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 415/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 2.5735966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:18,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43833 samples/s/p 4:28:42 } +2024-07-25 20:40:21,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 417/ 1625], loss: 1.315, per_step_time: 1471ms, lr: 2.5731553e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:21,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43648 samples/s/p 4:28:45 } +2024-07-25 20:40:24,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 419/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 2.5727139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:24,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43750 samples/s/p 4:28:39 } +2024-07-25 20:40:27,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 421/ 1625], loss: 1.060, per_step_time: 1472ms, lr: 2.572272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:27,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43278 samples/s/p 4:28:50 } +2024-07-25 20:40:30,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 423/ 1625], loss: 1.060, per_step_time: 1472ms, lr: 2.5718302e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:30,416 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43141 samples/s/p 4:28:51 } +2024-07-25 20:40:33,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 425/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 2.571388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:33,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43437 samples/s/p 4:28:39 } +2024-07-25 20:40:36,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 427/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 2.5709458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:36,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43018 samples/s/p 4:28:49 } +2024-07-25 20:40:39,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 429/ 1625], loss: 1.340, per_step_time: 1471ms, lr: 2.5705032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:39,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.6% |████████████████ | 5.43557 samples/s/p 4:28:30 } +2024-07-25 20:40:42,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 431/ 1625], loss: 1.210, per_step_time: 1474ms, lr: 2.5700607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:42,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.42728 samples/s/p 4:28:51 } +2024-07-25 20:40:45,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 433/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.5696178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:45,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43581 samples/s/p 4:28:23 } +2024-07-25 20:40:48,128 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 435/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.5691748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:48,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43288 samples/s/p 4:28:29 } +2024-07-25 20:40:51,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 437/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 2.5687315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:51,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43208 samples/s/p 4:28:28 } +2024-07-25 20:40:54,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 439/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 2.5682884e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:54,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43521 samples/s/p 4:28:16 } +2024-07-25 20:40:56,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 441/ 1625], loss: 1.161, per_step_time: 1470ms, lr: 2.5678448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:56,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43901 samples/s/p 4:28:02 } +2024-07-25 20:40:59,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 443/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 2.5674008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:40:59,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43856 samples/s/p 4:28:00 } +2024-07-25 20:41:02,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 445/ 1625], loss: 1.059, per_step_time: 1472ms, lr: 2.5669571e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:02,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.7% |████████████████ | 5.43296 samples/s/p 4:28:14 } +2024-07-25 20:41:05,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 447/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 2.5665127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:05,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43616 samples/s/p 4:28:01 } +2024-07-25 20:41:08,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 449/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 2.5660685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:08,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43896 samples/s/p 4:27:50 } +2024-07-25 20:41:11,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 451/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 2.565624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:11,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43338 samples/s/p 4:28:04 } +2024-07-25 20:41:14,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 453/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.5651794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:14,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43732 samples/s/p 4:27:49 } +2024-07-25 20:41:17,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 455/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 2.5647345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:17,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 
5.43577 samples/s/p 4:27:51 } +2024-07-25 20:41:20,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 457/ 1625], loss: 1.050, per_step_time: 1472ms, lr: 2.5642892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:20,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43306 samples/s/p 4:27:56 } +2024-07-25 20:41:23,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 459/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.563844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:23,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43781 samples/s/p 4:27:39 } +2024-07-25 20:41:26,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 461/ 1625], loss: 1.362, per_step_time: 1472ms, lr: 2.5633986e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:26,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43303 samples/s/p 4:27:50 } +2024-07-25 20:41:29,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 463/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 2.562953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:29,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.8% |████████████████ | 5.43686 samples/s/p 4:27:36 } +2024-07-25 20:41:32,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 465/ 1625], loss: 1.100, per_step_time: 1470ms, lr: 2.5625071e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:32,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43930 samples/s/p 4:27:26 } +2024-07-25 20:41:35,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 467/ 1625], 
loss: 1.282, per_step_time: 1469ms, lr: 2.5620611e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:35,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.44343 samples/s/p 4:27:11 } +2024-07-25 20:41:38,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 469/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 2.561615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:38,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43139 samples/s/p 4:27:43 } +2024-07-25 20:41:41,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 471/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 2.5611685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:41,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43544 samples/s/p 4:27:28 } +2024-07-25 20:41:44,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 473/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.5607218e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:44,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43512 samples/s/p 4:27:26 } +2024-07-25 20:41:47,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 475/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 2.560275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:47,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43263 samples/s/p 4:27:31 } +2024-07-25 20:41:50,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 477/ 1625], loss: 0.968, per_step_time: 1471ms, lr: 2.5598283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:50,086 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43762 samples/s/p 4:27:13 } +2024-07-25 20:41:53,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 479/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.559381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:53,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 32.9% |████████████████ | 5.43308 samples/s/p 4:27:23 } +2024-07-25 20:41:55,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 481/ 1625], loss: 1.331, per_step_time: 1472ms, lr: 2.5589337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:55,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43208 samples/s/p 4:27:23 } +2024-07-25 20:41:58,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 483/ 1625], loss: 0.845, per_step_time: 1472ms, lr: 2.5584863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:41:58,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43377 samples/s/p 4:27:16 } +2024-07-25 20:42:01,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 485/ 1625], loss: 1.327, per_step_time: 1472ms, lr: 2.5580384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:01,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43329 samples/s/p 4:27:14 } +2024-07-25 20:42:04,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 487/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.5575904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:04,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43716 samples/s/p 4:27:00 } +2024-07-25 20:42:07,794 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 489/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 2.5571424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:07,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43417 samples/s/p 4:27:05 } +2024-07-25 20:42:10,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 491/ 1625], loss: 0.914, per_step_time: 1471ms, lr: 2.5566942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:10,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43838 samples/s/p 4:26:50 } +2024-07-25 20:42:13,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 493/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 2.5562456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:13,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43558 samples/s/p 4:26:55 } +2024-07-25 20:42:16,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 495/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.5557973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:16,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.0% |████████████████ | 5.43419 samples/s/p 4:26:57 } +2024-07-25 20:42:19,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 497/ 1625], loss: 1.239, per_step_time: 1470ms, lr: 2.5553481e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:19,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.44048 samples/s/p 4:26:35 } +2024-07-25 20:42:22,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 499/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 2.5548994e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:22,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.43813 samples/s/p 4:26:39 } +2024-07-25 20:42:25,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 501/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 2.5544505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:25,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.43486 samples/s/p 4:26:46 } +2024-07-25 20:42:28,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 503/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.554001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:28,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.43950 samples/s/p 4:26:29 } +2024-07-25 20:42:31,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 505/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 2.5535512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:31,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.43209 samples/s/p 4:26:48 } +2024-07-25 20:42:34,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 507/ 1625], loss: 1.000, per_step_time: 1473ms, lr: 2.5531017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:34,347 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.42965 samples/s/p 4:26:52 } +2024-07-25 20:42:37,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 509/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 2.5526517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:37,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 
5.43066 samples/s/p 4:26:46 } +2024-07-25 20:42:40,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 511/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 2.5522017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:40,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.1% |████████████████ | 5.43591 samples/s/p 4:26:28 } +2024-07-25 20:42:43,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 513/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 2.5517515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:43,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43331 samples/s/p 4:26:33 } +2024-07-25 20:42:46,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 515/ 1625], loss: 1.039, per_step_time: 1471ms, lr: 2.5513009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:46,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43840 samples/s/p 4:26:15 } +2024-07-25 20:42:49,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 517/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 2.5508501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:49,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43424 samples/s/p 4:26:24 } +2024-07-25 20:42:52,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 519/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.5503994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:52,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43477 samples/s/p 4:26:20 } +2024-07-25 20:42:55,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 521/ 1625], 
loss: 1.062, per_step_time: 1483ms, lr: 2.5499483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:55,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.39279 samples/s/p 4:28:21 } +2024-07-25 20:42:57,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 523/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.5494972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:42:57,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43404 samples/s/p 4:26:16 } +2024-07-25 20:43:00,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 525/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 2.5490457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:00,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.43217 samples/s/p 4:26:18 } +2024-07-25 20:43:03,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 527/ 1625], loss: 1.051, per_step_time: 1473ms, lr: 2.548594e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:03,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.2% |████████████████ | 5.42987 samples/s/p 4:26:22 } +2024-07-25 20:43:06,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 529/ 1625], loss: 1.331, per_step_time: 1470ms, lr: 2.5481426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:06,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43890 samples/s/p 4:25:53 } +2024-07-25 20:43:09,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 531/ 1625], loss: 1.348, per_step_time: 1471ms, lr: 2.5476902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:09,783 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43818 samples/s/p 4:25:52 } +2024-07-25 20:43:12,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 533/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.5472384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:12,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43647 samples/s/p 4:25:54 } +2024-07-25 20:43:15,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 535/ 1625], loss: 1.051, per_step_time: 1470ms, lr: 2.5467862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:15,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.44092 samples/s/p 4:25:38 } +2024-07-25 20:43:18,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 537/ 1625], loss: 1.013, per_step_time: 1471ms, lr: 2.5463336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:18,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43492 samples/s/p 4:25:53 } +2024-07-25 20:43:21,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 539/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 2.5458809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:21,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43613 samples/s/p 4:25:46 } +2024-07-25 20:43:24,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 541/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.545428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:24,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43251 samples/s/p 4:25:54 } +2024-07-25 20:43:27,482 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 543/ 1625], loss: 1.039, per_step_time: 1470ms, lr: 2.544975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:27,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.3% |████████████████ | 5.43940 samples/s/p 4:25:31 } +2024-07-25 20:43:30,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 545/ 1625], loss: 1.357, per_step_time: 1473ms, lr: 2.5445217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:30,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.42804 samples/s/p 4:26:01 } +2024-07-25 20:43:33,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 547/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 2.5440682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:33,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43251 samples/s/p 4:25:45 } +2024-07-25 20:43:36,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 549/ 1625], loss: 1.143, per_step_time: 1473ms, lr: 2.5436146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:36,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.42988 samples/s/p 4:25:50 } +2024-07-25 20:43:39,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 551/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 2.543161e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:39,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43609 samples/s/p 4:25:29 } +2024-07-25 20:43:42,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 553/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.5427067e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:42,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43100 samples/s/p 4:25:41 } +2024-07-25 20:43:45,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 555/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.5422527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:45,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43824 samples/s/p 4:25:16 } +2024-07-25 20:43:48,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 557/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 2.5417983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:48,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43458 samples/s/p 4:25:24 } +2024-07-25 20:43:51,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 559/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 2.5413437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:51,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.4% |████████████████ | 5.43066 samples/s/p 4:25:33 } +2024-07-25 20:43:54,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 561/ 1625], loss: 1.231, per_step_time: 1469ms, lr: 2.540889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:54,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.44286 samples/s/p 4:24:54 } +2024-07-25 20:43:57,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 563/ 1625], loss: 1.052, per_step_time: 1474ms, lr: 2.540434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:57,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 
5.42715 samples/s/p 4:25:37 } +2024-07-25 20:43:59,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 565/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.5399791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:43:59,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.43261 samples/s/p 4:25:18 } +2024-07-25 20:44:02,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 567/ 1625], loss: 1.009, per_step_time: 1473ms, lr: 2.5395238e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:02,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.42929 samples/s/p 4:25:25 } +2024-07-25 20:44:05,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 569/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.5390684e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:05,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.43367 samples/s/p 4:25:09 } +2024-07-25 20:44:08,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 571/ 1625], loss: 1.050, per_step_time: 1470ms, lr: 2.5386127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:08,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.44066 samples/s/p 4:24:46 } +2024-07-25 20:44:11,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 573/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 2.5381569e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:11,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.43467 samples/s/p 4:25:00 } +2024-07-25 20:44:14,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 575/ 1625], 
loss: 1.235, per_step_time: 1472ms, lr: 2.5377009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:14,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.5% |████████████████ | 5.43398 samples/s/p 4:24:59 } +2024-07-25 20:44:17,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 577/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 2.5372448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:17,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43769 samples/s/p 4:24:46 } +2024-07-25 20:44:20,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 579/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 2.5367885e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:20,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43951 samples/s/p 4:24:37 } +2024-07-25 20:44:23,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 581/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.5363319e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:23,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43609 samples/s/p 4:24:44 } +2024-07-25 20:44:26,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 583/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.5358753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:26,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43433 samples/s/p 4:24:47 } +2024-07-25 20:44:29,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 585/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 2.5354186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:29,459 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43539 samples/s/p 4:24:41 } +2024-07-25 20:44:32,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 587/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 2.5349613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:32,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43318 samples/s/p 4:24:44 } +2024-07-25 20:44:35,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 589/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.5345042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:35,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43157 samples/s/p 4:24:46 } +2024-07-25 20:44:38,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 591/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 2.5340469e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:38,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.43138 samples/s/p 4:24:44 } +2024-07-25 20:44:41,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 593/ 1625], loss: 1.069, per_step_time: 1473ms, lr: 2.533589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:41,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.6% |████████████████ | 5.42983 samples/s/p 4:24:45 } +2024-07-25 20:44:44,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 595/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 2.5331314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:44,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43072 samples/s/p 4:24:40 } +2024-07-25 20:44:47,171 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 597/ 1625], loss: 1.238, per_step_time: 1470ms, lr: 2.5326734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:47,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43942 samples/s/p 4:24:11 } +2024-07-25 20:44:50,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 599/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.5322151e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:50,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43390 samples/s/p 4:24:24 } +2024-07-25 20:44:53,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 601/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 2.5317566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:53,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43949 samples/s/p 4:24:05 } +2024-07-25 20:44:56,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 603/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.531298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:56,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.44033 samples/s/p 4:24:00 } +2024-07-25 20:44:58,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 605/ 1625], loss: 1.079, per_step_time: 1472ms, lr: 2.5308394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:44:58,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43430 samples/s/p 4:24:14 } +2024-07-25 20:45:01,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 607/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.5303805e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:01,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43684 samples/s/p 4:24:04 } +2024-07-25 20:45:04,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 609/ 1625], loss: 1.196, per_step_time: 1470ms, lr: 2.5299214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:04,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.7% |████████████████ | 5.43927 samples/s/p 4:23:54 } +2024-07-25 20:45:07,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 611/ 1625], loss: 1.042, per_step_time: 1471ms, lr: 2.5294623e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:07,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.43682 samples/s/p 4:23:58 } +2024-07-25 20:45:10,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 613/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 2.5290028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:10,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.43293 samples/s/p 4:24:07 } +2024-07-25 20:45:13,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 615/ 1625], loss: 1.175, per_step_time: 1470ms, lr: 2.5285432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:13,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.43882 samples/s/p 4:23:46 } +2024-07-25 20:45:16,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 617/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 2.5280837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:16,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 
5.43974 samples/s/p 4:23:41 } +2024-07-25 20:45:19,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 619/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 2.5276235e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:19,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.43604 samples/s/p 4:23:49 } +2024-07-25 20:45:22,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 621/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 2.527163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:22,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.43887 samples/s/p 4:23:37 } +2024-07-25 20:45:25,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 623/ 1625], loss: 1.220, per_step_time: 1469ms, lr: 2.526703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:25,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.44301 samples/s/p 4:23:23 } +2024-07-25 20:45:28,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 625/ 1625], loss: 1.311, per_step_time: 1469ms, lr: 2.5262425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:28,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.8% |████████████████ | 5.44470 samples/s/p 4:23:15 } +2024-07-25 20:45:31,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 627/ 1625], loss: 1.193, per_step_time: 1471ms, lr: 2.525782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:31,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.43741 samples/s/p 4:23:33 } +2024-07-25 20:45:34,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 629/ 1625], 
loss: 1.081, per_step_time: 1473ms, lr: 2.525321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:34,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.42749 samples/s/p 4:23:59 } +2024-07-25 20:45:37,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 631/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 2.52486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:37,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.43606 samples/s/p 4:23:31 } +2024-07-25 20:45:40,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 633/ 1625], loss: 1.220, per_step_time: 1473ms, lr: 2.5243986e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:40,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.42783 samples/s/p 4:23:52 } +2024-07-25 20:45:43,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 635/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 2.5239373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:43,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.43904 samples/s/p 4:23:16 } +2024-07-25 20:45:46,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 637/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 2.5234756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:46,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.43845 samples/s/p 4:23:15 } +2024-07-25 20:45:49,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 639/ 1625], loss: 1.307, per_step_time: 1470ms, lr: 2.523014e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:49,114 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.44059 samples/s/p 4:23:06 } +2024-07-25 20:45:52,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 641/ 1625], loss: 1.284, per_step_time: 1474ms, lr: 2.522552e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:52,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 33.9% |████████████████ | 5.42640 samples/s/p 4:23:44 } +2024-07-25 20:45:55,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 643/ 1625], loss: 0.997, per_step_time: 1473ms, lr: 2.5220897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:55,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.42933 samples/s/p 4:23:33 } +2024-07-25 20:45:57,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 645/ 1625], loss: 1.323, per_step_time: 1473ms, lr: 2.5216274e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:45:57,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.43025 samples/s/p 4:23:27 } +2024-07-25 20:46:00,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 647/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.521165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:00,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.43376 samples/s/p 4:23:14 } +2024-07-25 20:46:03,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 649/ 1625], loss: 1.322, per_step_time: 1472ms, lr: 2.5207022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:03,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |████████████████ | 5.43153 samples/s/p 4:23:18 } +2024-07-25 20:46:06,829 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 651/ 1625], loss: 1.077, per_step_time: 1470ms, lr: 2.5202393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:06,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.43956 samples/s/p 4:22:51 } +2024-07-25 20:46:09,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 653/ 1625], loss: 1.238, per_step_time: 1473ms, lr: 2.5197764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:09,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.42996 samples/s/p 4:23:16 } +2024-07-25 20:46:12,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 655/ 1625], loss: 1.119, per_step_time: 1470ms, lr: 2.519313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:12,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.44036 samples/s/p 4:22:43 } +2024-07-25 20:46:15,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 657/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 2.5188498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:15,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.0% |█████████████████ | 5.44071 samples/s/p 4:22:39 } +2024-07-25 20:46:18,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 659/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.5183861e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:18,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43619 samples/s/p 4:22:49 } +2024-07-25 20:46:21,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 661/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.5179223e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:21,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43516 samples/s/p 4:22:49 } +2024-07-25 20:46:24,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 663/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 2.5174584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:24,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43859 samples/s/p 4:22:37 } +2024-07-25 20:46:27,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 665/ 1625], loss: 1.260, per_step_time: 1470ms, lr: 2.5169942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:27,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.44080 samples/s/p 4:22:27 } +2024-07-25 20:46:30,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 667/ 1625], loss: 1.393, per_step_time: 1471ms, lr: 2.51653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:30,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43504 samples/s/p 4:22:41 } +2024-07-25 20:46:33,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 669/ 1625], loss: 1.207, per_step_time: 1473ms, lr: 2.5160656e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:33,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43062 samples/s/p 4:22:51 } +2024-07-25 20:46:36,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 671/ 1625], loss: 1.085, per_step_time: 1473ms, lr: 2.5156009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:36,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 
5.42759 samples/s/p 4:22:57 } +2024-07-25 20:46:39,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 673/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.5151363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:39,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.1% |█████████████████ | 5.43433 samples/s/p 4:22:34 } +2024-07-25 20:46:42,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 675/ 1625], loss: 1.232, per_step_time: 1470ms, lr: 2.5146714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:42,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43994 samples/s/p 4:22:15 } +2024-07-25 20:46:45,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 677/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 2.514206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:45,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43700 samples/s/p 4:22:21 } +2024-07-25 20:46:48,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 679/ 1625], loss: 1.325, per_step_time: 1473ms, lr: 2.5137408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:48,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.42913 samples/s/p 4:22:40 } +2024-07-25 20:46:51,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 681/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 2.5132751e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:51,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43826 samples/s/p 4:22:11 } +2024-07-25 20:46:54,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 683/ 
1625], loss: 1.275, per_step_time: 1473ms, lr: 2.5128094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:54,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.42786 samples/s/p 4:22:38 } +2024-07-25 20:46:56,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 685/ 1625], loss: 0.983, per_step_time: 1472ms, lr: 2.5123436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:56,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43162 samples/s/p 4:22:24 } +2024-07-25 20:46:59,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 687/ 1625], loss: 1.293, per_step_time: 1472ms, lr: 2.5118774e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:46:59,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43383 samples/s/p 4:22:15 } +2024-07-25 20:47:02,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 689/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 2.5114114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:02,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.2% |█████████████████ | 5.43875 samples/s/p 4:21:58 } +2024-07-25 20:47:05,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 691/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 2.510945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:05,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43513 samples/s/p 4:22:05 } +2024-07-25 20:47:08,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 693/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 2.5104782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:08,798 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43377 samples/s/p 4:22:06 } +2024-07-25 20:47:11,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 695/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 2.5100115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:11,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43126 samples/s/p 4:22:11 } +2024-07-25 20:47:14,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 697/ 1625], loss: 1.333, per_step_time: 1471ms, lr: 2.5095445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:14,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43620 samples/s/p 4:21:53 } +2024-07-25 20:47:17,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 699/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 2.5090774e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:17,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43670 samples/s/p 4:21:49 } +2024-07-25 20:47:20,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 701/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 2.50861e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:20,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43474 samples/s/p 4:21:52 } +2024-07-25 20:47:23,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 703/ 1625], loss: 1.254, per_step_time: 1470ms, lr: 2.5081426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:23,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43976 samples/s/p 4:21:34 } +2024-07-25 20:47:26,500 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 705/ 1625], loss: 1.310, per_step_time: 1471ms, lr: 2.5076748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:26,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.3% |█████████████████ | 5.43530 samples/s/p 4:21:44 } +2024-07-25 20:47:29,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 707/ 1625], loss: 0.862, per_step_time: 1472ms, lr: 2.5072073e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:29,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43283 samples/s/p 4:21:48 } +2024-07-25 20:47:32,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 709/ 1625], loss: 1.267, per_step_time: 1474ms, lr: 2.5067391e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:32,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.42638 samples/s/p 4:22:04 } +2024-07-25 20:47:35,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 711/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 2.506271e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:35,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43926 samples/s/p 4:21:24 } +2024-07-25 20:47:38,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 713/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.5058027e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:38,310 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.42884 samples/s/p 4:21:51 } +2024-07-25 20:47:41,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 715/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 2.5053341e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:41,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43384 samples/s/p 4:21:34 } +2024-07-25 20:47:44,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 717/ 1625], loss: 1.304, per_step_time: 1471ms, lr: 2.5048654e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:44,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43682 samples/s/p 4:21:22 } +2024-07-25 20:47:47,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 719/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.5043966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:47,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.42962 samples/s/p 4:21:40 } +2024-07-25 20:47:50,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 721/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 2.5039275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:50,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43182 samples/s/p 4:21:31 } +2024-07-25 20:47:53,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 723/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 2.5034584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:53,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.4% |█████████████████ | 5.43234 samples/s/p 4:21:26 } +2024-07-25 20:47:56,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 725/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.5029889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:47:56,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ 
| 5.42976 samples/s/p 4:21:31 } +2024-07-25 20:47:56,025 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-25 20:48:31,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 727/ 1625], loss: 1.002, per_step_time: 1836ms, lr: 2.5025192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:31,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 4.35501 samples/s/p 5:25:59 } +2024-07-25 20:48:34,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 729/ 1625], loss: 0.904, per_step_time: 1472ms, lr: 2.5020494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:34,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43401 samples/s/p 4:21:13 } +2024-07-25 20:48:37,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 731/ 1625], loss: 1.289, per_step_time: 1470ms, lr: 2.5015794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:37,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.44121 samples/s/p 4:20:49 } +2024-07-25 20:48:40,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 733/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 2.5011092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:40,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43478 samples/s/p 4:21:05 } +2024-07-25 20:48:42,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 735/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.5006391e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:42,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43618 samples/s/p 4:20:58 } 
+2024-07-25 20:48:45,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 737/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.5001686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:45,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43455 samples/s/p 4:20:59 } +2024-07-25 20:48:48,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 739/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 2.4996976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:48,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.5% |█████████████████ | 5.43626 samples/s/p 4:20:51 } +2024-07-25 20:48:51,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 741/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 2.499227e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:51,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43251 samples/s/p 4:20:59 } +2024-07-25 20:48:54,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 743/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 2.498756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:54,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43974 samples/s/p 4:20:36 } +2024-07-25 20:48:57,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 745/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 2.4982848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:48:57,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43255 samples/s/p 4:20:53 } +2024-07-25 20:49:00,695 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 747/ 1625], loss: 1.195, per_step_time: 
1470ms, lr: 2.4978135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:00,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43849 samples/s/p 4:20:33 } +2024-07-25 20:49:03,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 749/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 2.4973418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:03,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43658 samples/s/p 4:20:36 } +2024-07-25 20:49:06,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 751/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 2.4968702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:06,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43816 samples/s/p 4:20:28 } +2024-07-25 20:49:09,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 753/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 2.4963983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:09,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43156 samples/s/p 4:20:44 } +2024-07-25 20:49:12,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 755/ 1625], loss: 0.919, per_step_time: 1471ms, lr: 2.4959261e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:12,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.6% |█████████████████ | 5.43641 samples/s/p 4:20:27 } +2024-07-25 20:49:15,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 757/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 2.495454e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:15,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
34.7% |█████████████████ | 5.42789 samples/s/p 4:20:49 } +2024-07-25 20:49:18,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 759/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 2.4949815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:18,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.43763 samples/s/p 4:20:18 } +2024-07-25 20:49:21,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 761/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 2.4945093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:21,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.44002 samples/s/p 4:20:08 } +2024-07-25 20:49:24,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 763/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 2.4940364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:25,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.43751 samples/s/p 4:20:13 } +2024-07-25 20:49:28,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 765/ 1625], loss: 1.161, per_step_time: 1469ms, lr: 2.4935633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:28,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.44580 samples/s/p 4:19:46 } +2024-07-25 20:49:30,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 767/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 2.4930905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:30,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.43633 samples/s/p 4:20:10 } +2024-07-25 20:49:33,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 4/ 10], step:[ 769/ 1625], loss: 1.214, per_step_time: 1470ms, lr: 2.4926172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:33,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.44017 samples/s/p 4:19:56 } +2024-07-25 20:49:36,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 771/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 2.4921437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:36,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.7% |█████████████████ | 5.43487 samples/s/p 4:20:08 } +2024-07-25 20:49:39,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 773/ 1625], loss: 1.381, per_step_time: 1471ms, lr: 2.49167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:39,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43506 samples/s/p 4:20:05 } +2024-07-25 20:49:42,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 775/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.4911962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:42,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43348 samples/s/p 4:20:06 } +2024-07-25 20:49:45,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 777/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.4907225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:45,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43718 samples/s/p 4:19:53 } +2024-07-25 20:49:48,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 779/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 2.4902482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:48,681 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43367 samples/s/p 4:20:00 } +2024-07-25 20:49:51,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 781/ 1625], loss: 1.067, per_step_time: 1471ms, lr: 2.4897738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:51,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43587 samples/s/p 4:19:51 } +2024-07-25 20:49:54,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 783/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 2.4892994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:54,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43668 samples/s/p 4:19:45 } +2024-07-25 20:49:57,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 785/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 2.4888246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:49:57,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43848 samples/s/p 4:19:37 } +2024-07-25 20:50:00,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 787/ 1625], loss: 1.217, per_step_time: 1473ms, lr: 2.4883499e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:00,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.8% |█████████████████ | 5.43056 samples/s/p 4:19:57 } +2024-07-25 20:50:03,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 789/ 1625], loss: 1.126, per_step_time: 1470ms, lr: 2.4878751e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:03,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.44032 samples/s/p 4:19:26 } +2024-07-25 20:50:06,380 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 791/ 1625], loss: 1.425, per_step_time: 1471ms, lr: 2.4873994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:06,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.43764 samples/s/p 4:19:31 } +2024-07-25 20:50:09,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 793/ 1625], loss: 1.053, per_step_time: 1473ms, lr: 2.4869241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:09,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.42799 samples/s/p 4:19:56 } +2024-07-25 20:50:12,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 795/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 2.486449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:12,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.43840 samples/s/p 4:19:23 } +2024-07-25 20:50:16,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 797/ 1625], loss: 1.012, per_step_time: 1470ms, lr: 2.4859732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:16,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.43938 samples/s/p 4:19:17 } +2024-07-25 20:50:18,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 799/ 1625], loss: 1.219, per_step_time: 1469ms, lr: 2.4854971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:18,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.44231 samples/s/p 4:19:06 } +2024-07-25 20:50:21,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 801/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.4850215e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:21,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.43443 samples/s/p 4:19:25 } +2024-07-25 20:50:24,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 803/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.484545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:24,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 34.9% |█████████████████ | 5.43336 samples/s/p 4:19:26 } +2024-07-25 20:50:27,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 805/ 1625], loss: 1.381, per_step_time: 1471ms, lr: 2.4840687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:27,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.43618 samples/s/p 4:19:15 } +2024-07-25 20:50:30,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 807/ 1625], loss: 1.324, per_step_time: 1474ms, lr: 2.4835923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:30,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.42535 samples/s/p 4:19:43 } +2024-07-25 20:50:33,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 809/ 1625], loss: 1.281, per_step_time: 1473ms, lr: 2.4831155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:33,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.43058 samples/s/p 4:19:25 } +2024-07-25 20:50:36,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 811/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.4826384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:36,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 
5.42871 samples/s/p 4:19:27 } +2024-07-25 20:50:39,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 813/ 1625], loss: 1.053, per_step_time: 1474ms, lr: 2.4821613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:39,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.42724 samples/s/p 4:19:28 } +2024-07-25 20:50:42,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 815/ 1625], loss: 1.077, per_step_time: 1471ms, lr: 2.4816842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:42,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.43650 samples/s/p 4:18:59 } +2024-07-25 20:50:45,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 817/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 2.4812067e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:45,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.42909 samples/s/p 4:19:17 } +2024-07-25 20:50:48,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 819/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 2.480729e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:48,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.0% |█████████████████ | 5.43423 samples/s/p 4:19:00 } +2024-07-25 20:50:51,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 821/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 2.4802514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:51,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43491 samples/s/p 4:18:55 } +2024-07-25 20:50:54,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 823/ 
1625], loss: 1.107, per_step_time: 1470ms, lr: 2.4797733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:54,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43870 samples/s/p 4:18:41 } +2024-07-25 20:50:57,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 825/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 2.4792951e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:50:57,347 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43059 samples/s/p 4:19:01 } +2024-07-25 20:51:00,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 827/ 1625], loss: 1.134, per_step_time: 1470ms, lr: 2.478817e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:00,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43946 samples/s/p 4:18:33 } +2024-07-25 20:51:03,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 829/ 1625], loss: 1.320, per_step_time: 1473ms, lr: 2.4783385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:03,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.42858 samples/s/p 4:19:01 } +2024-07-25 20:51:06,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 831/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 2.4778597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:06,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43333 samples/s/p 4:18:44 } +2024-07-25 20:51:09,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 833/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.477381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:09,154 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43143 samples/s/p 4:18:47 } +2024-07-25 20:51:12,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 835/ 1625], loss: 1.034, per_step_time: 1472ms, lr: 2.476902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:12,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.1% |█████████████████ | 5.43156 samples/s/p 4:18:44 } +2024-07-25 20:51:15,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 837/ 1625], loss: 1.244, per_step_time: 1474ms, lr: 2.476423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:15,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.42538 samples/s/p 4:18:58 } +2024-07-25 20:51:18,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 839/ 1625], loss: 1.308, per_step_time: 1471ms, lr: 2.4759434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:18,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.43825 samples/s/p 4:18:19 } +2024-07-25 20:51:20,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 841/ 1625], loss: 1.088, per_step_time: 1471ms, lr: 2.4754641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:20,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.43497 samples/s/p 4:18:25 } +2024-07-25 20:51:23,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 843/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 2.4749845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:23,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.43687 samples/s/p 4:18:17 } +2024-07-25 20:51:26,869 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 845/ 1625], loss: 1.298, per_step_time: 1474ms, lr: 2.474505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:26,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.42574 samples/s/p 4:18:45 } +2024-07-25 20:51:29,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 847/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 2.4740246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:29,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.43603 samples/s/p 4:18:13 } +2024-07-25 20:51:32,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 849/ 1625], loss: 1.202, per_step_time: 1470ms, lr: 2.4735444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:32,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.44032 samples/s/p 4:17:58 } +2024-07-25 20:51:35,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 851/ 1625], loss: 1.151, per_step_time: 1473ms, lr: 2.4730645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:35,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.42803 samples/s/p 4:18:30 } +2024-07-25 20:51:38,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 853/ 1625], loss: 1.191, per_step_time: 1473ms, lr: 2.472584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:38,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.2% |█████████████████ | 5.42927 samples/s/p 4:18:24 } +2024-07-25 20:51:41,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 855/ 1625], loss: 0.942, per_step_time: 1470ms, lr: 2.472103e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:41,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43913 samples/s/p 4:17:53 } +2024-07-25 20:51:44,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 857/ 1625], loss: 1.369, per_step_time: 1470ms, lr: 2.4716222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:44,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43897 samples/s/p 4:17:50 } +2024-07-25 20:51:47,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 859/ 1625], loss: 1.313, per_step_time: 1470ms, lr: 2.4711413e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:47,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43954 samples/s/p 4:17:46 } +2024-07-25 20:51:50,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 861/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 2.47066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:50,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43557 samples/s/p 4:17:54 } +2024-07-25 20:51:53,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 863/ 1625], loss: 1.164, per_step_time: 1472ms, lr: 2.4701789e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:53,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43463 samples/s/p 4:17:54 } +2024-07-25 20:51:56,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 865/ 1625], loss: 1.142, per_step_time: 1477ms, lr: 2.4696972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:56,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 
5.41557 samples/s/p 4:18:45 } +2024-07-25 20:51:59,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 867/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 2.4692155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:51:59,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43717 samples/s/p 4:17:40 } +2024-07-25 20:52:02,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 869/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 2.4687335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:02,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.3% |█████████████████ | 5.43512 samples/s/p 4:17:43 } +2024-07-25 20:52:05,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 871/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 2.4682515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:05,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43198 samples/s/p 4:17:49 } +2024-07-25 20:52:08,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 873/ 1625], loss: 1.160, per_step_time: 1473ms, lr: 2.4677693e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:08,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43016 samples/s/p 4:17:52 } +2024-07-25 20:52:11,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 875/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 2.467287e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:11,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43283 samples/s/p 4:17:41 } +2024-07-25 20:52:14,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 877/ 
1625], loss: 1.386, per_step_time: 1473ms, lr: 2.4668043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:14,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.42984 samples/s/p 4:17:47 } +2024-07-25 20:52:17,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 879/ 1625], loss: 1.280, per_step_time: 1473ms, lr: 2.4663217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:17,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.42952 samples/s/p 4:17:45 } +2024-07-25 20:52:19,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 881/ 1625], loss: 1.165, per_step_time: 1470ms, lr: 2.4658388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:19,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.44147 samples/s/p 4:17:08 } +2024-07-25 20:52:22,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 883/ 1625], loss: 1.088, per_step_time: 1475ms, lr: 2.4653558e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:22,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.42359 samples/s/p 4:17:56 } +2024-07-25 20:52:25,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 885/ 1625], loss: 1.289, per_step_time: 1471ms, lr: 2.4648729e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:25,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.4% |█████████████████ | 5.43609 samples/s/p 4:17:17 } +2024-07-25 20:52:28,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 887/ 1625], loss: 1.284, per_step_time: 1473ms, lr: 2.4643892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:28,860 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43060 samples/s/p 4:17:30 } +2024-07-25 20:52:31,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 889/ 1625], loss: 1.345, per_step_time: 1472ms, lr: 2.463906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:31,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43132 samples/s/p 4:17:25 } +2024-07-25 20:52:34,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 891/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 2.4634222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:34,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43687 samples/s/p 4:17:06 } +2024-07-25 20:52:37,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 893/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.4629384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:37,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43828 samples/s/p 4:16:59 } +2024-07-25 20:52:40,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 895/ 1625], loss: 1.231, per_step_time: 1470ms, lr: 2.4624542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:40,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43899 samples/s/p 4:16:54 } +2024-07-25 20:52:43,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 897/ 1625], loss: 1.246, per_step_time: 1473ms, lr: 2.46197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:43,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.42858 samples/s/p 4:17:21 } +2024-07-25 20:52:46,567 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 899/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 2.4614856e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:46,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43343 samples/s/p 4:17:04 } +2024-07-25 20:52:49,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 901/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 2.461001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:49,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.5% |█████████████████ | 5.43235 samples/s/p 4:17:04 } +2024-07-25 20:52:52,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 903/ 1625], loss: 1.062, per_step_time: 1473ms, lr: 2.4605162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:52,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43060 samples/s/p 4:17:06 } +2024-07-25 20:52:55,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 905/ 1625], loss: 1.334, per_step_time: 1472ms, lr: 2.4600313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:55,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43241 samples/s/p 4:16:58 } +2024-07-25 20:52:58,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 907/ 1625], loss: 1.172, per_step_time: 1483ms, lr: 2.4595463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:52:58,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.39208 samples/s/p 4:18:50 } +2024-07-25 20:53:01,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 909/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.4590609e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:01,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43526 samples/s/p 4:16:44 } +2024-07-25 20:53:04,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 911/ 1625], loss: 1.374, per_step_time: 1473ms, lr: 2.4585755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:04,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43077 samples/s/p 4:16:54 } +2024-07-25 20:53:07,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 913/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 2.45809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:07,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43266 samples/s/p 4:16:46 } +2024-07-25 20:53:10,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 915/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.4576042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:10,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43630 samples/s/p 4:16:32 } +2024-07-25 20:53:13,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 917/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 2.4571184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:13,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.6% |█████████████████ | 5.43191 samples/s/p 4:16:42 } +2024-07-25 20:53:16,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 919/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 2.4566321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:16,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 
5.43066 samples/s/p 4:16:42 } +2024-07-25 20:53:19,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 921/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 2.456146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:19,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43332 samples/s/p 4:16:32 } +2024-07-25 20:53:22,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 923/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 2.4556595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:22,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43545 samples/s/p 4:16:23 } +2024-07-25 20:53:24,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 925/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.4551731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:24,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43562 samples/s/p 4:16:20 } +2024-07-25 20:53:27,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 927/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 2.4546864e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:27,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43781 samples/s/p 4:16:10 } +2024-07-25 20:53:30,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 929/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 2.4541992e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:30,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43988 samples/s/p 4:16:02 } +2024-07-25 20:53:33,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 931/ 
1625], loss: 1.181, per_step_time: 1469ms, lr: 2.4537121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:33,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.44235 samples/s/p 4:15:52 } +2024-07-25 20:53:36,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 933/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 2.453225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:36,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.7% |█████████████████ | 5.43698 samples/s/p 4:16:04 } +2024-07-25 20:53:39,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 935/ 1625], loss: 1.415, per_step_time: 1471ms, lr: 2.4527375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:39,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43705 samples/s/p 4:16:01 } +2024-07-25 20:53:42,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 937/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 2.45225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:42,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43112 samples/s/p 4:16:15 } +2024-07-25 20:53:45,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 939/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.4517623e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:45,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43361 samples/s/p 4:16:05 } +2024-07-25 20:53:48,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 941/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 2.4512745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:48,564 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43610 samples/s/p 4:15:55 } +2024-07-25 20:53:51,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 943/ 1625], loss: 1.144, per_step_time: 1470ms, lr: 2.450786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:51,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.44051 samples/s/p 4:15:39 } +2024-07-25 20:53:54,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 945/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 2.4502982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:54,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43231 samples/s/p 4:15:59 } +2024-07-25 20:53:57,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 947/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 2.4498098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:53:57,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43789 samples/s/p 4:15:41 } +2024-07-25 20:54:00,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 949/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.449321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:00,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.8% |█████████████████ | 5.43290 samples/s/p 4:15:52 } +2024-07-25 20:54:03,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 951/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 2.4488325e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:03,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43141 samples/s/p 4:15:53 } +2024-07-25 20:54:06,269 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 953/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.4483435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:06,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43435 samples/s/p 4:15:42 } +2024-07-25 20:54:09,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 955/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 2.4478544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:09,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43341 samples/s/p 4:15:42 } +2024-07-25 20:54:12,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 957/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.4473653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:12,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43666 samples/s/p 4:15:29 } +2024-07-25 20:54:15,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 959/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 2.4468758e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:15,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43725 samples/s/p 4:15:25 } +2024-07-25 20:54:18,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 961/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.4463863e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:18,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43277 samples/s/p 4:15:35 } +2024-07-25 20:54:21,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 963/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 
2.4458963e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:21,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.43115 samples/s/p 4:15:36 } +2024-07-25 20:54:23,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 965/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 2.4454064e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:23,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 35.9% |█████████████████ | 5.42928 samples/s/p 4:15:39 } +2024-07-25 20:54:26,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 967/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 2.4449166e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:26,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.42850 samples/s/p 4:15:38 } +2024-07-25 20:54:29,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 969/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 2.444426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:29,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.43170 samples/s/p 4:15:26 } +2024-07-25 20:54:32,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 971/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.443936e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:32,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |█████████████████ | 5.43527 samples/s/p 4:15:13 } +2024-07-25 20:54:35,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 973/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 2.4434456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:35,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% 
|█████████████████ | 5.42896 samples/s/p 4:15:28 } +2024-07-25 20:54:38,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 975/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.4429548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:38,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.43748 samples/s/p 4:15:01 } +2024-07-25 20:54:41,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 977/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 2.4424635e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:41,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.44133 samples/s/p 4:14:47 } +2024-07-25 20:54:44,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 979/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 2.4419727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:44,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.43048 samples/s/p 4:15:15 } +2024-07-25 20:54:47,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 981/ 1625], loss: 1.095, per_step_time: 1469ms, lr: 2.4414816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:47,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.44461 samples/s/p 4:14:32 } +2024-07-25 20:54:50,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 983/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 2.4409901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:50,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.0% |██████████████████ | 5.43986 samples/s/p 4:14:42 } +2024-07-25 20:54:53,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 4/ 10], step:[ 985/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 2.4404984e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:53,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43590 samples/s/p 4:14:50 } +2024-07-25 20:54:56,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 987/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 2.440007e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:56,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43414 samples/s/p 4:14:52 } +2024-07-25 20:54:59,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 989/ 1625], loss: 1.269, per_step_time: 1471ms, lr: 2.4395149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:54:59,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43540 samples/s/p 4:14:46 } +2024-07-25 20:55:02,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 991/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.4390229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:02,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43706 samples/s/p 4:14:38 } +2024-07-25 20:55:05,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 993/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.4385306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:05,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43602 samples/s/p 4:14:38 } +2024-07-25 20:55:08,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 995/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 2.4380382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
20:55:08,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43279 samples/s/p 4:14:44 } +2024-07-25 20:55:11,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 997/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 2.4375458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:11,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.43265 samples/s/p 4:14:42 } +2024-07-25 20:55:14,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 999/ 1625], loss: 1.207, per_step_time: 1474ms, lr: 2.437053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:14,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.1% |██████████████████ | 5.42705 samples/s/p 4:14:55 } +2024-07-25 20:55:17,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1001/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 2.4365601e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:17,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43267 samples/s/p 4:14:36 } +2024-07-25 20:55:20,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1003/ 1625], loss: 0.955, per_step_time: 1471ms, lr: 2.4360672e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:20,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43533 samples/s/p 4:14:26 } +2024-07-25 20:55:23,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1005/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.4355739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:23,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43280 samples/s/p 4:14:30 } 
+2024-07-25 20:55:25,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1007/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 2.4350806e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:25,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43495 samples/s/p 4:14:21 } +2024-07-25 20:55:28,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1009/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 2.434587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:28,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43069 samples/s/p 4:14:30 } +2024-07-25 20:55:31,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1011/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.4340932e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:31,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43802 samples/s/p 4:14:06 } +2024-07-25 20:55:34,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1013/ 1625], loss: 1.297, per_step_time: 1474ms, lr: 2.4335995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:34,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.42597 samples/s/p 4:14:37 } +2024-07-25 20:55:37,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1015/ 1625], loss: 1.066, per_step_time: 1472ms, lr: 2.4331055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:37,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.2% |██████████████████ | 5.43478 samples/s/p 4:14:09 } +2024-07-25 20:55:40,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1017/ 1625], loss: 1.134, 
per_step_time: 1471ms, lr: 2.4326111e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:40,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43534 samples/s/p 4:14:05 } +2024-07-25 20:55:43,666 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1019/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 2.432117e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:43,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43208 samples/s/p 4:14:11 } +2024-07-25 20:55:46,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1021/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 2.4316225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:46,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43136 samples/s/p 4:14:10 } +2024-07-25 20:55:49,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1023/ 1625], loss: 1.379, per_step_time: 1470ms, lr: 2.431128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:49,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43911 samples/s/p 4:13:46 } +2024-07-25 20:55:52,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1025/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 2.4306331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:52,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43507 samples/s/p 4:13:54 } +2024-07-25 20:55:55,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1027/ 1625], loss: 1.276, per_step_time: 1472ms, lr: 2.430138e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:55,471 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43161 samples/s/p 4:14:01 } +2024-07-25 20:55:58,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1029/ 1625], loss: 1.533, per_step_time: 1472ms, lr: 2.4296429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:55:58,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43444 samples/s/p 4:13:50 } +2024-07-25 20:56:01,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1031/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 2.4291478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:01,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.3% |██████████████████ | 5.43637 samples/s/p 4:13:41 } +2024-07-25 20:56:04,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1033/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 2.428652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:04,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.43469 samples/s/p 4:13:43 } +2024-07-25 20:56:07,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1035/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 2.4281568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:07,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.44100 samples/s/p 4:13:23 } +2024-07-25 20:56:10,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1037/ 1625], loss: 1.027, per_step_time: 1471ms, lr: 2.427661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:10,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.43572 samples/s/p 4:13:34 } +2024-07-25 20:56:13,177 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1039/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 2.4271649e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:13,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.42835 samples/s/p 4:13:52 } +2024-07-25 20:56:16,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1041/ 1625], loss: 1.168, per_step_time: 1473ms, lr: 2.4266688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:16,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.42821 samples/s/p 4:13:50 } +2024-07-25 20:56:19,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1043/ 1625], loss: 1.024, per_step_time: 1471ms, lr: 2.4261724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:19,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.43601 samples/s/p 4:13:25 } +2024-07-25 20:56:22,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1045/ 1625], loss: 1.225, per_step_time: 1470ms, lr: 2.425676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:22,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.43966 samples/s/p 4:13:12 } +2024-07-25 20:56:24,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1047/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 2.4251794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:24,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.4% |██████████████████ | 5.42847 samples/s/p 4:13:40 } +2024-07-25 20:56:27,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1049/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 
2.4246825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:27,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43831 samples/s/p 4:13:10 } +2024-07-25 20:56:30,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1051/ 1625], loss: 0.981, per_step_time: 1472ms, lr: 2.4241855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:30,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43352 samples/s/p 4:13:20 } +2024-07-25 20:56:33,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1053/ 1625], loss: 1.028, per_step_time: 1471ms, lr: 2.4236884e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:33,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43508 samples/s/p 4:13:13 } +2024-07-25 20:56:36,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1055/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 2.4231913e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:36,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43609 samples/s/p 4:13:07 } +2024-07-25 20:56:39,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1057/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 2.422694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:39,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43660 samples/s/p 4:13:03 } +2024-07-25 20:56:42,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1059/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.4221965e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:42,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
36.5% |██████████████████ | 5.43484 samples/s/p 4:13:05 } +2024-07-25 20:56:45,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1061/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 2.421699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:45,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43588 samples/s/p 4:12:59 } +2024-07-25 20:56:48,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1063/ 1625], loss: 1.396, per_step_time: 1471ms, lr: 2.421201e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:48,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.5% |██████████████████ | 5.43786 samples/s/p 4:12:50 } +2024-07-25 20:56:51,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1065/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 2.4207025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:51,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43174 samples/s/p 4:13:04 } +2024-07-25 20:56:54,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1067/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 2.4202047e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:54,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43279 samples/s/p 4:12:58 } +2024-07-25 20:56:57,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1069/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 2.4197063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:56:57,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43825 samples/s/p 4:12:40 } +2024-07-25 20:57:00,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 4/ 10], step:[ 1071/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 2.4192077e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:00,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43702 samples/s/p 4:12:41 } +2024-07-25 20:57:03,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1073/ 1625], loss: 1.272, per_step_time: 1470ms, lr: 2.418709e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:03,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43916 samples/s/p 4:12:32 } +2024-07-25 20:57:06,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1075/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.4182102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:06,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43211 samples/s/p 4:12:49 } +2024-07-25 20:57:09,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1077/ 1625], loss: 1.091, per_step_time: 1482ms, lr: 2.4177112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:09,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.39457 samples/s/p 4:14:31 } +2024-07-25 20:57:12,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1079/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 2.417212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:12,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.6% |██████████████████ | 5.43624 samples/s/p 4:12:31 } +2024-07-25 20:57:15,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1081/ 1625], loss: 1.162, per_step_time: 1470ms, lr: 2.4167124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
20:57:15,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.44056 samples/s/p 4:12:16 } +2024-07-25 20:57:18,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1083/ 1625], loss: 1.202, per_step_time: 1470ms, lr: 2.4162131e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:18,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43928 samples/s/p 4:12:17 } +2024-07-25 20:57:21,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1085/ 1625], loss: 1.123, per_step_time: 1470ms, lr: 2.4157134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:21,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.44112 samples/s/p 4:12:09 } +2024-07-25 20:57:24,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1087/ 1625], loss: 1.035, per_step_time: 1471ms, lr: 2.4152136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:24,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43844 samples/s/p 4:12:13 } +2024-07-25 20:57:26,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1089/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 2.4147135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:26,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43172 samples/s/p 4:12:29 } +2024-07-25 20:57:29,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1091/ 1625], loss: 0.914, per_step_time: 1472ms, lr: 2.4142133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:29,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43124 samples/s/p 4:12:27 } 
+2024-07-25 20:57:32,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1093/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 2.413713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:32,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43229 samples/s/p 4:12:22 } +2024-07-25 20:57:35,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1095/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 2.4132125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:35,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.7% |██████████████████ | 5.43768 samples/s/p 4:12:04 } +2024-07-25 20:57:38,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1097/ 1625], loss: 1.011, per_step_time: 1472ms, lr: 2.412712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:38,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43426 samples/s/p 4:12:10 } +2024-07-25 20:57:41,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1099/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.4122113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:41,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43346 samples/s/p 4:12:09 } +2024-07-25 20:57:44,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1101/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 2.4117102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:44,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43950 samples/s/p 4:11:50 } +2024-07-25 20:57:47,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1103/ 1625], loss: 0.950, 
per_step_time: 1471ms, lr: 2.4112092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:47,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43760 samples/s/p 4:11:52 } +2024-07-25 20:57:50,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1105/ 1625], loss: 1.175, per_step_time: 1473ms, lr: 2.410708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:50,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43104 samples/s/p 4:12:07 } +2024-07-25 20:57:53,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1107/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 2.4102066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:53,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.44132 samples/s/p 4:11:36 } +2024-07-25 20:57:56,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1109/ 1625], loss: 1.166, per_step_time: 1475ms, lr: 2.409705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:56,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.42224 samples/s/p 4:12:26 } +2024-07-25 20:57:59,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1111/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.4092036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:57:59,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43343 samples/s/p 4:11:52 } +2024-07-25 20:58:02,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1113/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 2.4087014e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:02,377 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.8% |██████████████████ | 5.43651 samples/s/p 4:11:40 } +2024-07-25 20:58:05,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1115/ 1625], loss: 1.393, per_step_time: 1471ms, lr: 2.4081994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:05,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.43575 samples/s/p 4:11:40 } +2024-07-25 20:58:08,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1117/ 1625], loss: 1.232, per_step_time: 1484ms, lr: 2.4076973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:08,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.39023 samples/s/p 4:13:44 } +2024-07-25 20:58:11,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1119/ 1625], loss: 1.217, per_step_time: 1473ms, lr: 2.407195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:11,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.43043 samples/s/p 4:11:48 } +2024-07-25 20:58:14,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1121/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.4066921e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:14,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.43275 samples/s/p 4:11:39 } +2024-07-25 20:58:17,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1123/ 1625], loss: 1.187, per_step_time: 1473ms, lr: 2.40619e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:17,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.43028 samples/s/p 4:11:43 } +2024-07-25 20:58:20,115 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1125/ 1625], loss: 1.255, per_step_time: 1473ms, lr: 2.4056868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:20,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.42829 samples/s/p 4:11:46 } +2024-07-25 20:58:23,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1127/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 2.4051838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:23,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.43561 samples/s/p 4:11:22 } +2024-07-25 20:58:26,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1129/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 2.4046809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:26,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 36.9% |██████████████████ | 5.44085 samples/s/p 4:11:05 } +2024-07-25 20:58:28,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1131/ 1625], loss: 1.193, per_step_time: 1471ms, lr: 2.4041776e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:28,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43703 samples/s/p 4:11:12 } +2024-07-25 20:58:31,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1133/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 2.4036739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:31,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43519 samples/s/p 4:11:15 } +2024-07-25 20:58:34,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1135/ 1625], loss: 1.205, per_step_time: 1469ms, lr: 
2.4031702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:34,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.44269 samples/s/p 4:10:51 } +2024-07-25 20:58:37,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1137/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 2.4026664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:37,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43879 samples/s/p 4:10:59 } +2024-07-25 20:58:40,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1139/ 1625], loss: 1.038, per_step_time: 1470ms, lr: 2.4021625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:40,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.44001 samples/s/p 4:10:52 } +2024-07-25 20:58:43,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1141/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 2.4016585e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:43,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43715 samples/s/p 4:10:57 } +2024-07-25 20:58:46,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1143/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.4011542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:46,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.0% |██████████████████ | 5.43327 samples/s/p 4:11:05 } +2024-07-25 20:58:49,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1145/ 1625], loss: 1.056, per_step_time: 1471ms, lr: 2.40065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:49,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
37.0% |██████████████████ | 5.43758 samples/s/p 4:10:50 } +2024-07-25 20:58:52,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1147/ 1625], loss: 1.273, per_step_time: 1472ms, lr: 2.4001452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:52,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43250 samples/s/p 4:11:01 } +2024-07-25 20:58:55,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1149/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.3996405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:55,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43609 samples/s/p 4:10:49 } +2024-07-25 20:58:58,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1151/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 2.3991359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:58:58,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43102 samples/s/p 4:11:00 } +2024-07-25 20:59:01,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1153/ 1625], loss: 1.233, per_step_time: 1470ms, lr: 2.3986307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:01,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.44124 samples/s/p 4:10:28 } +2024-07-25 20:59:04,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1155/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.3981253e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:04,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43398 samples/s/p 4:10:46 } +2024-07-25 20:59:07,316 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 4/ 10], step:[ 1157/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 2.3976201e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:07,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43099 samples/s/p 4:10:51 } +2024-07-25 20:59:10,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1159/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 2.3971146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:10,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43896 samples/s/p 4:10:26 } +2024-07-25 20:59:13,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1161/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.3966091e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:13,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.1% |██████████████████ | 5.43228 samples/s/p 4:10:41 } +2024-07-25 20:59:16,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1163/ 1625], loss: 0.920, per_step_time: 1473ms, lr: 2.396103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:16,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.42851 samples/s/p 4:10:49 } +2024-07-25 20:59:19,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1165/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 2.3955972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:19,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43435 samples/s/p 4:10:30 } +2024-07-25 20:59:22,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1167/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 2.3950912e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 20:59:22,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43739 samples/s/p 4:10:18 } +2024-07-25 20:59:25,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1169/ 1625], loss: 0.966, per_step_time: 1470ms, lr: 2.3945848e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:25,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.44026 samples/s/p 4:10:08 } +2024-07-25 20:59:27,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1171/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 2.3940784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:27,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.44215 samples/s/p 4:09:59 } +2024-07-25 20:59:30,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1173/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 2.3935718e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:30,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43730 samples/s/p 4:10:10 } +2024-07-25 20:59:33,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1175/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.393065e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:33,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43342 samples/s/p 4:10:18 } +2024-07-25 20:59:36,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1177/ 1625], loss: 1.247, per_step_time: 1470ms, lr: 2.3925579e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:36,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.2% |██████████████████ | 5.43867 samples/s/p 
4:10:00 } +2024-07-25 20:59:39,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1179/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.392051e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:39,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43293 samples/s/p 4:10:13 } +2024-07-25 20:59:42,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1181/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.3915436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:42,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43472 samples/s/p 4:10:05 } +2024-07-25 20:59:45,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1183/ 1625], loss: 1.230, per_step_time: 1473ms, lr: 2.3910365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:45,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.42959 samples/s/p 4:10:16 } +2024-07-25 20:59:48,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1185/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 2.3905288e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:48,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43748 samples/s/p 4:09:52 } +2024-07-25 20:59:51,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1187/ 1625], loss: 1.158, per_step_time: 1470ms, lr: 2.3900211e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:51,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43901 samples/s/p 4:09:45 } +2024-07-25 20:59:54,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1189/ 1625], loss: 
1.161, per_step_time: 1470ms, lr: 2.3895132e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:54,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43936 samples/s/p 4:09:41 } +2024-07-25 20:59:57,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1191/ 1625], loss: 1.297, per_step_time: 1473ms, lr: 2.3890052e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 20:59:57,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.42819 samples/s/p 4:10:09 } +2024-07-25 21:00:00,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1193/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 2.3884972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:00,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.3% |██████████████████ | 5.43543 samples/s/p 4:09:46 } +2024-07-25 21:00:03,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1195/ 1625], loss: 1.229, per_step_time: 1470ms, lr: 2.3879888e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:03,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43859 samples/s/p 4:09:34 } +2024-07-25 21:00:06,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1197/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 2.3874802e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:06,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43863 samples/s/p 4:09:31 } +2024-07-25 21:00:09,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1199/ 1625], loss: 1.037, per_step_time: 1471ms, lr: 2.3869716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:09,278 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43630 samples/s/p 4:09:34 } +2024-07-25 21:00:12,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1201/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 2.3864632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:12,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43128 samples/s/p 4:09:45 } +2024-07-25 21:00:15,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1203/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.3859538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:15,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43665 samples/s/p 4:09:28 } +2024-07-25 21:00:18,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1205/ 1625], loss: 1.304, per_step_time: 1471ms, lr: 2.3854449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:18,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43558 samples/s/p 4:09:28 } +2024-07-25 21:00:21,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1207/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.3849358e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:21,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43349 samples/s/p 4:09:30 } +2024-07-25 21:00:24,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1209/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 2.3844266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:24,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.4% |██████████████████ | 5.43570 samples/s/p 4:09:21 } +2024-07-25 
21:00:26,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1211/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 2.3839166e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:26,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43764 samples/s/p 4:09:13 } +2024-07-25 21:00:29,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1213/ 1625], loss: 1.367, per_step_time: 1473ms, lr: 2.3834073e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:29,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43106 samples/s/p 4:09:28 } +2024-07-25 21:00:32,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1215/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.3828976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:32,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43662 samples/s/p 4:09:10 } +2024-07-25 21:00:35,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1217/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 2.3823872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:35,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43343 samples/s/p 4:09:16 } +2024-07-25 21:00:38,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1219/ 1625], loss: 1.324, per_step_time: 1470ms, lr: 2.3818773e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:38,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.44121 samples/s/p 4:08:51 } +2024-07-25 21:00:41,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1221/ 1625], loss: 1.435, per_step_time: 
1473ms, lr: 2.3813669e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:41,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43020 samples/s/p 4:09:19 } +2024-07-25 21:00:44,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1223/ 1625], loss: 1.302, per_step_time: 1470ms, lr: 2.3808565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:44,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43977 samples/s/p 4:08:50 } +2024-07-25 21:00:47,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1225/ 1625], loss: 1.394, per_step_time: 1472ms, lr: 2.3803459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:47,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.5% |██████████████████ | 5.43221 samples/s/p 4:09:07 } +2024-07-25 21:00:50,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1227/ 1625], loss: 1.141, per_step_time: 1469ms, lr: 2.3798351e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:50,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.44329 samples/s/p 4:08:34 } +2024-07-25 21:00:53,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1229/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 2.379324e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:53,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43230 samples/s/p 4:09:01 } +2024-07-25 21:00:56,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1231/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.378813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:56,489 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 37.6% |██████████████████ | 5.43515 samples/s/p 4:08:50 } +2024-07-25 21:00:59,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1233/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 2.3783017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:00:59,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43891 samples/s/p 4:08:37 } +2024-07-25 21:01:02,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1235/ 1625], loss: 1.003, per_step_time: 1470ms, lr: 2.3777904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:02,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43968 samples/s/p 4:08:32 } +2024-07-25 21:01:05,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1237/ 1625], loss: 1.076, per_step_time: 1470ms, lr: 2.3772787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:05,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43977 samples/s/p 4:08:29 } +2024-07-25 21:01:08,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1239/ 1625], loss: 1.181, per_step_time: 1469ms, lr: 2.3767674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:08,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.44271 samples/s/p 4:08:18 } +2024-07-25 21:01:11,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1241/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.3762554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:11,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43647 samples/s/p 4:08:32 } +2024-07-25 21:01:14,182 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1243/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.3757435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:14,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.6% |██████████████████ | 5.43527 samples/s/p 4:08:32 } +2024-07-25 21:01:17,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1245/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.3752315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:17,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.42940 samples/s/p 4:08:46 } +2024-07-25 21:01:20,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1247/ 1625], loss: 1.100, per_step_time: 1473ms, lr: 2.374719e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:20,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.42804 samples/s/p 4:08:46 } +2024-07-25 21:01:23,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1249/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.3742066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:23,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.43197 samples/s/p 4:08:33 } +2024-07-25 21:01:25,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1251/ 1625], loss: 1.154, per_step_time: 1470ms, lr: 2.373694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:25,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.44137 samples/s/p 4:08:04 } +2024-07-25 21:01:28,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1253/ 1625], loss: 1.289, per_step_time: 1472ms, lr: 
2.3731813e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:28,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.43382 samples/s/p 4:08:22 } +2024-07-25 21:01:31,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1255/ 1625], loss: 1.197, per_step_time: 1469ms, lr: 2.3726683e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:31,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.44408 samples/s/p 4:07:51 } +2024-07-25 21:01:34,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1257/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 2.3721554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:34,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.43660 samples/s/p 4:08:08 } +2024-07-25 21:01:37,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1259/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 2.371642e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:37,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.7% |██████████████████ | 5.43538 samples/s/p 4:08:09 } +2024-07-25 21:01:40,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1261/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 2.3711285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:40,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.43869 samples/s/p 4:07:57 } +2024-07-25 21:01:43,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1263/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 2.3706152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:43,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
37.8% |██████████████████ | 5.43214 samples/s/p 4:08:12 } +2024-07-25 21:01:46,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1265/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 2.3701015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:46,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.43318 samples/s/p 4:08:06 } +2024-07-25 21:01:49,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1267/ 1625], loss: 1.050, per_step_time: 1474ms, lr: 2.3695877e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:49,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.42512 samples/s/p 4:08:25 } +2024-07-25 21:01:52,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1269/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.3690738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:52,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.43186 samples/s/p 4:08:04 } +2024-07-25 21:01:55,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1271/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 2.3685594e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:55,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.43525 samples/s/p 4:07:51 } +2024-07-25 21:01:58,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1273/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 2.3680452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:01:58,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.43119 samples/s/p 4:07:59 } +2024-07-25 21:02:01,402 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 4/ 10], step:[ 1275/ 1625], loss: 0.887, per_step_time: 1470ms, lr: 2.3675308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:01,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.8% |██████████████████ | 5.44171 samples/s/p 4:07:28 } +2024-07-25 21:02:04,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1277/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 2.3670162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:04,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.42957 samples/s/p 4:07:58 } +2024-07-25 21:02:07,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1279/ 1625], loss: 1.189, per_step_time: 1470ms, lr: 2.3665016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:07,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43961 samples/s/p 4:07:28 } +2024-07-25 21:02:10,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1281/ 1625], loss: 1.345, per_step_time: 1471ms, lr: 2.3659866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:10,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43642 samples/s/p 4:07:33 } +2024-07-25 21:02:13,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1283/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 2.3654715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:13,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43393 samples/s/p 4:07:37 } +2024-07-25 21:02:16,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1285/ 1625], loss: 1.160, per_step_time: 1470ms, lr: 2.3649563e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:02:16,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43923 samples/s/p 4:07:20 } +2024-07-25 21:02:19,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1287/ 1625], loss: 1.379, per_step_time: 1472ms, lr: 2.364441e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:19,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43333 samples/s/p 4:07:33 } +2024-07-25 21:02:22,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1289/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 2.3639259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:22,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43514 samples/s/p 4:07:25 } +2024-07-25 21:02:25,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1291/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 2.36341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:25,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 37.9% |██████████████████ | 5.43805 samples/s/p 4:07:14 } +2024-07-25 21:02:27,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1293/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 2.3628942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:27,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.43976 samples/s/p 4:07:07 } +2024-07-25 21:02:30,905 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1295/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.3623785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:30,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.43650 samples/s/p 4:07:13 
} +2024-07-25 21:02:33,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1297/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 2.3618622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:33,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.43382 samples/s/p 4:07:17 } +2024-07-25 21:02:36,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1299/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 2.3613458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:36,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |██████████████████ | 5.43433 samples/s/p 4:07:13 } +2024-07-25 21:02:39,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1301/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.3608296e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:39,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.43127 samples/s/p 4:07:18 } +2024-07-25 21:02:42,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1303/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 2.3603132e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:42,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.43325 samples/s/p 4:07:10 } +2024-07-25 21:02:45,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1305/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 2.3597966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:45,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.43243 samples/s/p 4:07:09 } +2024-07-25 21:02:48,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1307/ 1625], loss: 
1.249, per_step_time: 1473ms, lr: 2.3592798e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:48,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.0% |███████████████████ | 5.42837 samples/s/p 4:07:17 } +2024-07-25 21:02:51,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1309/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 2.3587627e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:51,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43246 samples/s/p 4:07:03 } +2024-07-25 21:02:54,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1311/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 2.3582457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:54,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43243 samples/s/p 4:07:00 } +2024-07-25 21:02:57,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1313/ 1625], loss: 1.143, per_step_time: 1473ms, lr: 2.3577282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:02:57,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43002 samples/s/p 4:07:04 } +2024-07-25 21:03:00,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1315/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.3572107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:00,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43699 samples/s/p 4:06:42 } +2024-07-25 21:03:03,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1317/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.3566932e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:03,379 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43349 samples/s/p 4:06:48 } +2024-07-25 21:03:06,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1319/ 1625], loss: 1.265, per_step_time: 1473ms, lr: 2.3561757e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:06,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.42922 samples/s/p 4:06:57 } +2024-07-25 21:03:09,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1321/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 2.3556577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:09,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43693 samples/s/p 4:06:33 } +2024-07-25 21:03:12,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1323/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 2.35514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:12,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.1% |███████████████████ | 5.43442 samples/s/p 4:06:37 } +2024-07-25 21:03:15,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1325/ 1625], loss: 0.985, per_step_time: 1472ms, lr: 2.3546214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:15,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43334 samples/s/p 4:06:37 } +2024-07-25 21:03:18,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1327/ 1625], loss: 1.278, per_step_time: 1474ms, lr: 2.3541032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:18,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.42419 samples/s/p 4:06:59 } +2024-07-25 
21:03:21,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1329/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.353585e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:21,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43276 samples/s/p 4:06:33 } +2024-07-25 21:03:24,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1331/ 1625], loss: 1.386, per_step_time: 1470ms, lr: 2.3530665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:24,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43911 samples/s/p 4:06:12 } +2024-07-25 21:03:26,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1333/ 1625], loss: 1.254, per_step_time: 1470ms, lr: 2.3525474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:26,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43868 samples/s/p 4:06:11 } +2024-07-25 21:03:29,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1335/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.3520286e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:29,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43366 samples/s/p 4:06:21 } +2024-07-25 21:03:32,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1337/ 1625], loss: 1.373, per_step_time: 1471ms, lr: 2.3515096e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:32,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43532 samples/s/p 4:06:14 } +2024-07-25 21:03:35,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1339/ 1625], loss: 1.259, 
per_step_time: 1472ms, lr: 2.3509905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:35,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.2% |███████████████████ | 5.43344 samples/s/p 4:06:16 } +2024-07-25 21:03:38,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1341/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 2.350471e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:38,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43674 samples/s/p 4:06:04 } +2024-07-25 21:03:41,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1343/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 2.3499517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:41,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43482 samples/s/p 4:06:06 } +2024-07-25 21:03:44,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1345/ 1625], loss: 1.059, per_step_time: 1475ms, lr: 2.3494318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:44,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.42341 samples/s/p 4:06:35 } +2024-07-25 21:03:47,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1347/ 1625], loss: 1.173, per_step_time: 1470ms, lr: 2.3489121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:47,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43988 samples/s/p 4:05:47 } +2024-07-25 21:03:50,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1349/ 1625], loss: 0.962, per_step_time: 1472ms, lr: 2.348392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:50,605 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43275 samples/s/p 4:06:03 } +2024-07-25 21:03:53,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1351/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 2.347872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:53,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43382 samples/s/p 4:05:57 } +2024-07-25 21:03:56,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1353/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 2.3473518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:56,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.44004 samples/s/p 4:05:38 } +2024-07-25 21:03:59,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1355/ 1625], loss: 1.011, per_step_time: 1473ms, lr: 2.3468312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:03:59,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.3% |███████████████████ | 5.43081 samples/s/p 4:06:00 } +2024-07-25 21:04:02,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1357/ 1625], loss: 1.483, per_step_time: 1471ms, lr: 2.346311e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:02,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43604 samples/s/p 4:05:43 } +2024-07-25 21:04:05,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1359/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.3457902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:05,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43310 samples/s/p 4:05:48 } +2024-07-25 
21:04:08,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1361/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.3452694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:08,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43735 samples/s/p 4:05:33 } +2024-07-25 21:04:11,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1363/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 2.3447485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:11,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43571 samples/s/p 4:05:35 } +2024-07-25 21:04:14,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1365/ 1625], loss: 1.111, per_step_time: 1471ms, lr: 2.3442273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:14,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43551 samples/s/p 4:05:32 } +2024-07-25 21:04:17,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1367/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 2.343706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:17,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43136 samples/s/p 4:05:41 } +2024-07-25 21:04:20,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1369/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 2.3431845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:20,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.42786 samples/s/p 4:05:47 } +2024-07-25 21:04:23,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1371/ 1625], loss: 1.124, 
per_step_time: 1472ms, lr: 2.342663e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:23,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43304 samples/s/p 4:05:30 } +2024-07-25 21:04:26,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1373/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.3421413e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:26,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.4% |███████████████████ | 5.43155 samples/s/p 4:05:31 } +2024-07-25 21:04:28,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1375/ 1625], loss: 1.104, per_step_time: 1474ms, lr: 2.3416194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:28,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.42683 samples/s/p 4:05:41 } +2024-07-25 21:04:31,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1377/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 2.3410974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:31,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.43963 samples/s/p 4:05:03 } +2024-07-25 21:04:34,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1379/ 1625], loss: 1.295, per_step_time: 1474ms, lr: 2.3405755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:34,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.42669 samples/s/p 4:05:36 } +2024-07-25 21:04:37,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1381/ 1625], loss: 1.205, per_step_time: 1470ms, lr: 2.340053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:37,832 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.43859 samples/s/p 4:05:00 } +2024-07-25 21:04:40,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1383/ 1625], loss: 1.077, per_step_time: 1471ms, lr: 2.3395305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:40,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.43507 samples/s/p 4:05:07 } +2024-07-25 21:04:43,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1385/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.3390083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:43,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.43844 samples/s/p 4:04:55 } +2024-07-25 21:04:46,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1387/ 1625], loss: 1.106, per_step_time: 1470ms, lr: 2.3384853e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:46,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.44029 samples/s/p 4:04:47 } +2024-07-25 21:04:49,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1389/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 2.3379625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:49,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.5% |███████████████████ | 5.42999 samples/s/p 4:05:12 } +2024-07-25 21:04:52,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1391/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 2.3374394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:52,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43655 samples/s/p 4:04:51 } +2024-07-25 
21:04:55,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1393/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.3369164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:55,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43656 samples/s/p 4:04:48 } +2024-07-25 21:04:58,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1395/ 1625], loss: 1.203, per_step_time: 1473ms, lr: 2.336393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:04:58,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.42974 samples/s/p 4:05:04 } +2024-07-25 21:05:01,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1397/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 2.3358696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:01,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43212 samples/s/p 4:04:54 } +2024-07-25 21:05:04,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1399/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 2.3353461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:04,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43596 samples/s/p 4:04:41 } +2024-07-25 21:05:07,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1401/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 2.334822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:07,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43024 samples/s/p 4:04:54 } +2024-07-25 21:05:10,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1403/ 1625], loss: 1.254, 
per_step_time: 1474ms, lr: 2.3342984e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:10,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.42728 samples/s/p 4:04:59 } +2024-07-25 21:05:13,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1405/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 2.3337743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:13,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.6% |███████████████████ | 5.43022 samples/s/p 4:04:48 } +2024-07-25 21:05:16,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1407/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.3332504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:16,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43252 samples/s/p 4:04:39 } +2024-07-25 21:05:19,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1409/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.3327257e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:19,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43232 samples/s/p 4:04:36 } +2024-07-25 21:05:22,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1411/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 2.3322013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:22,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43669 samples/s/p 4:04:21 } +2024-07-25 21:05:25,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1413/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 2.3316768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:25,059 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43182 samples/s/p 4:04:32 } +2024-07-25 21:05:28,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1415/ 1625], loss: 1.025, per_step_time: 1470ms, lr: 2.3311522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:28,007 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.44170 samples/s/p 4:04:02 } +2024-07-25 21:05:30,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1417/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.3306273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:30,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43199 samples/s/p 4:04:25 } +2024-07-25 21:05:33,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1419/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 2.3301021e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:33,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.44002 samples/s/p 4:04:01 } +2024-07-25 21:05:36,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1421/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 2.329577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:36,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.7% |███████████████████ | 5.43104 samples/s/p 4:04:22 } +2024-07-25 21:05:39,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1423/ 1625], loss: 1.090, per_step_time: 1470ms, lr: 2.3290517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:39,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43883 samples/s/p 4:03:58 } +2024-07-25 
21:05:42,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1425/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 2.3285264e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:42,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43761 samples/s/p 4:03:58 } +2024-07-25 21:05:45,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1427/ 1625], loss: 1.306, per_step_time: 1473ms, lr: 2.3280007e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:45,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43098 samples/s/p 4:04:13 } +2024-07-25 21:05:48,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1429/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 2.3274748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:48,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43315 samples/s/p 4:04:04 } +2024-07-25 21:05:51,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1431/ 1625], loss: 1.180, per_step_time: 1474ms, lr: 2.326949e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:51,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.42646 samples/s/p 4:04:20 } +2024-07-25 21:05:54,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1433/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 2.3264229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:54,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43367 samples/s/p 4:03:57 } +2024-07-25 21:05:57,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1435/ 1625], loss: 1.253, 
per_step_time: 1471ms, lr: 2.3258966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:05:57,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43615 samples/s/p 4:03:48 } +2024-07-25 21:06:00,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1437/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.3253704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:00,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.8% |███████████████████ | 5.43140 samples/s/p 4:03:57 } +2024-07-25 21:06:03,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1439/ 1625], loss: 1.168, per_step_time: 1473ms, lr: 2.324844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:03,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43036 samples/s/p 4:03:57 } +2024-07-25 21:06:06,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1441/ 1625], loss: 1.043, per_step_time: 1472ms, lr: 2.324317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:06,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43474 samples/s/p 4:03:42 } +2024-07-25 21:06:09,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1443/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.3237904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:09,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43399 samples/s/p 4:03:42 } +2024-07-25 21:06:12,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1445/ 1625], loss: 1.178, per_step_time: 1474ms, lr: 2.3232637e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:12,286 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.42552 samples/s/p 4:04:01 } +2024-07-25 21:06:15,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1447/ 1625], loss: 1.206, per_step_time: 1472ms, lr: 2.3227365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:15,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43422 samples/s/p 4:03:35 } +2024-07-25 21:06:18,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1449/ 1625], loss: 1.026, per_step_time: 1472ms, lr: 2.3222094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:18,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43117 samples/s/p 4:03:40 } +2024-07-25 21:06:21,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1451/ 1625], loss: 1.352, per_step_time: 1472ms, lr: 2.321682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:21,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43203 samples/s/p 4:03:35 } +2024-07-25 21:06:24,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1453/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 2.3211544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:24,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 38.9% |███████████████████ | 5.43279 samples/s/p 4:03:30 } +2024-07-25 21:06:27,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1455/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.3206267e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:27,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43291 samples/s/p 4:03:27 } +2024-07-25 
21:06:29,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1457/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 2.3200992e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:29,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43428 samples/s/p 4:03:20 } +2024-07-25 21:06:32,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1459/ 1625], loss: 1.048, per_step_time: 1473ms, lr: 2.3195713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:32,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43025 samples/s/p 4:03:28 } +2024-07-25 21:06:35,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1461/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.319043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:35,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43639 samples/s/p 4:03:09 } +2024-07-25 21:06:38,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1463/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 2.3185148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:38,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43718 samples/s/p 4:03:04 } +2024-07-25 21:06:41,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1465/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 2.3179866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:41,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.44188 samples/s/p 4:02:48 } +2024-07-25 21:06:44,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1467/ 1625], loss: 1.149, 
per_step_time: 1472ms, lr: 2.317458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:44,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43397 samples/s/p 4:03:06 } +2024-07-25 21:06:47,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1469/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 2.3169294e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:47,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.0% |███████████████████ | 5.43332 samples/s/p 4:03:05 } +2024-07-25 21:06:50,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1471/ 1625], loss: 1.056, per_step_time: 1471ms, lr: 2.3164008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:50,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43527 samples/s/p 4:02:57 } +2024-07-25 21:06:53,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1473/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.3158722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:53,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43818 samples/s/p 4:02:46 } +2024-07-25 21:06:56,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1475/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.3153427e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:56,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43226 samples/s/p 4:02:59 } +2024-07-25 21:06:59,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1477/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 2.3148137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:06:59,505 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43471 samples/s/p 4:02:50 } +2024-07-25 21:07:02,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1479/ 1625], loss: 1.247, per_step_time: 1473ms, lr: 2.3142846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:02,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.42821 samples/s/p 4:03:04 } +2024-07-25 21:07:05,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1481/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 2.313755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:05,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43507 samples/s/p 4:02:43 } +2024-07-25 21:07:08,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1483/ 1625], loss: 0.946, per_step_time: 1470ms, lr: 2.3132252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:08,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43968 samples/s/p 4:02:27 } +2024-07-25 21:07:11,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1485/ 1625], loss: 1.296, per_step_time: 1471ms, lr: 2.3126957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:11,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.1% |███████████████████ | 5.43817 samples/s/p 4:02:29 } +2024-07-25 21:07:14,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1487/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 2.3121658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:14,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.42932 samples/s/p 4:02:49 } +2024-07-25 
21:07:17,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1489/ 1625], loss: 0.995, per_step_time: 1472ms, lr: 2.3116358e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:17,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43135 samples/s/p 4:02:41 } +2024-07-25 21:07:20,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1491/ 1625], loss: 1.212, per_step_time: 1472ms, lr: 2.3111055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:20,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43317 samples/s/p 4:02:33 } +2024-07-25 21:07:23,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1493/ 1625], loss: 0.977, per_step_time: 1472ms, lr: 2.3105753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:23,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43110 samples/s/p 4:02:36 } +2024-07-25 21:07:26,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1495/ 1625], loss: 1.279, per_step_time: 1471ms, lr: 2.310045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:26,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43809 samples/s/p 4:02:14 } +2024-07-25 21:07:29,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1497/ 1625], loss: 0.863, per_step_time: 1473ms, lr: 2.3095143e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:29,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.42902 samples/s/p 4:02:35 } +2024-07-25 21:07:31,974 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1499/ 1625], loss: 1.197, 
per_step_time: 1471ms, lr: 2.3089835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:31,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43590 samples/s/p 4:02:14 } +2024-07-25 21:07:34,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1501/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 2.3084529e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:34,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43567 samples/s/p 4:02:12 } +2024-07-25 21:07:37,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1503/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.307922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:37,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.2% |███████████████████ | 5.43622 samples/s/p 4:02:07 } +2024-07-25 21:07:40,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1505/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 2.3073904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:40,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43368 samples/s/p 4:02:11 } +2024-07-25 21:07:43,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1507/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 2.3068595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:43,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43737 samples/s/p 4:01:58 } +2024-07-25 21:07:46,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1509/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 2.306328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:46,729 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43194 samples/s/p 4:02:10 } +2024-07-25 21:07:49,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1511/ 1625], loss: 1.307, per_step_time: 1471ms, lr: 2.3057966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:49,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43798 samples/s/p 4:01:51 } +2024-07-25 21:07:52,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1513/ 1625], loss: 1.062, per_step_time: 1473ms, lr: 2.3052648e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:52,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.42917 samples/s/p 4:02:11 } +2024-07-25 21:07:55,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1515/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 2.3047329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:55,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43258 samples/s/p 4:01:59 } +2024-07-25 21:07:58,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1517/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 2.3042008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:07:58,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43225 samples/s/p 4:01:57 } +2024-07-25 21:08:01,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1519/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.3036688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:01,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.3% |███████████████████ | 5.43265 samples/s/p 4:01:53 } +2024-07-25 
21:08:04,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1521/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.3031364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:04,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43727 samples/s/p 4:01:38 } +2024-07-25 21:08:07,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1523/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 2.302604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:07,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43688 samples/s/p 4:01:36 } +2024-07-25 21:08:10,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1525/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.3020715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:10,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43726 samples/s/p 4:01:32 } +2024-07-25 21:08:13,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1527/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 2.301539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:13,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43720 samples/s/p 4:01:29 } +2024-07-25 21:08:16,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1529/ 1625], loss: 1.072, per_step_time: 1473ms, lr: 2.301006e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:16,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.42945 samples/s/p 4:01:47 } +2024-07-25 21:08:19,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1531/ 1625], loss: 1.217, 
per_step_time: 1471ms, lr: 2.300473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:19,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43550 samples/s/p 4:01:28 } +2024-07-25 21:08:22,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1533/ 1625], loss: 1.127, per_step_time: 1473ms, lr: 2.29994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:22,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43084 samples/s/p 4:01:37 } +2024-07-25 21:08:25,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1535/ 1625], loss: 1.288, per_step_time: 1471ms, lr: 2.2994067e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:25,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.4% |███████████████████ | 5.43513 samples/s/p 4:01:23 } +2024-07-25 21:08:28,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1537/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 2.2988734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:28,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43770 samples/s/p 4:01:13 } +2024-07-25 21:08:30,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1539/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 2.2983397e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:30,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43540 samples/s/p 4:01:16 } +2024-07-25 21:08:33,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1541/ 1625], loss: 1.210, per_step_time: 1474ms, lr: 2.2978062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:33,952 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.42654 samples/s/p 4:01:37 } +2024-07-25 21:08:36,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1543/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 2.2972723e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:36,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43136 samples/s/p 4:01:21 } +2024-07-25 21:08:39,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1545/ 1625], loss: 1.297, per_step_time: 1472ms, lr: 2.2967384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:39,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43257 samples/s/p 4:01:15 } +2024-07-25 21:08:42,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1547/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 2.2962042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:42,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43843 samples/s/p 4:00:57 } +2024-07-25 21:08:45,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1549/ 1625], loss: 1.301, per_step_time: 1471ms, lr: 2.2956701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:45,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43532 samples/s/p 4:01:02 } +2024-07-25 21:08:48,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1551/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 2.2951357e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:48,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.5% |███████████████████ | 5.43803 samples/s/p 4:00:52 } +2024-07-25 
21:08:51,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1553/ 1625], loss: 1.106, per_step_time: 1474ms, lr: 2.2946011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:51,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.42539 samples/s/p 4:01:23 } +2024-07-25 21:08:54,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1555/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.2940667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:54,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43447 samples/s/p 4:00:55 } +2024-07-25 21:08:57,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1557/ 1625], loss: 1.210, per_step_time: 1471ms, lr: 2.2935319e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:08:57,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43626 samples/s/p 4:00:48 } +2024-07-25 21:09:00,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1559/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 2.2929971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:00,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43596 samples/s/p 4:00:46 } +2024-07-25 21:09:03,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1561/ 1625], loss: 1.404, per_step_time: 1473ms, lr: 2.292462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:03,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.42859 samples/s/p 4:01:02 } +2024-07-25 21:09:06,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1563/ 1625], loss: 1.004, 
per_step_time: 1472ms, lr: 2.2919272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:06,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43376 samples/s/p 4:00:45 } +2024-07-25 21:09:09,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1565/ 1625], loss: 1.079, per_step_time: 1472ms, lr: 2.2913915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:09,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43400 samples/s/p 4:00:42 } +2024-07-25 21:09:12,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1567/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 2.2908564e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:12,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.6% |███████████████████ | 5.43629 samples/s/p 4:00:33 } +2024-07-25 21:09:15,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1569/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 2.2903208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:15,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43171 samples/s/p 4:00:42 } +2024-07-25 21:09:18,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1571/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 2.2897852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:18,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43249 samples/s/p 4:00:37 } +2024-07-25 21:09:21,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1573/ 1625], loss: 1.202, per_step_time: 1472ms, lr: 2.2892493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:21,179 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43161 samples/s/p 4:00:36 } +2024-07-25 21:09:24,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1575/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 2.288713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:24,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43787 samples/s/p 4:00:17 } +2024-07-25 21:09:27,078 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1577/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.2881772e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:27,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43602 samples/s/p 4:00:19 } +2024-07-25 21:09:30,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1579/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 2.2876407e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:30,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43158 samples/s/p 4:00:28 } +2024-07-25 21:09:32,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1581/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 2.2871045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:32,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43183 samples/s/p 4:00:24 } +2024-07-25 21:09:35,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1583/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 2.286568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:35,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.7% |███████████████████ | 5.43404 samples/s/p 4:00:15 } +2024-07-25 
21:09:38,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1585/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.2860315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:38,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43505 samples/s/p 4:00:10 } +2024-07-25 21:09:41,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1587/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 2.2854943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:41,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43678 samples/s/p 4:00:02 } +2024-07-25 21:09:44,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1589/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 2.2849577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:44,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.42969 samples/s/p 4:00:18 } +2024-07-25 21:09:47,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1591/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.2844208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:47,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43727 samples/s/p 3:59:55 } +2024-07-25 21:09:50,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1593/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.2838836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:50,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43567 samples/s/p 3:59:56 } +2024-07-25 21:09:53,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1595/ 1625], loss: 1.215, 
per_step_time: 1470ms, lr: 2.283346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:53,638 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43955 samples/s/p 3:59:43 } +2024-07-25 21:09:56,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1597/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 2.2828086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:56,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.43356 samples/s/p 3:59:56 } +2024-07-25 21:09:59,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1599/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 2.282271e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:09:59,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.8% |███████████████████ | 5.44071 samples/s/p 3:59:34 } +2024-07-25 21:10:02,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1601/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 2.2817332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:02,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43664 samples/s/p 3:59:42 } +2024-07-25 21:10:05,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1603/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.2811953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:05,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43688 samples/s/p 3:59:38 } +2024-07-25 21:10:08,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1605/ 1625], loss: 1.096, per_step_time: 1470ms, lr: 2.2806575e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:08,387 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43916 samples/s/p 3:59:29 } +2024-07-25 21:10:11,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1607/ 1625], loss: 1.006, per_step_time: 1472ms, lr: 2.2801192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:11,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43258 samples/s/p 3:59:44 } +2024-07-25 21:10:14,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1609/ 1625], loss: 1.211, per_step_time: 1470ms, lr: 2.279581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:14,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43965 samples/s/p 3:59:22 } +2024-07-25 21:10:17,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1611/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 2.2790426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:17,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43236 samples/s/p 3:59:39 } +2024-07-25 21:10:20,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1613/ 1625], loss: 1.236, per_step_time: 1476ms, lr: 2.278504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:20,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.41891 samples/s/p 4:00:11 } +2024-07-25 21:10:23,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1615/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.2779652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:23,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 39.9% |███████████████████ | 5.43709 samples/s/p 3:59:20 } +2024-07-25 
21:10:26,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1617/ 1625], loss: 0.985, per_step_time: 1472ms, lr: 2.2774264e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:26,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.43423 samples/s/p 3:59:25 } +2024-07-25 21:10:29,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1619/ 1625], loss: 1.268, per_step_time: 1471ms, lr: 2.2768874e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:29,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.43762 samples/s/p 3:59:13 } +2024-07-25 21:10:32,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1621/ 1625], loss: 1.014, per_step_time: 1472ms, lr: 2.2763483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:32,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.43425 samples/s/p 3:59:19 } +2024-07-25 21:10:34,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1623/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 2.2758091e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:34,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |███████████████████ | 5.43684 samples/s/p 3:59:09 } +2024-07-25 21:10:37,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 4/ 10], step:[ 1625/ 1625], loss: 1.401, per_step_time: 1471ms, lr: 2.2752696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:37,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.43695 samples/s/p 3:59:06 } +2024-07-25 21:10:40,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 2/ 1625], loss: 1.101, 
per_step_time: 1471ms, lr: 2.2747303e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:40,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.43518 samples/s/p 3:59:08 } +2024-07-25 21:10:43,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 4/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 2.2741906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:43,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.43424 samples/s/p 3:59:07 } +2024-07-25 21:10:46,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 6/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 2.2736509e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:46,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.42820 samples/s/p 3:59:20 } +2024-07-25 21:10:49,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 8/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 2.2731108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:49,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.0% |████████████████████ | 5.43469 samples/s/p 3:59:00 } +2024-07-25 21:10:52,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 10/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 2.2725708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:52,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.43824 samples/s/p 3:58:48 } +2024-07-25 21:10:55,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 12/ 1625], loss: 1.227, per_step_time: 1478ms, lr: 2.2720307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:55,621 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.41136 samples/s/p 3:59:56 } +2024-07-25 21:10:58,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 14/ 1625], loss: 1.080, per_step_time: 1472ms, lr: 2.2714903e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:10:58,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.43454 samples/s/p 3:58:52 } +2024-07-25 21:11:01,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 16/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 2.27095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:01,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.42856 samples/s/p 3:59:04 } +2024-07-25 21:11:04,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 18/ 1625], loss: 1.031, per_step_time: 1471ms, lr: 2.2704093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:04,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.43504 samples/s/p 3:58:44 } +2024-07-25 21:11:07,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 20/ 1625], loss: 1.209, per_step_time: 1473ms, lr: 2.2698687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:07,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.42845 samples/s/p 3:58:59 } +2024-07-25 21:11:10,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 22/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 2.2693279e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:10,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.44004 samples/s/p 3:58:25 } +2024-07-25 
21:11:13,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 24/ 1625], loss: 1.094, per_step_time: 1473ms, lr: 2.268787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:13,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.1% |████████████████████ | 5.43094 samples/s/p 3:58:46 } +2024-07-25 21:11:16,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 26/ 1625], loss: 1.157, per_step_time: 1469ms, lr: 2.2682461e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:16,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.44457 samples/s/p 3:58:07 } +2024-07-25 21:11:19,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 28/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 2.2677044e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:19,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43516 samples/s/p 3:58:29 } +2024-07-25 21:11:22,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 30/ 1625], loss: 1.344, per_step_time: 1474ms, lr: 2.2671631e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:22,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.42643 samples/s/p 3:58:49 } +2024-07-25 21:11:25,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 32/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.2666221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:25,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43251 samples/s/p 3:58:30 } +2024-07-25 21:11:28,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 34/ 1625], loss: 1.310, per_step_time: 
1472ms, lr: 2.2660804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:28,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43180 samples/s/p 3:58:29 } +2024-07-25 21:11:31,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 36/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.2655384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:31,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43550 samples/s/p 3:58:17 } +2024-07-25 21:11:33,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 38/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 2.2649967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:33,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43128 samples/s/p 3:58:25 } +2024-07-25 21:11:36,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 40/ 1625], loss: 1.410, per_step_time: 1471ms, lr: 2.2644546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:36,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.2% |████████████████████ | 5.43729 samples/s/p 3:58:06 } +2024-07-25 21:11:39,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 42/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.2639124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:39,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43645 samples/s/p 3:58:05 } +2024-07-25 21:11:42,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 44/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 2.2633702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:42,842 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43870 samples/s/p 3:57:56 } +2024-07-25 21:11:45,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 46/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 2.2628277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:45,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43919 samples/s/p 3:57:52 } +2024-07-25 21:11:48,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 48/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 2.2622855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:48,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43560 samples/s/p 3:57:59 } +2024-07-25 21:11:51,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 50/ 1625], loss: 1.264, per_step_time: 1474ms, lr: 2.2617425e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:51,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.42718 samples/s/p 3:58:18 } +2024-07-25 21:11:54,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 52/ 1625], loss: 1.160, per_step_time: 1474ms, lr: 2.2611997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:54,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.42707 samples/s/p 3:58:15 } +2024-07-25 21:11:57,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 54/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.2606571e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:11:57,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43740 samples/s/p 3:57:45 } +2024-07-25 
21:12:00,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 56/ 1625], loss: 1.319, per_step_time: 1472ms, lr: 2.260114e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:00,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.3% |████████████████████ | 5.43236 samples/s/p 3:57:55 } +2024-07-25 21:12:03,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 58/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 2.2595706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:03,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43614 samples/s/p 3:57:43 } +2024-07-25 21:12:06,455 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 60/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.2590275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:06,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43231 samples/s/p 3:57:50 } +2024-07-25 21:12:09,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 62/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 2.258484e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:09,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43458 samples/s/p 3:57:41 } +2024-07-25 21:12:12,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 64/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 2.2579403e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:12,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43638 samples/s/p 3:57:33 } +2024-07-25 21:12:15,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 66/ 1625], loss: 1.032, per_step_time: 
1471ms, lr: 2.2573966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:15,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43742 samples/s/p 3:57:27 } +2024-07-25 21:12:18,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 68/ 1625], loss: 1.121, per_step_time: 1477ms, lr: 2.2568527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:18,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.41538 samples/s/p 3:58:22 } +2024-07-25 21:12:21,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 70/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.2563088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:21,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43511 samples/s/p 3:57:28 } +2024-07-25 21:12:24,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 72/ 1625], loss: 1.486, per_step_time: 1472ms, lr: 2.2557646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:24,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.4% |████████████████████ | 5.43299 samples/s/p 3:57:30 } +2024-07-25 21:12:27,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 74/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 2.2552204e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:27,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43140 samples/s/p 3:57:31 } +2024-07-25 21:12:30,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 76/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 2.254676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:30,073 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43576 samples/s/p 3:57:17 } +2024-07-25 21:12:33,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 78/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 2.2541315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:33,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43714 samples/s/p 3:57:11 } +2024-07-25 21:12:35,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 80/ 1625], loss: 1.175, per_step_time: 1473ms, lr: 2.2535869e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:35,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43070 samples/s/p 3:57:24 } +2024-07-25 21:12:38,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 82/ 1625], loss: 1.286, per_step_time: 1471ms, lr: 2.2530421e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:38,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43569 samples/s/p 3:57:08 } +2024-07-25 21:12:41,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 84/ 1625], loss: 0.951, per_step_time: 1472ms, lr: 2.2524971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:41,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43308 samples/s/p 3:57:12 } +2024-07-25 21:12:44,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 86/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 2.2519522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:44,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.43357 samples/s/p 3:57:08 } +2024-07-25 
21:12:47,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 88/ 1625], loss: 1.229, per_step_time: 1474ms, lr: 2.251407e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:47,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.5% |████████████████████ | 5.42710 samples/s/p 3:57:22 } +2024-07-25 21:12:50,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 90/ 1625], loss: 1.149, per_step_time: 1474ms, lr: 2.2508617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:50,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.42380 samples/s/p 3:57:28 } +2024-07-25 21:12:53,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 92/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 2.2503164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:53,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43869 samples/s/p 3:56:46 } +2024-07-25 21:12:56,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 94/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 2.2497707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:56,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43752 samples/s/p 3:56:46 } +2024-07-25 21:12:59,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 96/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.2492251e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:12:59,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43526 samples/s/p 3:56:49 } +2024-07-25 21:13:02,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 98/ 1625], loss: 1.096, per_step_time: 
1471ms, lr: 2.2486793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:02,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43715 samples/s/p 3:56:41 } +2024-07-25 21:13:05,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 100/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 2.2481334e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:05,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43399 samples/s/p 3:56:46 } +2024-07-25 21:13:08,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 102/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.2475871e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:08,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.43636 samples/s/p 3:56:37 } +2024-07-25 21:13:11,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 104/ 1625], loss: 1.066, per_step_time: 1469ms, lr: 2.247041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:11,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.6% |████████████████████ | 5.44220 samples/s/p 3:56:19 } +2024-07-25 21:13:14,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 106/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 2.2464947e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:14,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43843 samples/s/p 3:56:26 } +2024-07-25 21:13:17,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 108/ 1625], loss: 1.106, per_step_time: 1470ms, lr: 2.245948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:17,287 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.44190 samples/s/p 3:56:14 } +2024-07-25 21:13:20,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 110/ 1625], loss: 1.275, per_step_time: 1473ms, lr: 2.2454016e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:20,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43019 samples/s/p 3:56:42 } +2024-07-25 21:13:23,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 112/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 2.2448548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:23,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43740 samples/s/p 3:56:20 } +2024-07-25 21:13:26,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 114/ 1625], loss: 0.954, per_step_time: 1470ms, lr: 2.244308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:26,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.44026 samples/s/p 3:56:09 } +2024-07-25 21:13:29,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 116/ 1625], loss: 1.193, per_step_time: 1473ms, lr: 2.2437613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:29,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.42918 samples/s/p 3:56:35 } +2024-07-25 21:13:32,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 118/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 2.243214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:32,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43059 samples/s/p 3:56:29 } +2024-07-25 
21:13:34,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 120/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 2.242667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:34,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.7% |████████████████████ | 5.43214 samples/s/p 3:56:22 } +2024-07-25 21:13:37,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 122/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 2.2421198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:37,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43362 samples/s/p 3:56:15 } +2024-07-25 21:13:40,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 124/ 1625], loss: 1.312, per_step_time: 1471ms, lr: 2.2415721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:40,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43734 samples/s/p 3:56:02 } +2024-07-25 21:13:43,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 126/ 1625], loss: 1.092, per_step_time: 1473ms, lr: 2.2410246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:43,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.42935 samples/s/p 3:56:20 } +2024-07-25 21:13:46,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 128/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.2404767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:46,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43285 samples/s/p 3:56:08 } +2024-07-25 21:13:49,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 130/ 1625], loss: 1.086, 
per_step_time: 1473ms, lr: 2.239929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:49,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.42857 samples/s/p 3:56:16 } +2024-07-25 21:13:52,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 132/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 2.2393811e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:52,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43838 samples/s/p 3:55:48 } +2024-07-25 21:13:55,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 134/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 2.2388327e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:55,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43677 samples/s/p 3:55:49 } +2024-07-25 21:13:58,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 136/ 1625], loss: 1.397, per_step_time: 1472ms, lr: 2.2382847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:13:58,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43222 samples/s/p 3:55:58 } +2024-07-25 21:14:01,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 138/ 1625], loss: 1.244, per_step_time: 1471ms, lr: 2.2377366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:01,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.8% |████████████████████ | 5.43787 samples/s/p 3:55:40 } +2024-07-25 21:14:04,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 140/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 2.2371878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:04,509 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43977 samples/s/p 3:55:32 } +2024-07-25 21:14:07,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 142/ 1625], loss: 1.356, per_step_time: 1472ms, lr: 2.2366394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:07,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43114 samples/s/p 3:55:52 } +2024-07-25 21:14:10,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 144/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.2360906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:10,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43292 samples/s/p 3:55:44 } +2024-07-25 21:14:13,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 146/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 2.2355418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:13,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43508 samples/s/p 3:55:36 } +2024-07-25 21:14:16,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 148/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.2349928e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:16,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43352 samples/s/p 3:55:37 } +2024-07-25 21:14:19,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 150/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.2344437e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:19,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43697 samples/s/p 3:55:25 } +2024-07-25 
21:14:22,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 152/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 2.2338943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:22,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43206 samples/s/p 3:55:35 } +2024-07-25 21:14:25,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 154/ 1625], loss: 1.081, per_step_time: 1470ms, lr: 2.233345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:25,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 40.9% |████████████████████ | 5.43880 samples/s/p 3:55:14 } +2024-07-25 21:14:28,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 156/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.2327955e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:28,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43207 samples/s/p 3:55:29 } +2024-07-25 21:14:31,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 158/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 2.232246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:31,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.42919 samples/s/p 3:55:33 } +2024-07-25 21:14:34,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 160/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 2.2316963e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:34,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43524 samples/s/p 3:55:15 } +2024-07-25 21:14:36,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 162/ 1625], loss: 1.231, 
per_step_time: 1472ms, lr: 2.2311464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:36,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43344 samples/s/p 3:55:17 } +2024-07-25 21:14:39,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 164/ 1625], loss: 1.055, per_step_time: 1469ms, lr: 2.2305963e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:39,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.44285 samples/s/p 3:54:49 } +2024-07-25 21:14:42,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 166/ 1625], loss: 1.024, per_step_time: 1472ms, lr: 2.230046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:42,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43332 samples/s/p 3:55:11 } +2024-07-25 21:14:45,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 168/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 2.229496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:45,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43076 samples/s/p 3:55:15 } +2024-07-25 21:14:48,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 170/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 2.2289454e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:48,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.0% |████████████████████ | 5.43744 samples/s/p 3:54:54 } +2024-07-25 21:14:51,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 172/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 2.2283948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:51,731 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.42948 samples/s/p 3:55:12 } +2024-07-25 21:14:54,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 174/ 1625], loss: 1.076, per_step_time: 1470ms, lr: 2.2278444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:54,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.44094 samples/s/p 3:54:39 } +2024-07-25 21:14:57,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 176/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 2.2272936e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:14:57,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.43343 samples/s/p 3:54:56 } +2024-07-25 21:15:00,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 178/ 1625], loss: 1.280, per_step_time: 1471ms, lr: 2.2267428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:00,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.43560 samples/s/p 3:54:47 } +2024-07-25 21:15:03,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 180/ 1625], loss: 1.200, per_step_time: 1469ms, lr: 2.2261916e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:03,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.44245 samples/s/p 3:54:27 } +2024-07-25 21:15:06,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 182/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 2.2256405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:06,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.43716 samples/s/p 3:54:37 } +2024-07-25 
21:15:09,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 184/ 1625], loss: 1.067, per_step_time: 1471ms, lr: 2.2250892e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:09,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.43479 samples/s/p 3:54:41 } +2024-07-25 21:15:12,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 186/ 1625], loss: 1.024, per_step_time: 1470ms, lr: 2.2245378e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:12,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.1% |████████████████████ | 5.44171 samples/s/p 3:54:20 } +2024-07-25 21:15:15,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 188/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 2.2239865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:15,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43657 samples/s/p 3:54:30 } +2024-07-25 21:15:18,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 190/ 1625], loss: 1.009, per_step_time: 1469ms, lr: 2.2234346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:18,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.44358 samples/s/p 3:54:09 } +2024-07-25 21:15:21,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 192/ 1625], loss: 1.009, per_step_time: 1471ms, lr: 2.2228829e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:21,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43519 samples/s/p 3:54:28 } +2024-07-25 21:15:24,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 194/ 1625], loss: 1.187, 
per_step_time: 1472ms, lr: 2.222331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:24,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43193 samples/s/p 3:54:33 } +2024-07-25 21:15:27,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 196/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 2.2217791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:27,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43236 samples/s/p 3:54:29 } +2024-07-25 21:15:30,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 198/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 2.2212269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:30,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43908 samples/s/p 3:54:09 } +2024-07-25 21:15:33,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 200/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 2.2206747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:33,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43389 samples/s/p 3:54:19 } +2024-07-25 21:15:35,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 202/ 1625], loss: 1.181, per_step_time: 1473ms, lr: 2.2201222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:35,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.2% |████████████████████ | 5.43089 samples/s/p 3:54:24 } +2024-07-25 21:15:38,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 204/ 1625], loss: 1.290, per_step_time: 1473ms, lr: 2.21957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:38,935 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43006 samples/s/p 3:54:23 } +2024-07-25 21:15:41,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 206/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 2.2190172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:41,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.44198 samples/s/p 3:53:50 } +2024-07-25 21:15:44,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 208/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 2.2184644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:44,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43229 samples/s/p 3:54:12 } +2024-07-25 21:15:47,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 210/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 2.2179118e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:47,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43296 samples/s/p 3:54:07 } +2024-07-25 21:15:50,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 212/ 1625], loss: 1.039, per_step_time: 1471ms, lr: 2.2173588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:50,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43582 samples/s/p 3:53:57 } +2024-07-25 21:15:53,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 214/ 1625], loss: 1.273, per_step_time: 1473ms, lr: 2.2168053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:53,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.42986 samples/s/p 3:54:09 } +2024-07-25 
21:15:56,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 216/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 2.2162525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:56,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43454 samples/s/p 3:53:54 } +2024-07-25 21:15:59,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 218/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 2.2156992e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:15:59,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.3% |████████████████████ | 5.43664 samples/s/p 3:53:46 } +2024-07-25 21:16:02,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 220/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 2.2151457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:02,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43692 samples/s/p 3:53:42 } +2024-07-25 21:16:05,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 222/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.214592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:05,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43648 samples/s/p 3:53:40 } +2024-07-25 21:16:08,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 224/ 1625], loss: 0.893, per_step_time: 1471ms, lr: 2.2140382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:08,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43684 samples/s/p 3:53:36 } +2024-07-25 21:16:11,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 226/ 1625], loss: 1.085, 
per_step_time: 1470ms, lr: 2.2134847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:11,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43848 samples/s/p 3:53:29 } +2024-07-25 21:16:14,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 228/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.2129307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:14,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43402 samples/s/p 3:53:38 } +2024-07-25 21:16:17,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 230/ 1625], loss: 0.865, per_step_time: 1471ms, lr: 2.2123762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:17,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43532 samples/s/p 3:53:32 } +2024-07-25 21:16:20,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 232/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 2.2118224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:20,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43192 samples/s/p 3:53:37 } +2024-07-25 21:16:23,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 234/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 2.211268e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:23,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.4% |████████████████████ | 5.43315 samples/s/p 3:53:31 } +2024-07-25 21:16:26,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 236/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 2.2107135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:26,149 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43274 samples/s/p 3:53:29 } +2024-07-25 21:16:29,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 238/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 2.210159e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:29,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43699 samples/s/p 3:53:15 } +2024-07-25 21:16:32,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 240/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 2.2096043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:32,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43585 samples/s/p 3:53:15 } +2024-07-25 21:16:34,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 242/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 2.2090495e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:34,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43626 samples/s/p 3:53:11 } +2024-07-25 21:16:37,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 244/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.2084943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:37,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43729 samples/s/p 3:53:06 } +2024-07-25 21:16:40,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 246/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.2079394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:40,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43511 samples/s/p 3:53:09 } +2024-07-25 
21:16:43,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 248/ 1625], loss: 1.072, per_step_time: 1473ms, lr: 2.2073842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:43,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43102 samples/s/p 3:53:16 } +2024-07-25 21:16:46,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 250/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 2.2068289e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:46,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.5% |████████████████████ | 5.43565 samples/s/p 3:53:01 } +2024-07-25 21:16:49,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 252/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 2.2062733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:49,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43823 samples/s/p 3:52:52 } +2024-07-25 21:16:52,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 254/ 1625], loss: 1.130, per_step_time: 1473ms, lr: 2.2057178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:52,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.42982 samples/s/p 3:53:10 } +2024-07-25 21:16:55,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 256/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 2.2051621e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:55,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43187 samples/s/p 3:53:02 } +2024-07-25 21:16:58,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 258/ 1625], loss: 1.149, 
per_step_time: 1473ms, lr: 2.2046064e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:16:58,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43043 samples/s/p 3:53:03 } +2024-07-25 21:17:01,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 260/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.2040504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:01,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43554 samples/s/p 3:52:47 } +2024-07-25 21:17:04,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 262/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 2.2034943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:04,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43405 samples/s/p 3:52:48 } +2024-07-25 21:17:07,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 264/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 2.2029382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:07,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.42970 samples/s/p 3:52:56 } +2024-07-25 21:17:10,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 266/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 2.2023818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:10,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.43298 samples/s/p 3:52:45 } +2024-07-25 21:17:13,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 268/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 2.2018256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:13,368 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.6% |████████████████████ | 5.44015 samples/s/p 3:52:23 } +2024-07-25 21:17:16,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 270/ 1625], loss: 1.085, per_step_time: 1473ms, lr: 2.201269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:16,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.42958 samples/s/p 3:52:47 } +2024-07-25 21:17:19,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 272/ 1625], loss: 1.076, per_step_time: 1470ms, lr: 2.2007122e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:19,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.44055 samples/s/p 3:52:16 } +2024-07-25 21:17:22,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 274/ 1625], loss: 1.100, per_step_time: 1470ms, lr: 2.2001554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:22,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43873 samples/s/p 3:52:18 } +2024-07-25 21:17:25,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 276/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 2.1995987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:25,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.44059 samples/s/p 3:52:10 } +2024-07-25 21:17:28,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 278/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 2.1990416e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:28,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43685 samples/s/p 3:52:17 } +2024-07-25 
21:17:31,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 280/ 1625], loss: 1.223, per_step_time: 1470ms, lr: 2.1984844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:31,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.44088 samples/s/p 3:52:04 } +2024-07-25 21:17:34,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 282/ 1625], loss: 1.264, per_step_time: 1472ms, lr: 2.1979271e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:34,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43194 samples/s/p 3:52:24 } +2024-07-25 21:17:36,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 284/ 1625], loss: 1.397, per_step_time: 1470ms, lr: 2.19737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:36,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.7% |████████████████████ | 5.43865 samples/s/p 3:52:04 } +2024-07-25 21:17:39,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 286/ 1625], loss: 1.279, per_step_time: 1475ms, lr: 2.1968124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:39,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.42193 samples/s/p 3:52:44 } +2024-07-25 21:17:42,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 288/ 1625], loss: 1.129, per_step_time: 1473ms, lr: 2.1962549e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:42,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43086 samples/s/p 3:52:18 } +2024-07-25 21:17:45,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 290/ 1625], loss: 1.272, 
per_step_time: 1471ms, lr: 2.195697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:45,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43779 samples/s/p 3:51:57 } +2024-07-25 21:17:48,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 292/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 2.1951395e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:48,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43832 samples/s/p 3:51:53 } +2024-07-25 21:17:51,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 294/ 1625], loss: 1.277, per_step_time: 1472ms, lr: 2.1945816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:51,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43253 samples/s/p 3:52:05 } +2024-07-25 21:17:54,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 296/ 1625], loss: 1.111, per_step_time: 1473ms, lr: 2.1940232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:54,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.42905 samples/s/p 3:52:10 } +2024-07-25 21:17:57,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 298/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 2.1934653e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:17:57,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43731 samples/s/p 3:51:46 } +2024-07-25 21:18:00,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 300/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 2.192907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:00,583 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.8% |████████████████████ | 5.43489 samples/s/p 3:51:50 } +2024-07-25 21:18:03,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 302/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.1923484e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:03,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.43532 samples/s/p 3:51:46 } +2024-07-25 21:18:06,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 304/ 1625], loss: 1.182, per_step_time: 1473ms, lr: 2.1917898e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:06,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.42774 samples/s/p 3:52:02 } +2024-07-25 21:18:09,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 306/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 2.1912314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:09,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.43251 samples/s/p 3:51:47 } +2024-07-25 21:18:12,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 308/ 1625], loss: 1.331, per_step_time: 1473ms, lr: 2.1906724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:12,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.42791 samples/s/p 3:51:56 } +2024-07-25 21:18:15,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 310/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 2.1901134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:15,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.43412 samples/s/p 3:51:37 } +2024-07-25 
21:18:18,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 312/ 1625], loss: 1.112, per_step_time: 1474ms, lr: 2.1895545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:18,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.42723 samples/s/p 3:51:52 } +2024-07-25 21:18:21,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 314/ 1625], loss: 1.071, per_step_time: 1477ms, lr: 2.1889953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:21,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.41521 samples/s/p 3:52:19 } +2024-07-25 21:18:24,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 316/ 1625], loss: 1.104, per_step_time: 1470ms, lr: 2.1884363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:24,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 41.9% |████████████████████ | 5.44043 samples/s/p 3:51:12 } +2024-07-25 21:18:27,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 318/ 1625], loss: 1.022, per_step_time: 1472ms, lr: 2.1878766e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:27,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.43400 samples/s/p 3:51:25 } +2024-07-25 21:18:30,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 320/ 1625], loss: 1.065, per_step_time: 1473ms, lr: 2.1873175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:30,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.42997 samples/s/p 3:51:33 } +2024-07-25 21:18:33,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 322/ 1625], loss: 1.218, 
per_step_time: 1473ms, lr: 2.186758e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:33,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.43060 samples/s/p 3:51:28 } +2024-07-25 21:18:36,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 324/ 1625], loss: 0.832, per_step_time: 1472ms, lr: 2.1861983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:36,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |████████████████████ | 5.43468 samples/s/p 3:51:15 } +2024-07-25 21:18:38,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 326/ 1625], loss: 1.284, per_step_time: 1470ms, lr: 2.1856382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:38,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.44043 samples/s/p 3:50:57 } +2024-07-25 21:18:41,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 328/ 1625], loss: 1.301, per_step_time: 1471ms, lr: 2.1850783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:41,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.43642 samples/s/p 3:51:05 } +2024-07-25 21:18:44,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 330/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.1845182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:44,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.43382 samples/s/p 3:51:08 } +2024-07-25 21:18:47,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 332/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 2.183958e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:47,821 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.0% |█████████████████████ | 5.43470 samples/s/p 3:51:03 } +2024-07-25 21:18:50,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 334/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.1833976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:50,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43612 samples/s/p 3:50:56 } +2024-07-25 21:18:53,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 336/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 2.1828373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:53,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43950 samples/s/p 3:50:45 } +2024-07-25 21:18:56,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 338/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 2.1822767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:56,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43821 samples/s/p 3:50:45 } +2024-07-25 21:18:59,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 340/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 2.1817159e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:18:59,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43318 samples/s/p 3:50:55 } +2024-07-25 21:19:02,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 342/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 2.1811553e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:02,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43899 samples/s/p 3:50:37 } 
+2024-07-25 21:19:05,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 344/ 1625], loss: 1.367, per_step_time: 1471ms, lr: 2.1805943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:05,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43646 samples/s/p 3:50:41 } +2024-07-25 21:19:08,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 346/ 1625], loss: 1.228, per_step_time: 1471ms, lr: 2.1800332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:08,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43564 samples/s/p 3:50:40 } +2024-07-25 21:19:11,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 348/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 2.1794722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:11,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.1% |█████████████████████ | 5.43793 samples/s/p 3:50:31 } +2024-07-25 21:19:14,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 350/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 2.1789108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:14,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43957 samples/s/p 3:50:24 } +2024-07-25 21:19:17,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 352/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 2.1783495e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:17,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43422 samples/s/p 3:50:35 } +2024-07-25 21:19:20,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 354/ 1625], loss: 
1.221, per_step_time: 1471ms, lr: 2.177788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:20,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43788 samples/s/p 3:50:23 } +2024-07-25 21:19:23,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 356/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 2.1772265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:23,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.44102 samples/s/p 3:50:12 } +2024-07-25 21:19:26,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 358/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 2.1766646e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:26,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43282 samples/s/p 3:50:30 } +2024-07-25 21:19:29,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 360/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 2.1761029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:29,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43610 samples/s/p 3:50:18 } +2024-07-25 21:19:32,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 362/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 2.1755408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:32,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.43038 samples/s/p 3:50:30 } +2024-07-25 21:19:35,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 364/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 2.1749787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:35,020 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.2% |█████████████████████ | 5.44012 samples/s/p 3:50:02 } +2024-07-25 21:19:37,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 366/ 1625], loss: 1.285, per_step_time: 1471ms, lr: 2.1744167e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:37,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43573 samples/s/p 3:50:10 } +2024-07-25 21:19:40,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 368/ 1625], loss: 1.078, per_step_time: 1470ms, lr: 2.1738544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:40,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.44078 samples/s/p 3:49:55 } +2024-07-25 21:19:43,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 370/ 1625], loss: 1.036, per_step_time: 1471ms, lr: 2.173292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:43,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43584 samples/s/p 3:50:04 } +2024-07-25 21:19:46,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 372/ 1625], loss: 0.984, per_step_time: 1469ms, lr: 2.1727295e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:46,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.44425 samples/s/p 3:49:40 } +2024-07-25 21:19:49,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 374/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.1721668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:49,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43613 samples/s/p 3:49:58 } 
+2024-07-25 21:19:52,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 376/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 2.1716038e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:52,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43286 samples/s/p 3:50:03 } +2024-07-25 21:19:55,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 378/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 2.171041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:55,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43439 samples/s/p 3:49:56 } +2024-07-25 21:19:58,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 380/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.170478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:19:58,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.3% |█████████████████████ | 5.43705 samples/s/p 3:49:46 } +2024-07-25 21:20:01,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 382/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 2.1699154e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:01,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43209 samples/s/p 3:49:56 } +2024-07-25 21:20:04,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 384/ 1625], loss: 1.186, per_step_time: 1469ms, lr: 2.169352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:04,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.44361 samples/s/p 3:49:24 } +2024-07-25 21:20:07,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 386/ 1625], loss: 
1.215, per_step_time: 1474ms, lr: 2.1687883e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:07,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.42524 samples/s/p 3:50:08 } +2024-07-25 21:20:10,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 388/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 2.1682252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:10,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43525 samples/s/p 3:49:39 } +2024-07-25 21:20:13,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 390/ 1625], loss: 1.114, per_step_time: 1473ms, lr: 2.1676618e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:13,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.42972 samples/s/p 3:49:50 } +2024-07-25 21:20:16,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 392/ 1625], loss: 1.020, per_step_time: 1473ms, lr: 2.1670981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:16,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.42910 samples/s/p 3:49:49 } +2024-07-25 21:20:19,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 394/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 2.1665343e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:19,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43134 samples/s/p 3:49:40 } +2024-07-25 21:20:22,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 396/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 2.1659704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:22,235 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43762 samples/s/p 3:49:21 } +2024-07-25 21:20:25,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 398/ 1625], loss: 1.132, per_step_time: 1473ms, lr: 2.1654067e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:25,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.4% |█████████████████████ | 5.43061 samples/s/p 3:49:36 } +2024-07-25 21:20:28,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 400/ 1625], loss: 1.293, per_step_time: 1473ms, lr: 2.1648422e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:28,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.43052 samples/s/p 3:49:34 } +2024-07-25 21:20:31,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 402/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 2.164278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:31,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.43452 samples/s/p 3:49:20 } +2024-07-25 21:20:34,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 404/ 1625], loss: 1.232, per_step_time: 1474ms, lr: 2.1637139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:34,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.42422 samples/s/p 3:49:44 } +2024-07-25 21:20:36,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 406/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 2.1631497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:36,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.44069 samples/s/p 3:48:59 } 
+2024-07-25 21:20:39,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 408/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 2.1625845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:39,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.43156 samples/s/p 3:49:19 } +2024-07-25 21:20:42,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 410/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.1620202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:42,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.43556 samples/s/p 3:49:06 } +2024-07-25 21:20:45,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 412/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 2.1614554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:45,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.43983 samples/s/p 3:48:52 } +2024-07-25 21:20:48,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 414/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 2.1608905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:48,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.5% |█████████████████████ | 5.42929 samples/s/p 3:49:16 } +2024-07-25 21:20:51,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 416/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 2.1603255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:51,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43894 samples/s/p 3:48:49 } +2024-07-25 21:20:54,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 418/ 1625], loss: 
1.063, per_step_time: 1471ms, lr: 2.1597603e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:54,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43819 samples/s/p 3:48:48 } +2024-07-25 21:20:57,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 420/ 1625], loss: 1.136, per_step_time: 1474ms, lr: 2.159195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:20:57,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.42705 samples/s/p 3:49:13 } +2024-07-25 21:21:00,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 422/ 1625], loss: 1.040, per_step_time: 1471ms, lr: 2.1586296e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:00,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43612 samples/s/p 3:48:47 } +2024-07-25 21:21:03,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 424/ 1625], loss: 1.240, per_step_time: 1470ms, lr: 2.1580643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:03,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43913 samples/s/p 3:48:36 } +2024-07-25 21:21:06,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 426/ 1625], loss: 1.124, per_step_time: 1469ms, lr: 2.1574986e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:06,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.44231 samples/s/p 3:48:25 } +2024-07-25 21:21:09,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 428/ 1625], loss: 1.040, per_step_time: 1471ms, lr: 2.1569329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:09,451 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.43828 samples/s/p 3:48:33 } +2024-07-25 21:21:12,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 430/ 1625], loss: 1.228, per_step_time: 1470ms, lr: 2.1563672e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:12,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.6% |█████████████████████ | 5.44080 samples/s/p 3:48:23 } +2024-07-25 21:21:15,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 432/ 1625], loss: 1.040, per_step_time: 1470ms, lr: 2.1558013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:15,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.44027 samples/s/p 3:48:22 } +2024-07-25 21:21:18,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 434/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 2.1552352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:18,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.43403 samples/s/p 3:48:35 } +2024-07-25 21:21:21,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 436/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 2.1546688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:21,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.43769 samples/s/p 3:48:22 } +2024-07-25 21:21:24,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 438/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 2.1541025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:24,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.42863 samples/s/p 3:48:42 } 
+2024-07-25 21:21:27,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 440/ 1625], loss: 1.314, per_step_time: 1472ms, lr: 2.1535363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:27,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.43325 samples/s/p 3:48:28 } +2024-07-25 21:21:30,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 442/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.1529699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:30,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.43449 samples/s/p 3:48:22 } +2024-07-25 21:21:33,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 444/ 1625], loss: 1.197, per_step_time: 1473ms, lr: 2.1524032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:33,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.42985 samples/s/p 3:48:30 } +2024-07-25 21:21:36,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 446/ 1625], loss: 1.057, per_step_time: 1469ms, lr: 2.1518365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:36,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.7% |█████████████████████ | 5.44268 samples/s/p 3:47:55 } +2024-07-25 21:21:38,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 448/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 2.1512697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:38,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43487 samples/s/p 3:48:12 } +2024-07-25 21:21:41,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 450/ 1625], loss: 
1.106, per_step_time: 1472ms, lr: 2.1507029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:41,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43170 samples/s/p 3:48:17 } +2024-07-25 21:21:44,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 452/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 2.1501357e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:44,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43252 samples/s/p 3:48:12 } +2024-07-25 21:21:47,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 454/ 1625], loss: 1.194, per_step_time: 1474ms, lr: 2.1495687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:47,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.42487 samples/s/p 3:48:28 } +2024-07-25 21:21:50,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 456/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 2.1490014e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:50,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43461 samples/s/p 3:48:01 } +2024-07-25 21:21:53,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 458/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.148434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:53,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43209 samples/s/p 3:48:04 } +2024-07-25 21:21:56,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 460/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 2.1478665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:56,670 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43743 samples/s/p 3:47:48 } +2024-07-25 21:21:59,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 462/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 2.147299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:21:59,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.8% |█████████████████████ | 5.43705 samples/s/p 3:47:46 } +2024-07-25 21:22:02,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 464/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 2.1467313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:02,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43403 samples/s/p 3:47:50 } +2024-07-25 21:22:05,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 466/ 1625], loss: 0.995, per_step_time: 1473ms, lr: 2.1461634e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:05,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43008 samples/s/p 3:47:57 } +2024-07-25 21:22:08,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 468/ 1625], loss: 1.279, per_step_time: 1472ms, lr: 2.1455955e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:08,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43421 samples/s/p 3:47:44 } +2024-07-25 21:22:11,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 470/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 2.1450276e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:11,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43642 samples/s/p 3:47:36 } 
+2024-07-25 21:22:14,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 472/ 1625], loss: 0.970, per_step_time: 1472ms, lr: 2.1444595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:14,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43298 samples/s/p 3:47:41 } +2024-07-25 21:22:17,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 474/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 2.143891e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:17,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.44175 samples/s/p 3:47:16 } +2024-07-25 21:22:20,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 476/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 2.1433229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:20,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43495 samples/s/p 3:47:30 } +2024-07-25 21:22:23,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 478/ 1625], loss: 1.252, per_step_time: 1473ms, lr: 2.1427542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:23,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 42.9% |█████████████████████ | 5.43108 samples/s/p 3:47:37 } +2024-07-25 21:22:26,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 480/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 2.1421858e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:26,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43614 samples/s/p 3:47:22 } +2024-07-25 21:22:29,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 482/ 1625], loss: 
1.258, per_step_time: 1470ms, lr: 2.141617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:29,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43897 samples/s/p 3:47:12 } +2024-07-25 21:22:32,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 484/ 1625], loss: 1.018, per_step_time: 1469ms, lr: 2.1410482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:32,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.44279 samples/s/p 3:46:59 } +2024-07-25 21:22:35,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 486/ 1625], loss: 1.282, per_step_time: 1468ms, lr: 2.1404794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:35,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.44696 samples/s/p 3:46:46 } +2024-07-25 21:22:37,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 488/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 2.1399102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:37,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43530 samples/s/p 3:47:12 } +2024-07-25 21:22:40,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 490/ 1625], loss: 1.232, per_step_time: 1470ms, lr: 2.139341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:40,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.44167 samples/s/p 3:46:53 } +2024-07-25 21:22:43,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 492/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 2.1387721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:43,868 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43523 samples/s/p 3:47:06 } +2024-07-25 21:22:46,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 494/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 2.1382028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:46,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.0% |█████████████████████ | 5.43323 samples/s/p 3:47:08 } +2024-07-25 21:22:49,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 496/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 2.137633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:49,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43728 samples/s/p 3:46:55 } +2024-07-25 21:22:52,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 498/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.1370637e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:52,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43364 samples/s/p 3:47:01 } +2024-07-25 21:22:55,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 500/ 1625], loss: 1.160, per_step_time: 1470ms, lr: 2.136494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:22:55,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43864 samples/s/p 3:46:46 } +2024-07-25 21:22:55,671 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 21:23:31,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 502/ 1625], loss: 1.250, per_step_time: 2148ms, lr: 2.1359243e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:31,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 3.72293 samples/s/p 5:31:12 } +2024-07-25 21:23:34,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 504/ 1625], loss: 1.230, per_step_time: 1475ms, lr: 2.1353544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:34,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.42037 samples/s/p 3:47:26 } +2024-07-25 21:23:37,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 506/ 1625], loss: 1.050, per_step_time: 1472ms, lr: 2.1347843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:37,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43432 samples/s/p 3:46:48 } +2024-07-25 21:23:40,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 508/ 1625], loss: 1.331, per_step_time: 1473ms, lr: 2.1342143e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:40,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43045 samples/s/p 3:46:55 } +2024-07-25 21:23:43,178 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 510/ 1625], loss: 1.052, per_step_time: 1471ms, lr: 2.133644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:43,178 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.1% |█████████████████████ | 5.43522 samples/s/p 3:46:40 } +2024-07-25 21:23:46,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 512/ 1625], loss: 
1.202, per_step_time: 1473ms, lr: 2.1330738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:46,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43029 samples/s/p 3:46:49 } +2024-07-25 21:23:49,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 514/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 2.1325033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:49,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43848 samples/s/p 3:46:26 } +2024-07-25 21:23:52,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 516/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 2.1319329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:52,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43052 samples/s/p 3:46:43 } +2024-07-25 21:23:54,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 518/ 1625], loss: 1.164, per_step_time: 1472ms, lr: 2.1313623e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:54,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43267 samples/s/p 3:46:34 } +2024-07-25 21:23:57,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 520/ 1625], loss: 1.310, per_step_time: 1473ms, lr: 2.1307915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:23:57,940 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43001 samples/s/p 3:46:38 } +2024-07-25 21:24:00,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 522/ 1625], loss: 1.320, per_step_time: 1471ms, lr: 2.1302207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:00,889 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43804 samples/s/p 3:46:15 } +2024-07-25 21:24:03,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 524/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 2.1296497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:03,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43590 samples/s/p 3:46:17 } +2024-07-25 21:24:06,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 526/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 2.1290785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:06,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43385 samples/s/p 3:46:20 } +2024-07-25 21:24:09,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 528/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.1285074e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:09,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.2% |█████████████████████ | 5.43715 samples/s/p 3:46:08 } +2024-07-25 21:24:12,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 530/ 1625], loss: 1.178, per_step_time: 1469ms, lr: 2.1279362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:12,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.44398 samples/s/p 3:45:48 } +2024-07-25 21:24:15,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 532/ 1625], loss: 1.005, per_step_time: 1470ms, lr: 2.1273649e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:15,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43892 samples/s/p 3:45:58 } 
+2024-07-25 21:24:18,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 534/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 2.1267933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:18,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43539 samples/s/p 3:46:04 } +2024-07-25 21:24:21,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 536/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 2.1262214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:21,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43417 samples/s/p 3:46:04 } +2024-07-25 21:24:24,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 538/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 2.1256501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:24,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43593 samples/s/p 3:45:57 } +2024-07-25 21:24:27,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 540/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 2.125078e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:27,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43524 samples/s/p 3:45:55 } +2024-07-25 21:24:30,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 542/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 2.1245063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:30,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43653 samples/s/p 3:45:49 } +2024-07-25 21:24:33,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 544/ 1625], loss: 
1.255, per_step_time: 1472ms, lr: 2.1239342e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:33,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.3% |█████████████████████ | 5.43262 samples/s/p 3:45:56 } +2024-07-25 21:24:36,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 546/ 1625], loss: 1.232, per_step_time: 1470ms, lr: 2.1233622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:36,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.44120 samples/s/p 3:45:32 } +2024-07-25 21:24:39,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 548/ 1625], loss: 1.336, per_step_time: 1472ms, lr: 2.12279e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:39,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43344 samples/s/p 3:45:48 } +2024-07-25 21:24:42,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 550/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 2.1222175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:42,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43900 samples/s/p 3:45:31 } +2024-07-25 21:24:45,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 552/ 1625], loss: 0.972, per_step_time: 1471ms, lr: 2.121645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:45,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43686 samples/s/p 3:45:34 } +2024-07-25 21:24:48,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 554/ 1625], loss: 0.905, per_step_time: 1470ms, lr: 2.1210728e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:48,085 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43929 samples/s/p 3:45:25 } +2024-07-25 21:24:51,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 556/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 2.1204998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:51,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43149 samples/s/p 3:45:41 } +2024-07-25 21:24:53,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 558/ 1625], loss: 1.230, per_step_time: 1470ms, lr: 2.119927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:53,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.44021 samples/s/p 3:45:17 } +2024-07-25 21:24:56,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 560/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.1193544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:56,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.4% |█████████████████████ | 5.43357 samples/s/p 3:45:30 } +2024-07-25 21:24:59,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 562/ 1625], loss: 1.079, per_step_time: 1471ms, lr: 2.1187814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:24:59,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43845 samples/s/p 3:45:15 } +2024-07-25 21:25:02,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 564/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 2.118208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:02,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43768 samples/s/p 3:45:14 } +2024-07-25 
21:25:05,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 566/ 1625], loss: 1.114, per_step_time: 1469ms, lr: 2.1176353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:05,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.44254 samples/s/p 3:44:59 } +2024-07-25 21:25:08,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 568/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 2.117062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:08,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43252 samples/s/p 3:45:21 } +2024-07-25 21:25:11,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 570/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 2.1164886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:11,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.42868 samples/s/p 3:45:28 } +2024-07-25 21:25:14,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 572/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 2.1159149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:14,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43229 samples/s/p 3:45:16 } +2024-07-25 21:25:17,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 574/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 2.1153413e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:17,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43589 samples/s/p 3:45:04 } +2024-07-25 21:25:20,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 576/ 1625], loss: 1.275, 
per_step_time: 1473ms, lr: 2.1147678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:20,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.5% |█████████████████████ | 5.43065 samples/s/p 3:45:14 } +2024-07-25 21:25:23,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 578/ 1625], loss: 0.930, per_step_time: 1469ms, lr: 2.1141937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:23,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.44468 samples/s/p 3:44:36 } +2024-07-25 21:25:26,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 580/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 2.1136198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:26,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.43276 samples/s/p 3:45:03 } +2024-07-25 21:25:29,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 582/ 1625], loss: 1.226, per_step_time: 1474ms, lr: 2.113046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:29,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.42384 samples/s/p 3:45:22 } +2024-07-25 21:25:32,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 584/ 1625], loss: 1.101, per_step_time: 1473ms, lr: 2.1124719e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:32,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.42787 samples/s/p 3:45:09 } +2024-07-25 21:25:35,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 586/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.1118974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:35,305 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.43394 samples/s/p 3:44:51 } +2024-07-25 21:25:38,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 588/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.1113232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:38,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.43703 samples/s/p 3:44:40 } +2024-07-25 21:25:41,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 590/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 2.110749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:41,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.43221 samples/s/p 3:44:49 } +2024-07-25 21:25:44,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 592/ 1625], loss: 1.174, per_step_time: 1473ms, lr: 2.1101741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:44,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.6% |█████████████████████ | 5.42748 samples/s/p 3:44:58 } +2024-07-25 21:25:47,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 594/ 1625], loss: 0.993, per_step_time: 1471ms, lr: 2.1095995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:47,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.43623 samples/s/p 3:44:34 } +2024-07-25 21:25:50,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 596/ 1625], loss: 1.296, per_step_time: 1471ms, lr: 2.1090249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:50,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.43563 samples/s/p 3:44:32 } 
+2024-07-25 21:25:53,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 598/ 1625], loss: 1.360, per_step_time: 1470ms, lr: 2.1084501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:53,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.44036 samples/s/p 3:44:17 } +2024-07-25 21:25:55,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 600/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 2.107875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:55,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.44013 samples/s/p 3:44:15 } +2024-07-25 21:25:58,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 602/ 1625], loss: 1.189, per_step_time: 1470ms, lr: 2.1073e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:25:58,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.43918 samples/s/p 3:44:14 } +2024-07-25 21:26:01,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 604/ 1625], loss: 1.125, per_step_time: 1474ms, lr: 2.106725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:01,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.42721 samples/s/p 3:44:41 } +2024-07-25 21:26:04,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 606/ 1625], loss: 1.317, per_step_time: 1472ms, lr: 2.1061498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:04,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.43148 samples/s/p 3:44:28 } +2024-07-25 21:26:07,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 608/ 1625], loss: 
1.133, per_step_time: 1474ms, lr: 2.1055741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:07,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.7% |█████████████████████ | 5.42631 samples/s/p 3:44:38 } +2024-07-25 21:26:10,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 610/ 1625], loss: 1.201, per_step_time: 1470ms, lr: 2.104999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:10,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.44190 samples/s/p 3:43:56 } +2024-07-25 21:26:13,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 612/ 1625], loss: 1.081, per_step_time: 1469ms, lr: 2.1044234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:13,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.44322 samples/s/p 3:43:50 } +2024-07-25 21:26:16,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 614/ 1625], loss: 1.191, per_step_time: 1470ms, lr: 2.1038477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:16,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43928 samples/s/p 3:43:57 } +2024-07-25 21:26:19,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 616/ 1625], loss: 1.025, per_step_time: 1472ms, lr: 2.1032718e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:19,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43435 samples/s/p 3:44:06 } +2024-07-25 21:26:22,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 618/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 2.1026959e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:22,517 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43252 samples/s/p 3:44:07 } +2024-07-25 21:26:25,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 620/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 2.1021202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:25,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43373 samples/s/p 3:44:01 } +2024-07-25 21:26:28,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 622/ 1625], loss: 1.302, per_step_time: 1471ms, lr: 2.101544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:28,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.43514 samples/s/p 3:43:55 } +2024-07-25 21:26:31,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 624/ 1625], loss: 1.141, per_step_time: 1475ms, lr: 2.1009677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:31,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.8% |█████████████████████ | 5.42210 samples/s/p 3:44:24 } +2024-07-25 21:26:34,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 626/ 1625], loss: 1.191, per_step_time: 1474ms, lr: 2.1003914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:34,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.42444 samples/s/p 3:44:16 } +2024-07-25 21:26:37,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 628/ 1625], loss: 1.325, per_step_time: 1484ms, lr: 2.0998152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:37,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.38932 samples/s/p 3:45:40 } 
+2024-07-25 21:26:40,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 630/ 1625], loss: 0.967, per_step_time: 1469ms, lr: 2.0992386e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:40,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.44316 samples/s/p 3:43:23 } +2024-07-25 21:26:43,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 632/ 1625], loss: 1.023, per_step_time: 1470ms, lr: 2.0986621e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:43,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.43949 samples/s/p 3:43:30 } +2024-07-25 21:26:46,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 634/ 1625], loss: 1.285, per_step_time: 1477ms, lr: 2.0980855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:46,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.41428 samples/s/p 3:44:29 } +2024-07-25 21:26:49,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 636/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.0975087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:49,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.43644 samples/s/p 3:43:31 } +2024-07-25 21:26:52,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 638/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 2.0969317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:52,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.43667 samples/s/p 3:43:28 } +2024-07-25 21:26:55,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 640/ 1625], loss: 
1.043, per_step_time: 1472ms, lr: 2.0963547e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:55,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 43.9% |█████████████████████ | 5.43456 samples/s/p 3:43:30 } +2024-07-25 21:26:57,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 642/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 2.0957777e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:26:57,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.43369 samples/s/p 3:43:29 } +2024-07-25 21:27:00,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 644/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.0952004e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:00,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.43422 samples/s/p 3:43:25 } +2024-07-25 21:27:03,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 646/ 1625], loss: 0.978, per_step_time: 1470ms, lr: 2.094623e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:03,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.43950 samples/s/p 3:43:09 } +2024-07-25 21:27:06,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 648/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 2.0940459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:06,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |█████████████████████ | 5.43740 samples/s/p 3:43:11 } +2024-07-25 21:27:09,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 650/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 2.0934684e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:09,777 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.42965 samples/s/p 3:43:27 } +2024-07-25 21:27:12,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 652/ 1625], loss: 0.972, per_step_time: 1473ms, lr: 2.0928905e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:12,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.43033 samples/s/p 3:43:23 } +2024-07-25 21:27:15,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 654/ 1625], loss: 1.386, per_step_time: 1470ms, lr: 2.0923131e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:15,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.43917 samples/s/p 3:42:58 } +2024-07-25 21:27:18,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 656/ 1625], loss: 0.980, per_step_time: 1473ms, lr: 2.0917352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:18,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.42890 samples/s/p 3:43:20 } +2024-07-25 21:27:21,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 658/ 1625], loss: 1.278, per_step_time: 1473ms, lr: 2.0911573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:21,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.0% |██████████████████████ | 5.42824 samples/s/p 3:43:19 } +2024-07-25 21:27:24,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 660/ 1625], loss: 1.027, per_step_time: 1482ms, lr: 2.0905793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:24,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.39450 samples/s/p 3:44:40 } 
+2024-07-25 21:27:27,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 662/ 1625], loss: 1.356, per_step_time: 1473ms, lr: 2.0900014e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:27,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.42897 samples/s/p 3:43:11 } +2024-07-25 21:27:30,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 664/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 2.0894231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:30,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43823 samples/s/p 3:42:46 } +2024-07-25 21:27:33,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 666/ 1625], loss: 1.173, per_step_time: 1470ms, lr: 2.0888447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:33,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43895 samples/s/p 3:42:41 } +2024-07-25 21:27:36,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 668/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.0882664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:36,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43347 samples/s/p 3:42:51 } +2024-07-25 21:27:39,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 670/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 2.087688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:39,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43411 samples/s/p 3:42:47 } +2024-07-25 21:27:42,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 672/ 1625], 
loss: 1.095, per_step_time: 1470ms, lr: 2.0871095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:42,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.44120 samples/s/p 3:42:27 } +2024-07-25 21:27:45,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 674/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 2.0865305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:45,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.1% |██████████████████████ | 5.43103 samples/s/p 3:42:49 } +2024-07-25 21:27:48,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 676/ 1625], loss: 0.871, per_step_time: 1471ms, lr: 2.085952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:48,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43589 samples/s/p 3:42:34 } +2024-07-25 21:27:51,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 678/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 2.085373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:51,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43807 samples/s/p 3:42:25 } +2024-07-25 21:27:54,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 680/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 2.0847941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:54,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43333 samples/s/p 3:42:34 } +2024-07-25 21:27:57,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 682/ 1625], loss: 1.056, per_step_time: 1473ms, lr: 2.084215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:57,024 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.42861 samples/s/p 3:42:43 } +2024-07-25 21:27:59,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 684/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 2.0836358e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:27:59,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43579 samples/s/p 3:42:22 } +2024-07-25 21:28:02,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 686/ 1625], loss: 1.146, per_step_time: 1469ms, lr: 2.0830565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:02,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.44228 samples/s/p 3:42:03 } +2024-07-25 21:28:05,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 688/ 1625], loss: 1.201, per_step_time: 1471ms, lr: 2.0824771e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:05,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43529 samples/s/p 3:42:18 } +2024-07-25 21:28:08,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 690/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 2.0818976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:08,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.2% |██████████████████████ | 5.43619 samples/s/p 3:42:12 } +2024-07-25 21:28:11,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 692/ 1625], loss: 1.278, per_step_time: 1470ms, lr: 2.081318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:11,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43943 samples/s/p 3:42:01 } 
+2024-07-25 21:28:14,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 694/ 1625], loss: 1.112, per_step_time: 1470ms, lr: 2.0807383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:14,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.44117 samples/s/p 3:41:54 } +2024-07-25 21:28:17,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 696/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 2.0801584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:17,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43637 samples/s/p 3:42:03 } +2024-07-25 21:28:20,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 698/ 1625], loss: 1.093, per_step_time: 1474ms, lr: 2.0795787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:20,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.42627 samples/s/p 3:42:25 } +2024-07-25 21:28:23,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 700/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 2.0789988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:23,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43332 samples/s/p 3:42:05 } +2024-07-25 21:28:26,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 702/ 1625], loss: 0.915, per_step_time: 1472ms, lr: 2.0784188e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:26,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43356 samples/s/p 3:42:01 } +2024-07-25 21:28:29,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 704/ 1625], 
loss: 1.225, per_step_time: 1473ms, lr: 2.0778387e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:29,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.43100 samples/s/p 3:42:04 } +2024-07-25 21:28:32,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 706/ 1625], loss: 1.000, per_step_time: 1470ms, lr: 2.0772584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:32,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.3% |██████████████████████ | 5.44048 samples/s/p 3:41:38 } +2024-07-25 21:28:35,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 708/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 2.076678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:35,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43688 samples/s/p 3:41:44 } +2024-07-25 21:28:38,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 710/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.0760977e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:38,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43332 samples/s/p 3:41:50 } +2024-07-25 21:28:41,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 712/ 1625], loss: 1.262, per_step_time: 1473ms, lr: 2.075517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:41,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.42934 samples/s/p 3:41:57 } +2024-07-25 21:28:44,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 714/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.0749363e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:44,237 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43150 samples/s/p 3:41:49 } +2024-07-25 21:28:47,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 716/ 1625], loss: 1.010, per_step_time: 1473ms, lr: 2.0743557e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:47,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43096 samples/s/p 3:41:47 } +2024-07-25 21:28:50,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 718/ 1625], loss: 1.174, per_step_time: 1474ms, lr: 2.0737749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:50,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.42492 samples/s/p 3:41:59 } +2024-07-25 21:28:53,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 720/ 1625], loss: 1.335, per_step_time: 1472ms, lr: 2.0731939e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:53,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43329 samples/s/p 3:41:35 } +2024-07-25 21:28:56,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 722/ 1625], loss: 0.934, per_step_time: 1471ms, lr: 2.0726127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:56,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.4% |██████████████████████ | 5.43655 samples/s/p 3:41:24 } +2024-07-25 21:28:58,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 724/ 1625], loss: 1.010, per_step_time: 1471ms, lr: 2.0720316e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:28:58,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43575 samples/s/p 3:41:23 } 
+2024-07-25 21:29:01,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 726/ 1625], loss: 1.059, per_step_time: 1471ms, lr: 2.0714504e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:01,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43774 samples/s/p 3:41:16 } +2024-07-25 21:29:04,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 728/ 1625], loss: 1.199, per_step_time: 1473ms, lr: 2.070869e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:04,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43094 samples/s/p 3:41:29 } +2024-07-25 21:29:07,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 730/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.0702877e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:07,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43178 samples/s/p 3:41:24 } +2024-07-25 21:29:10,804 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 732/ 1625], loss: 1.021, per_step_time: 1471ms, lr: 2.0697064e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:10,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43541 samples/s/p 3:41:12 } +2024-07-25 21:29:13,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 734/ 1625], loss: 1.251, per_step_time: 1470ms, lr: 2.0691246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:13,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.44003 samples/s/p 3:40:58 } +2024-07-25 21:29:16,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 736/ 1625], 
loss: 1.297, per_step_time: 1473ms, lr: 2.0685427e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:16,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.42808 samples/s/p 3:41:24 } +2024-07-25 21:29:19,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 738/ 1625], loss: 1.010, per_step_time: 1471ms, lr: 2.067961e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:19,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.5% |██████████████████████ | 5.43736 samples/s/p 3:40:59 } +2024-07-25 21:29:22,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 740/ 1625], loss: 0.985, per_step_time: 1471ms, lr: 2.0673793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:22,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43543 samples/s/p 3:41:01 } +2024-07-25 21:29:25,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 742/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 2.066797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:25,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43284 samples/s/p 3:41:04 } +2024-07-25 21:29:28,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 744/ 1625], loss: 1.226, per_step_time: 1473ms, lr: 2.0662152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:28,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43078 samples/s/p 3:41:06 } +2024-07-25 21:29:31,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 746/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 2.0656329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:31,461 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.44058 samples/s/p 3:40:39 } +2024-07-25 21:29:34,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 748/ 1625], loss: 1.234, per_step_time: 1473ms, lr: 2.0650506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:34,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43052 samples/s/p 3:41:01 } +2024-07-25 21:29:37,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 750/ 1625], loss: 1.084, per_step_time: 1470ms, lr: 2.0644682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:37,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43954 samples/s/p 3:40:36 } +2024-07-25 21:29:40,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 752/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.0638858e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:40,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43223 samples/s/p 3:40:51 } +2024-07-25 21:29:43,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 754/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 2.0633033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:43,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.6% |██████████████████████ | 5.43146 samples/s/p 3:40:50 } +2024-07-25 21:29:46,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 756/ 1625], loss: 1.096, per_step_time: 1470ms, lr: 2.0627205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:46,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43848 samples/s/p 3:40:30 } 
+2024-07-25 21:29:49,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 758/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 2.0621379e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:49,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43659 samples/s/p 3:40:31 } +2024-07-25 21:29:52,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 760/ 1625], loss: 1.150, per_step_time: 1469ms, lr: 2.061555e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:52,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.44220 samples/s/p 3:40:15 } +2024-07-25 21:29:55,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 762/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 2.0609721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:55,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43729 samples/s/p 3:40:24 } +2024-07-25 21:29:58,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 764/ 1625], loss: 1.228, per_step_time: 1470ms, lr: 2.060389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:29:58,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43938 samples/s/p 3:40:16 } +2024-07-25 21:30:00,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 766/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 2.0598058e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:00,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43514 samples/s/p 3:40:23 } +2024-07-25 21:30:03,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 768/ 1625], 
loss: 1.248, per_step_time: 1470ms, lr: 2.0592226e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:03,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.43963 samples/s/p 3:40:09 } +2024-07-25 21:30:06,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 770/ 1625], loss: 1.113, per_step_time: 1469ms, lr: 2.0586393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:06,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.7% |██████████████████████ | 5.44218 samples/s/p 3:40:00 } +2024-07-25 21:30:09,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 772/ 1625], loss: 1.294, per_step_time: 1473ms, lr: 2.0580559e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:09,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43013 samples/s/p 3:40:26 } +2024-07-25 21:30:12,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 774/ 1625], loss: 1.265, per_step_time: 1472ms, lr: 2.0574724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:12,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43188 samples/s/p 3:40:19 } +2024-07-25 21:30:15,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 776/ 1625], loss: 1.111, per_step_time: 1473ms, lr: 2.056889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:15,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43020 samples/s/p 3:40:20 } +2024-07-25 21:30:18,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 778/ 1625], loss: 1.016, per_step_time: 1471ms, lr: 2.0563051e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:18,668 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43644 samples/s/p 3:40:02 } +2024-07-25 21:30:21,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 780/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.0557212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:21,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43695 samples/s/p 3:39:58 } +2024-07-25 21:30:24,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 782/ 1625], loss: 1.120, per_step_time: 1470ms, lr: 2.0551375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:24,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.44191 samples/s/p 3:39:43 } +2024-07-25 21:30:27,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 784/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 2.0545536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:27,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43274 samples/s/p 3:40:02 } +2024-07-25 21:30:30,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 786/ 1625], loss: 0.979, per_step_time: 1470ms, lr: 2.0539694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:30,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.44090 samples/s/p 3:39:40 } +2024-07-25 21:30:33,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 788/ 1625], loss: 1.204, per_step_time: 1470ms, lr: 2.0533853e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:33,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.8% |██████████████████████ | 5.43982 samples/s/p 3:39:39 } 
+2024-07-25 21:30:36,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 790/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 2.052801e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:36,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43809 samples/s/p 3:39:41 } +2024-07-25 21:30:39,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 792/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 2.0522168e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:39,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43714 samples/s/p 3:39:40 } +2024-07-25 21:30:42,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 794/ 1625], loss: 1.101, per_step_time: 1473ms, lr: 2.0516321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:42,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.42939 samples/s/p 3:39:56 } +2024-07-25 21:30:45,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 796/ 1625], loss: 1.198, per_step_time: 1470ms, lr: 2.0510477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:45,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43930 samples/s/p 3:39:29 } +2024-07-25 21:30:48,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 798/ 1625], loss: 1.084, per_step_time: 1472ms, lr: 2.0504633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:48,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43467 samples/s/p 3:39:37 } +2024-07-25 21:30:51,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 800/ 1625], 
loss: 1.069, per_step_time: 1471ms, lr: 2.0498783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:51,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43832 samples/s/p 3:39:25 } +2024-07-25 21:30:54,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 802/ 1625], loss: 1.080, per_step_time: 1473ms, lr: 2.0492935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:54,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.42983 samples/s/p 3:39:43 } +2024-07-25 21:30:57,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 804/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 2.0487088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:57,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 44.9% |██████████████████████ | 5.43261 samples/s/p 3:39:33 } +2024-07-25 21:30:59,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 806/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 2.0481237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:30:59,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43835 samples/s/p 3:39:16 } +2024-07-25 21:31:02,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 808/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 2.0475385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:02,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43324 samples/s/p 3:39:26 } +2024-07-25 21:31:05,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 810/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 2.0469535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:05,875 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43017 samples/s/p 3:39:30 } +2024-07-25 21:31:08,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 812/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 2.0463682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:08,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43164 samples/s/p 3:39:24 } +2024-07-25 21:31:11,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 814/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.0457828e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:11,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43623 samples/s/p 3:39:10 } +2024-07-25 21:31:14,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 816/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 2.0451973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:14,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43224 samples/s/p 3:39:17 } +2024-07-25 21:31:17,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 818/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 2.044612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:17,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43399 samples/s/p 3:39:09 } +2024-07-25 21:31:20,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 820/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 2.0440262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:20,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.0% |██████████████████████ | 5.43830 samples/s/p 3:38:56 } 
+2024-07-25 21:31:23,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 822/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 2.0434405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:23,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43255 samples/s/p 3:39:07 } +2024-07-25 21:31:26,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 824/ 1625], loss: 1.036, per_step_time: 1476ms, lr: 2.0428546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:26,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.41854 samples/s/p 3:39:38 } +2024-07-25 21:31:29,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 826/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 2.0422689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:29,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43419 samples/s/p 3:38:57 } +2024-07-25 21:31:32,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 828/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 2.0416826e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:32,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43255 samples/s/p 3:38:58 } +2024-07-25 21:31:35,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 830/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 2.0410966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:35,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43589 samples/s/p 3:38:47 } +2024-07-25 21:31:38,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 832/ 1625], 
loss: 1.395, per_step_time: 1473ms, lr: 2.0405107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:38,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.42960 samples/s/p 3:38:59 } +2024-07-25 21:31:41,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 834/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 2.0399242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:41,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.44042 samples/s/p 3:38:30 } +2024-07-25 21:31:44,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 836/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 2.039338e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:44,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.1% |██████████████████████ | 5.43564 samples/s/p 3:38:39 } +2024-07-25 21:31:47,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 838/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 2.0387515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:47,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.42838 samples/s/p 3:38:53 } +2024-07-25 21:31:50,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 840/ 1625], loss: 0.995, per_step_time: 1473ms, lr: 2.0381647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:50,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.42979 samples/s/p 3:38:47 } +2024-07-25 21:31:53,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 842/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 2.037578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:53,104 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.44102 samples/s/p 3:38:17 } +2024-07-25 21:31:56,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 844/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 2.0369915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:56,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.43345 samples/s/p 3:38:32 } +2024-07-25 21:31:59,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 846/ 1625], loss: 1.166, per_step_time: 1470ms, lr: 2.0364047e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:31:59,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.44213 samples/s/p 3:38:08 } +2024-07-25 21:32:01,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 848/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 2.035818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:01,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.43139 samples/s/p 3:38:31 } +2024-07-25 21:32:04,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 850/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 2.0352309e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:04,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.43534 samples/s/p 3:38:19 } +2024-07-25 21:32:07,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 852/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 2.0346435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:07,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.2% |██████████████████████ | 5.43317 samples/s/p 3:38:21 } 
+2024-07-25 21:32:10,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 854/ 1625], loss: 0.939, per_step_time: 1471ms, lr: 2.0340565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:10,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43507 samples/s/p 3:38:14 } +2024-07-25 21:32:13,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 856/ 1625], loss: 1.208, per_step_time: 1470ms, lr: 2.0334694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:13,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43882 samples/s/p 3:38:02 } +2024-07-25 21:32:16,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 858/ 1625], loss: 1.230, per_step_time: 1470ms, lr: 2.032882e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:16,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43873 samples/s/p 3:37:59 } +2024-07-25 21:32:19,659 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 860/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 2.0322945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:19,659 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43152 samples/s/p 3:38:13 } +2024-07-25 21:32:22,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 862/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 2.031707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:22,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43439 samples/s/p 3:38:04 } +2024-07-25 21:32:25,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 864/ 1625], 
loss: 1.254, per_step_time: 1471ms, lr: 2.0311192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:25,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43631 samples/s/p 3:37:56 } +2024-07-25 21:32:28,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 866/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 2.0305315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:28,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43259 samples/s/p 3:38:02 } +2024-07-25 21:32:31,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 868/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 2.0299438e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:31,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.3% |██████████████████████ | 5.43172 samples/s/p 3:38:01 } +2024-07-25 21:32:34,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 870/ 1625], loss: 1.496, per_step_time: 1473ms, lr: 2.0293563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:34,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43091 samples/s/p 3:38:00 } +2024-07-25 21:32:37,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 872/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 2.0287682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:37,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43788 samples/s/p 3:37:40 } +2024-07-25 21:32:40,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 874/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 2.0281801e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:40,322 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.42889 samples/s/p 3:37:59 } +2024-07-25 21:32:43,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 876/ 1625], loss: 1.132, per_step_time: 1469ms, lr: 2.0275918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:43,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.44413 samples/s/p 3:37:20 } +2024-07-25 21:32:46,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 878/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 2.0270036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:46,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43498 samples/s/p 3:37:39 } +2024-07-25 21:32:49,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 880/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 2.0264153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:49,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43726 samples/s/p 3:37:30 } +2024-07-25 21:32:52,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 882/ 1625], loss: 1.227, per_step_time: 1469ms, lr: 2.0258269e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:52,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.44341 samples/s/p 3:37:13 } +2024-07-25 21:32:55,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 884/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 2.0252384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:55,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.4% |██████████████████████ | 5.43739 samples/s/p 3:37:24 } 
+2024-07-25 21:32:58,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 886/ 1625], loss: 1.130, per_step_time: 1474ms, lr: 2.0246498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:32:58,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.42633 samples/s/p 3:37:48 } +2024-07-25 21:33:00,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 888/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 2.0240614e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:00,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43390 samples/s/p 3:37:26 } +2024-07-25 21:33:03,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 890/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 2.0234722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:03,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43248 samples/s/p 3:37:27 } +2024-07-25 21:33:06,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 892/ 1625], loss: 1.001, per_step_time: 1471ms, lr: 2.0228836e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:06,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43514 samples/s/p 3:37:18 } +2024-07-25 21:33:09,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 894/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 2.0222948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:09,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43767 samples/s/p 3:37:09 } +2024-07-25 21:33:12,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 896/ 1625], 
loss: 1.188, per_step_time: 1472ms, lr: 2.0217056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:12,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43477 samples/s/p 3:37:13 } +2024-07-25 21:33:15,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 898/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 2.0211166e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:15,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43840 samples/s/p 3:37:01 } +2024-07-25 21:33:18,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 900/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 2.0205272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:18,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.5% |██████████████████████ | 5.43617 samples/s/p 3:37:03 } +2024-07-25 21:33:21,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 902/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 2.019938e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:21,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43434 samples/s/p 3:37:05 } +2024-07-25 21:33:24,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 904/ 1625], loss: 1.084, per_step_time: 1472ms, lr: 2.0193487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:24,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43468 samples/s/p 3:37:01 } +2024-07-25 21:33:27,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 906/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 2.0187592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:27,527 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43475 samples/s/p 3:36:58 } +2024-07-25 21:33:30,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 908/ 1625], loss: 1.158, per_step_time: 1474ms, lr: 2.0181697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:30,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.42698 samples/s/p 3:37:14 } +2024-07-25 21:33:33,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 910/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 2.0175801e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:33,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43755 samples/s/p 3:36:45 } +2024-07-25 21:33:36,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 912/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 2.0169902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:36,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43498 samples/s/p 3:36:49 } +2024-07-25 21:33:39,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 914/ 1625], loss: 1.225, per_step_time: 1470ms, lr: 2.0164005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:39,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43931 samples/s/p 3:36:35 } +2024-07-25 21:33:42,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 916/ 1625], loss: 1.342, per_step_time: 1472ms, lr: 2.0158106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:42,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43351 samples/s/p 3:36:46 } 
+2024-07-25 21:33:45,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 918/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.0152207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:45,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.6% |██████████████████████ | 5.43423 samples/s/p 3:36:42 } +2024-07-25 21:33:48,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 920/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 2.0146306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:48,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43712 samples/s/p 3:36:32 } +2024-07-25 21:33:51,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 922/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.0140405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:51,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43490 samples/s/p 3:36:34 } +2024-07-25 21:33:54,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 924/ 1625], loss: 1.096, per_step_time: 1473ms, lr: 2.0134501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:54,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.42926 samples/s/p 3:36:45 } +2024-07-25 21:33:57,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 926/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.0128598e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:57,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43204 samples/s/p 3:36:35 } +2024-07-25 21:33:59,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 928/ 1625], 
loss: 1.233, per_step_time: 1472ms, lr: 2.0122696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:33:59,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43282 samples/s/p 3:36:30 } +2024-07-25 21:34:02,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 930/ 1625], loss: 1.146, per_step_time: 1474ms, lr: 2.011679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:02,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.42505 samples/s/p 3:36:46 } +2024-07-25 21:34:05,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 932/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 2.0110887e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:05,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43690 samples/s/p 3:36:15 } +2024-07-25 21:34:08,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 934/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.0104979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:08,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.7% |██████████████████████ | 5.43392 samples/s/p 3:36:19 } +2024-07-25 21:34:11,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 936/ 1625], loss: 1.020, per_step_time: 1472ms, lr: 2.009907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:11,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43404 samples/s/p 3:36:15 } +2024-07-25 21:34:14,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 938/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.0093163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:14,752 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43608 samples/s/p 3:36:08 } +2024-07-25 21:34:17,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 940/ 1625], loss: 1.311, per_step_time: 1471ms, lr: 2.0087255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:17,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43702 samples/s/p 3:36:02 } +2024-07-25 21:34:20,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 942/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 2.0081343e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:20,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43391 samples/s/p 3:36:07 } +2024-07-25 21:34:23,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 944/ 1625], loss: 1.009, per_step_time: 1472ms, lr: 2.0075433e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:23,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43450 samples/s/p 3:36:03 } +2024-07-25 21:34:26,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 946/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 2.0069521e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:26,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43708 samples/s/p 3:35:54 } +2024-07-25 21:34:29,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 948/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 2.0063608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:29,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43251 samples/s/p 3:36:01 } 
+2024-07-25 21:34:32,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 950/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 2.0057694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:32,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.8% |██████████████████████ | 5.43531 samples/s/p 3:35:52 } +2024-07-25 21:34:35,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 952/ 1625], loss: 1.193, per_step_time: 1473ms, lr: 2.005178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:35,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.42975 samples/s/p 3:36:02 } +2024-07-25 21:34:38,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 954/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.0045867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:38,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43459 samples/s/p 3:35:48 } +2024-07-25 21:34:41,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 956/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 2.003995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:41,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43063 samples/s/p 3:35:54 } +2024-07-25 21:34:44,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 958/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 2.0034033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:44,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43535 samples/s/p 3:35:40 } +2024-07-25 21:34:47,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 960/ 1625], 
loss: 1.185, per_step_time: 1469ms, lr: 2.0028117e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:47,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.44313 samples/s/p 3:35:19 } +2024-07-25 21:34:50,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 962/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 2.0022198e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:50,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43804 samples/s/p 3:35:28 } +2024-07-25 21:34:53,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 964/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.0016278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:53,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43471 samples/s/p 3:35:33 } +2024-07-25 21:34:56,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 966/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 2.0010359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:56,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 45.9% |██████████████████████ | 5.43362 samples/s/p 3:35:32 } +2024-07-25 21:34:59,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 968/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.0004436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:34:59,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.43609 samples/s/p 3:35:24 } +2024-07-25 21:35:01,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 970/ 1625], loss: 1.516, per_step_time: 1472ms, lr: 1.9998517e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:01,968 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.43150 samples/s/p 3:35:31 } +2024-07-25 21:35:04,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 972/ 1625], loss: 1.107, per_step_time: 1473ms, lr: 1.9992593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:04,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.43081 samples/s/p 3:35:30 } +2024-07-25 21:35:07,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 974/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 1.998667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:07,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |██████████████████████ | 5.43158 samples/s/p 3:35:25 } +2024-07-25 21:35:10,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 976/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 1.9980747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:10,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.43570 samples/s/p 3:35:13 } +2024-07-25 21:35:13,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 978/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 1.997482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:13,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.43575 samples/s/p 3:35:10 } +2024-07-25 21:35:16,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 980/ 1625], loss: 1.328, per_step_time: 1473ms, lr: 1.9968895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:16,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.42921 samples/s/p 3:35:22 } 
+2024-07-25 21:35:19,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 982/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 1.9962969e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:19,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.0% |███████████████████████ | 5.43647 samples/s/p 3:35:02 } +2024-07-25 21:35:22,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 984/ 1625], loss: 1.296, per_step_time: 1472ms, lr: 1.9957042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:22,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43222 samples/s/p 3:35:09 } +2024-07-25 21:35:25,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 986/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 1.995111e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:25,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.42875 samples/s/p 3:35:14 } +2024-07-25 21:35:28,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 988/ 1625], loss: 1.168, per_step_time: 1475ms, lr: 1.9945184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:28,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.42221 samples/s/p 3:35:27 } +2024-07-25 21:35:31,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 990/ 1625], loss: 1.241, per_step_time: 1474ms, lr: 1.9939254e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:31,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.42729 samples/s/p 3:35:12 } +2024-07-25 21:35:34,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 992/ 
1625], loss: 1.309, per_step_time: 1472ms, lr: 1.9933323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:34,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43220 samples/s/p 3:34:57 } +2024-07-25 21:35:37,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 994/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.992739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:37,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43286 samples/s/p 3:34:53 } +2024-07-25 21:35:40,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 996/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 1.992146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:40,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43886 samples/s/p 3:34:36 } +2024-07-25 21:35:43,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 998/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.9915527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:43,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.1% |███████████████████████ | 5.43653 samples/s/p 3:34:38 } +2024-07-25 21:35:46,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1000/ 1625], loss: 1.265, per_step_time: 1470ms, lr: 1.9909592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:46,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.44155 samples/s/p 3:34:23 } +2024-07-25 21:35:49,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1002/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 1.9903657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:49,195 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.44078 samples/s/p 3:34:22 } +2024-07-25 21:35:52,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1004/ 1625], loss: 1.021, per_step_time: 1472ms, lr: 1.9897721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:52,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43413 samples/s/p 3:34:35 } +2024-07-25 21:35:55,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1006/ 1625], loss: 1.312, per_step_time: 1470ms, lr: 1.9891784e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:55,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.44028 samples/s/p 3:34:18 } +2024-07-25 21:35:58,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1008/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.9885845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:35:58,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43296 samples/s/p 3:34:32 } +2024-07-25 21:36:00,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1010/ 1625], loss: 1.281, per_step_time: 1470ms, lr: 1.987991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:00,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43876 samples/s/p 3:34:15 } +2024-07-25 21:36:03,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1012/ 1625], loss: 1.063, per_step_time: 1472ms, lr: 1.987397e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:03,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43221 samples/s/p 
3:34:28 } +2024-07-25 21:36:06,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1014/ 1625], loss: 1.076, per_step_time: 1472ms, lr: 1.9868032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:06,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.2% |███████████████████████ | 5.43270 samples/s/p 3:34:24 } +2024-07-25 21:36:09,854 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1016/ 1625], loss: 1.047, per_step_time: 1474ms, lr: 1.986209e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:09,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.42638 samples/s/p 3:34:36 } +2024-07-25 21:36:12,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1018/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 1.9856148e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:12,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43316 samples/s/p 3:34:17 } +2024-07-25 21:36:15,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1020/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 1.9850208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:15,759 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43162 samples/s/p 3:34:18 } +2024-07-25 21:36:18,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1022/ 1625], loss: 1.033, per_step_time: 1472ms, lr: 1.9844263e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:18,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43188 samples/s/p 3:34:14 } +2024-07-25 21:36:21,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], 
step:[ 1024/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 1.9838319e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:21,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43227 samples/s/p 3:34:10 } +2024-07-25 21:36:24,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1026/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 1.9832376e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:24,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43652 samples/s/p 3:33:57 } +2024-07-25 21:36:27,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1028/ 1625], loss: 1.186, per_step_time: 1473ms, lr: 1.982643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:27,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43088 samples/s/p 3:34:08 } +2024-07-25 21:36:30,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1030/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 1.9820483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:30,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.3% |███████████████████████ | 5.43234 samples/s/p 3:34:01 } +2024-07-25 21:36:33,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1032/ 1625], loss: 1.327, per_step_time: 1472ms, lr: 1.9814537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:33,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43255 samples/s/p 3:33:58 } +2024-07-25 21:36:36,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1034/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.980859e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:36:36,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43733 samples/s/p 3:33:43 } +2024-07-25 21:36:39,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1036/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 1.9802641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:39,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43297 samples/s/p 3:33:51 } +2024-07-25 21:36:42,322 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1038/ 1625], loss: 1.288, per_step_time: 1470ms, lr: 1.9796691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:42,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43991 samples/s/p 3:33:31 } +2024-07-25 21:36:45,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1040/ 1625], loss: 1.038, per_step_time: 1473ms, lr: 1.9790741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:45,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43091 samples/s/p 3:33:50 } +2024-07-25 21:36:48,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1042/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 1.978479e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:48,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43784 samples/s/p 3:33:30 } +2024-07-25 21:36:51,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1044/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 1.977884e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:51,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ 
| 5.43873 samples/s/p 3:33:25 } +2024-07-25 21:36:54,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1046/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 1.9772886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:54,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43505 samples/s/p 3:33:31 } +2024-07-25 21:36:57,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1048/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 1.9766934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:36:57,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.4% |███████████████████████ | 5.43830 samples/s/p 3:33:21 } +2024-07-25 21:37:00,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1050/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 1.9760979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:00,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43728 samples/s/p 3:33:20 } +2024-07-25 21:37:02,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1052/ 1625], loss: 1.098, per_step_time: 1473ms, lr: 1.9755025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:02,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.42971 samples/s/p 3:33:35 } +2024-07-25 21:37:05,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1054/ 1625], loss: 1.008, per_step_time: 1471ms, lr: 1.974907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:05,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43531 samples/s/p 3:33:19 } +2024-07-25 21:37:08,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 5/ 10], step:[ 1056/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.9743113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:08,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43277 samples/s/p 3:33:22 } +2024-07-25 21:37:11,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1058/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.9737156e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:11,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43300 samples/s/p 3:33:18 } +2024-07-25 21:37:14,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1060/ 1625], loss: 1.250, per_step_time: 1481ms, lr: 1.9731197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:14,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.40098 samples/s/p 3:34:31 } +2024-07-25 21:37:17,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1062/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 1.972524e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:17,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.43403 samples/s/p 3:33:10 } +2024-07-25 21:37:20,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1064/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 1.9719278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:20,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.5% |███████████████████████ | 5.42808 samples/s/p 3:33:21 } +2024-07-25 21:37:23,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1066/ 1625], loss: 1.407, per_step_time: 1471ms, lr: 1.971332e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:37:23,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43598 samples/s/p 3:33:00 } +2024-07-25 21:37:26,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1068/ 1625], loss: 0.973, per_step_time: 1472ms, lr: 1.9707357e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:26,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43339 samples/s/p 3:33:03 } +2024-07-25 21:37:29,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1070/ 1625], loss: 1.111, per_step_time: 1473ms, lr: 1.9701396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:29,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.42804 samples/s/p 3:33:12 } +2024-07-25 21:37:32,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1072/ 1625], loss: 1.250, per_step_time: 1470ms, lr: 1.9695433e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:32,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43918 samples/s/p 3:32:43 } +2024-07-25 21:37:35,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1074/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 1.968947e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:35,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43700 samples/s/p 3:32:45 } +2024-07-25 21:37:38,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1076/ 1625], loss: 1.285, per_step_time: 1472ms, lr: 1.9683506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:38,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% 
|███████████████████████ | 5.43405 samples/s/p 3:32:49 } +2024-07-25 21:37:41,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1078/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 1.967754e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:41,366 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43130 samples/s/p 3:32:53 } +2024-07-25 21:37:44,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1080/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 1.9671574e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:44,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.6% |███████████████████████ | 5.43710 samples/s/p 3:32:36 } +2024-07-25 21:37:47,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1082/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.966561e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:47,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43822 samples/s/p 3:32:31 } +2024-07-25 21:37:50,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1084/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 1.9659641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:50,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43294 samples/s/p 3:32:40 } +2024-07-25 21:37:53,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1086/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 1.9653671e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:53,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43556 samples/s/p 3:32:31 } +2024-07-25 21:37:56,119 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1088/ 1625], loss: 0.941, per_step_time: 1472ms, lr: 1.9647705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:56,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43287 samples/s/p 3:32:34 } +2024-07-25 21:37:59,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1090/ 1625], loss: 1.373, per_step_time: 1472ms, lr: 1.9641735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:37:59,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43459 samples/s/p 3:32:27 } +2024-07-25 21:38:02,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1092/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.9635765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:02,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43847 samples/s/p 3:32:15 } +2024-07-25 21:38:04,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1094/ 1625], loss: 0.972, per_step_time: 1471ms, lr: 1.9629793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:04,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43765 samples/s/p 3:32:14 } +2024-07-25 21:38:07,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1096/ 1625], loss: 1.315, per_step_time: 1471ms, lr: 1.9623822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:07,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.7% |███████████████████████ | 5.43537 samples/s/p 3:32:17 } +2024-07-25 21:38:10,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1098/ 1625], loss: 1.292, 
per_step_time: 1472ms, lr: 1.961785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:10,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43417 samples/s/p 3:32:17 } +2024-07-25 21:38:13,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1100/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 1.9611876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:13,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.42894 samples/s/p 3:32:26 } +2024-07-25 21:38:16,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1102/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 1.9605903e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:16,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43499 samples/s/p 3:32:09 } +2024-07-25 21:38:19,725 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1104/ 1625], loss: 0.958, per_step_time: 1470ms, lr: 1.9599927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:19,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43858 samples/s/p 3:31:58 } +2024-07-25 21:38:22,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1106/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 1.9593952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:22,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43302 samples/s/p 3:32:08 } +2024-07-25 21:38:25,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1108/ 1625], loss: 1.193, per_step_time: 1470ms, lr: 1.9587973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:25,624 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.44216 samples/s/p 3:31:43 } +2024-07-25 21:38:28,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1110/ 1625], loss: 0.976, per_step_time: 1471ms, lr: 1.9581998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:28,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.43693 samples/s/p 3:31:53 } +2024-07-25 21:38:31,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1112/ 1625], loss: 1.302, per_step_time: 1473ms, lr: 1.9576019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:31,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.8% |███████████████████████ | 5.42985 samples/s/p 3:32:06 } +2024-07-25 21:38:34,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1114/ 1625], loss: 1.304, per_step_time: 1473ms, lr: 1.957004e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:34,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.42851 samples/s/p 3:32:06 } +2024-07-25 21:38:37,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1116/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.956406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:37,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43567 samples/s/p 3:31:47 } +2024-07-25 21:38:40,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1118/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 1.955808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:40,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43625 samples/s/p 
3:31:42 } +2024-07-25 21:38:43,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1120/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 1.95521e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:43,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.42970 samples/s/p 3:31:55 } +2024-07-25 21:38:46,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1122/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 1.954612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:46,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43622 samples/s/p 3:31:37 } +2024-07-25 21:38:49,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1124/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 1.9540135e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:49,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43128 samples/s/p 3:31:45 } +2024-07-25 21:38:52,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1126/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 1.9534153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:52,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.42930 samples/s/p 3:31:47 } +2024-07-25 21:38:55,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1128/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 1.9528168e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:55,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 46.9% |███████████████████████ | 5.43043 samples/s/p 3:31:41 } +2024-07-25 21:38:58,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], 
step:[ 1130/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 1.9522184e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:38:58,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43987 samples/s/p 3:31:16 } +2024-07-25 21:39:01,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1132/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 1.95162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:01,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43444 samples/s/p 3:31:26 } +2024-07-25 21:39:03,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1134/ 1625], loss: 1.303, per_step_time: 1470ms, lr: 1.9510213e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:03,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43933 samples/s/p 3:31:12 } +2024-07-25 21:39:06,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1136/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 1.9504225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:06,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43548 samples/s/p 3:31:18 } +2024-07-25 21:39:09,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1138/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.9498239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:09,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43538 samples/s/p 3:31:15 } +2024-07-25 21:39:12,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1140/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 1.949225e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:39:12,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43562 samples/s/p 3:31:11 } +2024-07-25 21:39:15,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1142/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 1.948626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:15,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43721 samples/s/p 3:31:05 } +2024-07-25 21:39:18,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1144/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 1.948027e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:18,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.0% |███████████████████████ | 5.43157 samples/s/p 3:31:15 } +2024-07-25 21:39:21,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1146/ 1625], loss: 1.294, per_step_time: 1471ms, lr: 1.947428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:21,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43711 samples/s/p 3:30:59 } +2024-07-25 21:39:24,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1148/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 1.9468289e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:24,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.42887 samples/s/p 3:31:15 } +2024-07-25 21:39:27,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1150/ 1625], loss: 1.210, per_step_time: 1471ms, lr: 1.9462297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:27,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ 
| 5.43503 samples/s/p 3:30:58 } +2024-07-25 21:39:30,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1152/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.9456304e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:30,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43490 samples/s/p 3:30:55 } +2024-07-25 21:39:33,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1154/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 1.9450312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:33,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43759 samples/s/p 3:30:46 } +2024-07-25 21:39:36,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1156/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 1.9444315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:36,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43540 samples/s/p 3:30:48 } +2024-07-25 21:39:39,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1158/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.9438321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:39,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43816 samples/s/p 3:30:39 } +2024-07-25 21:39:42,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1160/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 1.9432326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:42,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.1% |███████████████████████ | 5.43915 samples/s/p 3:30:34 } +2024-07-25 21:39:45,299 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 5/ 10], step:[ 1162/ 1625], loss: 1.066, per_step_time: 1469ms, lr: 1.942633e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:45,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.44232 samples/s/p 3:30:24 } +2024-07-25 21:39:48,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1164/ 1625], loss: 1.263, per_step_time: 1473ms, lr: 1.942033e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:48,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43004 samples/s/p 3:30:49 } +2024-07-25 21:39:51,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1166/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.9414336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:51,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43806 samples/s/p 3:30:28 } +2024-07-25 21:39:54,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1168/ 1625], loss: 1.320, per_step_time: 1470ms, lr: 1.9408335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:54,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43956 samples/s/p 3:30:21 } +2024-07-25 21:39:57,101 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1170/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.9402336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:39:57,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43450 samples/s/p 3:30:30 } +2024-07-25 21:40:00,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1172/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 1.9396337e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:40:00,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.42957 samples/s/p 3:30:38 } +2024-07-25 21:40:03,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1174/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 1.9390336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:03,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43076 samples/s/p 3:30:33 } +2024-07-25 21:40:05,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1176/ 1625], loss: 1.285, per_step_time: 1471ms, lr: 1.9384335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:05,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.43689 samples/s/p 3:30:16 } +2024-07-25 21:40:08,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1178/ 1625], loss: 1.039, per_step_time: 1474ms, lr: 1.9378333e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:08,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.2% |███████████████████████ | 5.42581 samples/s/p 3:30:38 } +2024-07-25 21:40:11,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1180/ 1625], loss: 1.450, per_step_time: 1471ms, lr: 1.9372328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:11,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43534 samples/s/p 3:30:13 } +2024-07-25 21:40:14,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1182/ 1625], loss: 1.337, per_step_time: 1470ms, lr: 1.9366327e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:14,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% 
|███████████████████████ | 5.43855 samples/s/p 3:30:03 } +2024-07-25 21:40:17,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1184/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 1.9360323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:17,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43433 samples/s/p 3:30:10 } +2024-07-25 21:40:20,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1186/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 1.9354316e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:20,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43812 samples/s/p 3:29:58 } +2024-07-25 21:40:23,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1188/ 1625], loss: 1.164, per_step_time: 1469ms, lr: 1.934831e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:23,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.44394 samples/s/p 3:29:42 } +2024-07-25 21:40:26,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1190/ 1625], loss: 1.341, per_step_time: 1472ms, lr: 1.9342304e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:26,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43477 samples/s/p 3:30:00 } +2024-07-25 21:40:29,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1192/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.9336298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:29,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43715 samples/s/p 3:29:51 } +2024-07-25 21:40:32,513 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1194/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 1.933029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:32,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.3% |███████████████████████ | 5.43293 samples/s/p 3:29:58 } +2024-07-25 21:40:35,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1196/ 1625], loss: 1.097, per_step_time: 1473ms, lr: 1.9324281e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:35,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43084 samples/s/p 3:30:00 } +2024-07-25 21:40:38,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1198/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 1.9318273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:38,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43361 samples/s/p 3:29:51 } +2024-07-25 21:40:41,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1200/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 1.9312261e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:41,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43203 samples/s/p 3:29:51 } +2024-07-25 21:40:44,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1202/ 1625], loss: 1.060, per_step_time: 1470ms, lr: 1.930625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:44,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43920 samples/s/p 3:29:32 } +2024-07-25 21:40:47,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1204/ 1625], loss: 1.120, 
per_step_time: 1473ms, lr: 1.930024e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:47,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.42892 samples/s/p 3:29:53 } +2024-07-25 21:40:50,220 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1206/ 1625], loss: 1.134, per_step_time: 1470ms, lr: 1.9294228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:50,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.44211 samples/s/p 3:29:19 } +2024-07-25 21:40:53,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1208/ 1625], loss: 0.975, per_step_time: 1469ms, lr: 1.9288214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:53,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.44225 samples/s/p 3:29:16 } +2024-07-25 21:40:56,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1210/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 1.92822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:56,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.4% |███████████████████████ | 5.43491 samples/s/p 3:29:30 } +2024-07-25 21:40:59,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1212/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 1.9276187e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:40:59,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.44089 samples/s/p 3:29:13 } +2024-07-25 21:41:02,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1214/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 1.9270172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:02,017 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43411 samples/s/p 3:29:26 } +2024-07-25 21:41:04,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1216/ 1625], loss: 1.033, per_step_time: 1472ms, lr: 1.9264156e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:04,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43352 samples/s/p 3:29:24 } +2024-07-25 21:41:07,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1218/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 1.925814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:07,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43529 samples/s/p 3:29:17 } +2024-07-25 21:41:10,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1220/ 1625], loss: 1.007, per_step_time: 1473ms, lr: 1.9252126e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:10,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43096 samples/s/p 3:29:24 } +2024-07-25 21:41:13,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1222/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.9246108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:13,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43674 samples/s/p 3:29:08 } +2024-07-25 21:41:16,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1224/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.9240086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:16,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.43788 samples/s/p 
3:29:03 } +2024-07-25 21:41:19,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1226/ 1625], loss: 1.275, per_step_time: 1469ms, lr: 1.9234069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:19,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.5% |███████████████████████ | 5.44275 samples/s/p 3:28:48 } +2024-07-25 21:41:22,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1228/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 1.922805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:22,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43505 samples/s/p 3:29:03 } +2024-07-25 21:41:25,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1230/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 1.9222029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:25,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.44101 samples/s/p 3:28:47 } +2024-07-25 21:41:28,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1232/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.9216008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:28,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43740 samples/s/p 3:28:52 } +2024-07-25 21:41:31,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1234/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 1.9209985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:31,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43562 samples/s/p 3:28:53 } +2024-07-25 21:41:34,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], 
step:[ 1236/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 1.9203962e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:34,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43712 samples/s/p 3:28:47 } +2024-07-25 21:41:37,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1238/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.919794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:37,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43810 samples/s/p 3:28:42 } +2024-07-25 21:41:40,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1240/ 1625], loss: 1.318, per_step_time: 1472ms, lr: 1.9191915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:40,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43353 samples/s/p 3:28:49 } +2024-07-25 21:41:43,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1242/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 1.918589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:43,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.6% |███████████████████████ | 5.43427 samples/s/p 3:28:44 } +2024-07-25 21:41:46,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1244/ 1625], loss: 1.031, per_step_time: 1470ms, lr: 1.9179866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:46,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.44142 samples/s/p 3:28:25 } +2024-07-25 21:41:49,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1246/ 1625], loss: 1.304, per_step_time: 1471ms, lr: 1.917384e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:41:49,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43524 samples/s/p 3:28:36 } +2024-07-25 21:41:52,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1248/ 1625], loss: 1.049, per_step_time: 1473ms, lr: 1.9167815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:52,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43068 samples/s/p 3:28:44 } +2024-07-25 21:41:55,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1250/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 1.9161786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:55,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43950 samples/s/p 3:28:21 } +2024-07-25 21:41:58,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1252/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 1.915576e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:41:58,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43061 samples/s/p 3:28:38 } +2024-07-25 21:42:01,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1254/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 1.914973e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:01,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43663 samples/s/p 3:28:21 } +2024-07-25 21:42:03,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1256/ 1625], loss: 1.296, per_step_time: 1473ms, lr: 1.9143701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:03,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ 
| 5.43049 samples/s/p 3:28:33 } +2024-07-25 21:42:06,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1258/ 1625], loss: 0.967, per_step_time: 1471ms, lr: 1.913767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:06,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.7% |███████████████████████ | 5.43758 samples/s/p 3:28:13 } +2024-07-25 21:42:09,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1260/ 1625], loss: 1.028, per_step_time: 1470ms, lr: 1.9131641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:09,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.44139 samples/s/p 3:28:02 } +2024-07-25 21:42:12,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1262/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 1.9125608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:12,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.44053 samples/s/p 3:28:01 } +2024-07-25 21:42:15,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1264/ 1625], loss: 1.270, per_step_time: 1473ms, lr: 1.9119578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:15,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.42811 samples/s/p 3:28:26 } +2024-07-25 21:42:18,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1266/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 1.9113546e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:18,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43580 samples/s/p 3:28:06 } +2024-07-25 21:42:21,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 5/ 10], step:[ 1268/ 1625], loss: 0.899, per_step_time: 1470ms, lr: 1.910751e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:21,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43940 samples/s/p 3:27:54 } +2024-07-25 21:42:24,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1270/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 1.9101477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:24,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43554 samples/s/p 3:28:00 } +2024-07-25 21:42:27,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1272/ 1625], loss: 1.277, per_step_time: 1471ms, lr: 1.9095443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:27,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43631 samples/s/p 3:27:56 } +2024-07-25 21:42:30,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1274/ 1625], loss: 1.303, per_step_time: 1472ms, lr: 1.9089408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:30,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.8% |███████████████████████ | 5.43381 samples/s/p 3:27:58 } +2024-07-25 21:42:33,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1276/ 1625], loss: 1.111, per_step_time: 1471ms, lr: 1.908337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:33,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.43634 samples/s/p 3:27:50 } +2024-07-25 21:42:36,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1278/ 1625], loss: 1.248, per_step_time: 1473ms, lr: 1.9077335e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:42:36,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.42925 samples/s/p 3:28:03 } +2024-07-25 21:42:39,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1280/ 1625], loss: 0.998, per_step_time: 1473ms, lr: 1.9071298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:39,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.42899 samples/s/p 3:28:01 } +2024-07-25 21:42:42,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1282/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.9065259e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:42,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.43697 samples/s/p 3:27:39 } +2024-07-25 21:42:45,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1284/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 1.9059222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:45,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.43492 samples/s/p 3:27:41 } +2024-07-25 21:42:48,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1286/ 1625], loss: 1.057, per_step_time: 1470ms, lr: 1.9053183e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:48,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.44157 samples/s/p 3:27:23 } +2024-07-25 21:42:51,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1288/ 1625], loss: 0.966, per_step_time: 1471ms, lr: 1.9047144e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:51,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% 
|███████████████████████ | 5.43686 samples/s/p 3:27:31 } +2024-07-25 21:42:54,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1290/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.9041101e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:54,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 47.9% |███████████████████████ | 5.43826 samples/s/p 3:27:25 } +2024-07-25 21:42:57,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1292/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.9035058e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:42:57,082 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.43510 samples/s/p 3:27:29 } +2024-07-25 21:43:00,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1294/ 1625], loss: 1.284, per_step_time: 1474ms, lr: 1.902902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:00,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.42687 samples/s/p 3:27:45 } +2024-07-25 21:43:02,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1296/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 1.9022977e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:02,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.43849 samples/s/p 3:27:15 } +2024-07-25 21:43:05,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1298/ 1625], loss: 0.944, per_step_time: 1471ms, lr: 1.9016934e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:05,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |███████████████████████ | 5.43721 samples/s/p 3:27:15 } +2024-07-25 21:43:08,887 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1300/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.901089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:08,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.43492 samples/s/p 3:27:18 } +2024-07-25 21:43:11,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1302/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 1.9004845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:11,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.42980 samples/s/p 3:27:26 } +2024-07-25 21:43:14,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1304/ 1625], loss: 1.236, per_step_time: 1473ms, lr: 1.8998799e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:14,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.43048 samples/s/p 3:27:22 } +2024-07-25 21:43:17,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1306/ 1625], loss: 1.195, per_step_time: 1470ms, lr: 1.8992752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:17,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.44149 samples/s/p 3:26:54 } +2024-07-25 21:43:20,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1308/ 1625], loss: 1.009, per_step_time: 1472ms, lr: 1.8986706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:20,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.0% |████████████████████████ | 5.43266 samples/s/p 3:27:11 } +2024-07-25 21:43:23,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1310/ 1625], loss: 1.085, 
per_step_time: 1473ms, lr: 1.8980661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:23,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.42868 samples/s/p 3:27:17 } +2024-07-25 21:43:26,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1312/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 1.8974612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:26,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.43686 samples/s/p 3:26:55 } +2024-07-25 21:43:29,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1314/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 1.8968563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:29,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.43597 samples/s/p 3:26:55 } +2024-07-25 21:43:32,503 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1316/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 1.8962515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:32,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.42819 samples/s/p 3:27:09 } +2024-07-25 21:43:35,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1318/ 1625], loss: 1.258, per_step_time: 1471ms, lr: 1.8956465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:35,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.43688 samples/s/p 3:26:47 } +2024-07-25 21:43:38,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1320/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 1.8950414e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:38,406 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.42982 samples/s/p 3:27:00 } +2024-07-25 21:43:41,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1322/ 1625], loss: 1.007, per_step_time: 1472ms, lr: 1.8944364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:41,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.43307 samples/s/p 3:26:49 } +2024-07-25 21:43:44,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1324/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 1.8938314e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:44,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.1% |████████████████████████ | 5.42891 samples/s/p 3:26:56 } +2024-07-25 21:43:47,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1326/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 1.8932262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:47,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.42952 samples/s/p 3:26:52 } +2024-07-25 21:43:50,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1328/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 1.8926208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:50,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.43174 samples/s/p 3:26:44 } +2024-07-25 21:43:53,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1330/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 1.8920155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:53,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.44182 
samples/s/p 3:26:18 } +2024-07-25 21:43:56,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1332/ 1625], loss: 1.164, per_step_time: 1474ms, lr: 1.8914103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:56,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.42729 samples/s/p 3:26:48 } +2024-07-25 21:43:59,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1334/ 1625], loss: 1.034, per_step_time: 1470ms, lr: 1.8908046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:43:59,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.44116 samples/s/p 3:26:13 } +2024-07-25 21:44:02,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1336/ 1625], loss: 0.987, per_step_time: 1470ms, lr: 1.890199e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:02,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.43869 samples/s/p 3:26:16 } +2024-07-25 21:44:04,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1338/ 1625], loss: 1.290, per_step_time: 1472ms, lr: 1.8895937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:04,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.43365 samples/s/p 3:26:25 } +2024-07-25 21:44:07,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1340/ 1625], loss: 1.136, per_step_time: 1473ms, lr: 1.888988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:07,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.2% |████████████████████████ | 5.43089 samples/s/p 3:26:28 } +2024-07-25 21:44:10,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 5/ 10], step:[ 1342/ 1625], loss: 1.301, per_step_time: 1470ms, lr: 1.888382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:10,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43856 samples/s/p 3:26:07 } +2024-07-25 21:44:13,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1344/ 1625], loss: 1.011, per_step_time: 1472ms, lr: 1.8877763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:13,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43296 samples/s/p 3:26:17 } +2024-07-25 21:44:16,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1346/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 1.8871706e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:16,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43357 samples/s/p 3:26:13 } +2024-07-25 21:44:19,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1348/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 1.8865647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:19,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43046 samples/s/p 3:26:17 } +2024-07-25 21:44:22,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1350/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 1.8859586e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:22,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43614 samples/s/p 3:26:01 } +2024-07-25 21:44:25,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1352/ 1625], loss: 1.028, per_step_time: 1474ms, lr: 1.8853527e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:44:25,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.42510 samples/s/p 3:26:23 } +2024-07-25 21:44:28,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1354/ 1625], loss: 0.906, per_step_time: 1473ms, lr: 1.8847466e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:28,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43034 samples/s/p 3:26:09 } +2024-07-25 21:44:31,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1356/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 1.8841405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:31,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.3% |████████████████████████ | 5.43281 samples/s/p 3:26:00 } +2024-07-25 21:44:34,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1358/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 1.883534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:34,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.43367 samples/s/p 3:25:55 } +2024-07-25 21:44:37,443 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1360/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 1.882928e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:37,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.43394 samples/s/p 3:25:51 } +2024-07-25 21:44:40,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1362/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 1.8823217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:40,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% 
|████████████████████████ | 5.43517 samples/s/p 3:25:46 } +2024-07-25 21:44:43,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1364/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 1.8817153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:43,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.43522 samples/s/p 3:25:43 } +2024-07-25 21:44:46,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1366/ 1625], loss: 1.177, per_step_time: 1473ms, lr: 1.8811088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:46,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.42832 samples/s/p 3:25:55 } +2024-07-25 21:44:49,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1368/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 1.8805022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:49,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.43312 samples/s/p 3:25:42 } +2024-07-25 21:44:52,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1370/ 1625], loss: 1.189, per_step_time: 1470ms, lr: 1.8798957e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:52,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.43935 samples/s/p 3:25:25 } +2024-07-25 21:44:55,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1372/ 1625], loss: 1.286, per_step_time: 1469ms, lr: 1.8792889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:55,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.4% |████████████████████████ | 5.44219 samples/s/p 3:25:15 } +2024-07-25 21:44:58,096 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1374/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.8786823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:44:58,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43508 samples/s/p 3:25:28 } +2024-07-25 21:45:01,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1376/ 1625], loss: 1.055, per_step_time: 1473ms, lr: 1.8780756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:01,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43016 samples/s/p 3:25:37 } +2024-07-25 21:45:03,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1378/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 1.8774688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:03,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43831 samples/s/p 3:25:15 } +2024-07-25 21:45:06,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1380/ 1625], loss: 1.317, per_step_time: 1471ms, lr: 1.8768616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:06,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43652 samples/s/p 3:25:16 } +2024-07-25 21:45:09,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1382/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 1.876255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:09,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43467 samples/s/p 3:25:17 } +2024-07-25 21:45:12,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1384/ 1625], loss: 1.066, 
per_step_time: 1471ms, lr: 1.875648e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:12,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43774 samples/s/p 3:25:08 } +2024-07-25 21:45:15,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1386/ 1625], loss: 1.354, per_step_time: 1472ms, lr: 1.8750408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:15,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43236 samples/s/p 3:25:17 } +2024-07-25 21:45:18,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1388/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 1.8744337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:18,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.5% |████████████████████████ | 5.43269 samples/s/p 3:25:13 } +2024-07-25 21:45:21,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1390/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 1.8738265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:21,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43303 samples/s/p 3:25:09 } +2024-07-25 21:45:24,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1392/ 1625], loss: 1.255, per_step_time: 1472ms, lr: 1.8732191e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:24,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43262 samples/s/p 3:25:07 } +2024-07-25 21:45:27,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1394/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.872612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:27,607 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43844 samples/s/p 3:24:51 } +2024-07-25 21:45:30,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1396/ 1625], loss: 1.383, per_step_time: 1473ms, lr: 1.8720046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:30,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43058 samples/s/p 3:25:06 } +2024-07-25 21:45:33,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1398/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.8713974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:33,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43213 samples/s/p 3:25:00 } +2024-07-25 21:45:36,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1400/ 1625], loss: 1.313, per_step_time: 1473ms, lr: 1.8707897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:36,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43085 samples/s/p 3:25:00 } +2024-07-25 21:45:39,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1402/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.870182e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:39,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.43405 samples/s/p 3:24:49 } +2024-07-25 21:45:42,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1404/ 1625], loss: 0.955, per_step_time: 1470ms, lr: 1.8695746e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:42,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.6% |████████████████████████ | 5.44004 
samples/s/p 3:24:33 } +2024-07-25 21:45:45,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1406/ 1625], loss: 1.150, per_step_time: 1473ms, lr: 1.8689669e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:45,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.42932 samples/s/p 3:24:54 } +2024-07-25 21:45:48,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1408/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 1.8683593e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:48,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43279 samples/s/p 3:24:43 } +2024-07-25 21:45:51,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1410/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 1.8677512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:51,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43884 samples/s/p 3:24:27 } +2024-07-25 21:45:54,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1412/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 1.8671435e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:54,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43445 samples/s/p 3:24:34 } +2024-07-25 21:45:57,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1414/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 1.8665356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:45:57,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43285 samples/s/p 3:24:34 } +2024-07-25 21:46:00,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 5/ 10], step:[ 1416/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 1.8659277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:00,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43639 samples/s/p 3:24:24 } +2024-07-25 21:46:03,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1418/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 1.8653196e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:03,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43075 samples/s/p 3:24:33 } +2024-07-25 21:46:05,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1420/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.8647115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:05,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.7% |████████████████████████ | 5.43665 samples/s/p 3:24:17 } +2024-07-25 21:46:08,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1422/ 1625], loss: 1.319, per_step_time: 1473ms, lr: 1.8641036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:08,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43090 samples/s/p 3:24:27 } +2024-07-25 21:46:11,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1424/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.8634952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:11,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43708 samples/s/p 3:24:10 } +2024-07-25 21:46:14,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1426/ 1625], loss: 0.986, per_step_time: 1473ms, lr: 1.862887e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:46:14,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.42848 samples/s/p 3:24:27 } +2024-07-25 21:46:17,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1428/ 1625], loss: 1.176, per_step_time: 1474ms, lr: 1.8622788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:17,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.42537 samples/s/p 3:24:31 } +2024-07-25 21:46:20,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1430/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 1.8616704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:20,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43212 samples/s/p 3:24:13 } +2024-07-25 21:46:23,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1432/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 1.861062e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:23,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43561 samples/s/p 3:24:02 } +2024-07-25 21:46:26,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1434/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 1.8604534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:26,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43542 samples/s/p 3:23:59 } +2024-07-25 21:46:29,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1436/ 1625], loss: 0.952, per_step_time: 1473ms, lr: 1.859845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:29,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% 
|████████████████████████ | 5.42991 samples/s/p 3:24:09 } +2024-07-25 21:46:32,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1438/ 1625], loss: 1.084, per_step_time: 1473ms, lr: 1.8592364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:32,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.8% |████████████████████████ | 5.43081 samples/s/p 3:24:04 } +2024-07-25 21:46:35,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1440/ 1625], loss: 1.313, per_step_time: 1472ms, lr: 1.8586277e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:35,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43208 samples/s/p 3:23:58 } +2024-07-25 21:46:38,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1442/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 1.858019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:38,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43762 samples/s/p 3:23:42 } +2024-07-25 21:46:41,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1444/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.8574103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:41,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43284 samples/s/p 3:23:50 } +2024-07-25 21:46:44,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1446/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 1.8568015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:44,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.44077 samples/s/p 3:23:30 } +2024-07-25 21:46:47,299 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1448/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 1.8561926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:47,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43979 samples/s/p 3:23:29 } +2024-07-25 21:46:50,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1450/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 1.8555837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:50,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43328 samples/s/p 3:23:40 } +2024-07-25 21:46:53,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1452/ 1625], loss: 1.312, per_step_time: 1472ms, lr: 1.8549747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:53,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43358 samples/s/p 3:23:37 } +2024-07-25 21:46:56,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1454/ 1625], loss: 1.153, per_step_time: 1470ms, lr: 1.8543657e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:56,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 48.9% |████████████████████████ | 5.43917 samples/s/p 3:23:21 } +2024-07-25 21:46:59,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1456/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.8537567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:46:59,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43297 samples/s/p 3:23:32 } +2024-07-25 21:47:02,053 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1458/ 1625], loss: 1.175, 
per_step_time: 1472ms, lr: 1.8531473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:02,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43404 samples/s/p 3:23:27 } +2024-07-25 21:47:05,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1460/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 1.8525381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:05,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43799 samples/s/p 3:23:15 } +2024-07-25 21:47:07,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1462/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.8519288e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:07,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43732 samples/s/p 3:23:14 } +2024-07-25 21:47:10,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1464/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 1.8513196e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:10,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43643 samples/s/p 3:23:13 } +2024-07-25 21:47:13,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1466/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 1.8507104e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:13,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43652 samples/s/p 3:23:10 } +2024-07-25 21:47:16,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1468/ 1625], loss: 1.024, per_step_time: 1469ms, lr: 1.8501007e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:16,798 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.44402 samples/s/p 3:22:50 } +2024-07-25 21:47:19,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1470/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 1.8494913e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:19,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.0% |████████████████████████ | 5.43770 samples/s/p 3:23:01 } +2024-07-25 21:47:22,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1472/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 1.8488818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:22,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.43161 samples/s/p 3:23:12 } +2024-07-25 21:47:25,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1474/ 1625], loss: 1.323, per_step_time: 1469ms, lr: 1.848272e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:25,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.44262 samples/s/p 3:22:44 } +2024-07-25 21:47:28,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1476/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 1.8476625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:28,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.43176 samples/s/p 3:23:06 } +2024-07-25 21:47:31,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1478/ 1625], loss: 1.269, per_step_time: 1473ms, lr: 1.8470528e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:31,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.42970 
samples/s/p 3:23:07 } +2024-07-25 21:47:34,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1480/ 1625], loss: 1.130, per_step_time: 1473ms, lr: 1.846443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:34,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.42966 samples/s/p 3:23:04 } +2024-07-25 21:47:37,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1482/ 1625], loss: 1.064, per_step_time: 1470ms, lr: 1.8458331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:37,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.44193 samples/s/p 3:22:34 } +2024-07-25 21:47:40,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1484/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 1.8452232e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:40,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.43617 samples/s/p 3:22:44 } +2024-07-25 21:47:43,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1486/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 1.8446133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:43,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.1% |████████████████████████ | 5.43166 samples/s/p 3:22:51 } +2024-07-25 21:47:46,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1488/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 1.8440034e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:46,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43519 samples/s/p 3:22:40 } +2024-07-25 21:47:49,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 5/ 10], step:[ 1490/ 1625], loss: 1.207, per_step_time: 1474ms, lr: 1.8433933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:49,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.42739 samples/s/p 3:22:55 } +2024-07-25 21:47:52,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1492/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 1.8427832e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:52,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43735 samples/s/p 3:22:30 } +2024-07-25 21:47:55,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1494/ 1625], loss: 1.010, per_step_time: 1471ms, lr: 1.8421732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:55,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43698 samples/s/p 3:22:27 } +2024-07-25 21:47:58,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1496/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 1.841563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:47:58,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43825 samples/s/p 3:22:22 } +2024-07-25 21:48:01,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1498/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.8409528e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:01,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43799 samples/s/p 3:22:19 } +2024-07-25 21:48:04,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1500/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 1.8403425e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:48:04,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43438 samples/s/p 3:22:24 } +2024-07-25 21:48:06,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1502/ 1625], loss: 0.982, per_step_time: 1472ms, lr: 1.839732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:06,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.2% |████████████████████████ | 5.43438 samples/s/p 3:22:21 } +2024-07-25 21:48:09,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1504/ 1625], loss: 1.385, per_step_time: 1473ms, lr: 1.8391216e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:09,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.42979 samples/s/p 3:22:29 } +2024-07-25 21:48:12,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1506/ 1625], loss: 1.153, per_step_time: 1470ms, lr: 1.8385112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:12,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.44142 samples/s/p 3:22:00 } +2024-07-25 21:48:15,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1508/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 1.8379005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:15,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.43581 samples/s/p 3:22:09 } +2024-07-25 21:48:18,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1510/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 1.8372903e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:18,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% 
|████████████████████████ | 5.43893 samples/s/p 3:22:00 } +2024-07-25 21:48:21,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1512/ 1625], loss: 1.319, per_step_time: 1472ms, lr: 1.8366794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:21,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.43304 samples/s/p 3:22:10 } +2024-07-25 21:48:24,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1514/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 1.8360686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:24,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.43113 samples/s/p 3:22:11 } +2024-07-25 21:48:27,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1516/ 1625], loss: 1.070, per_step_time: 1470ms, lr: 1.8354582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:27,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.44107 samples/s/p 3:21:46 } +2024-07-25 21:48:30,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1518/ 1625], loss: 1.164, per_step_time: 1472ms, lr: 1.8348474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:30,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.3% |████████████████████████ | 5.43261 samples/s/p 3:22:02 } +2024-07-25 21:48:33,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1520/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.8342364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:33,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43716 samples/s/p 3:21:49 } +2024-07-25 21:48:36,467 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1522/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 1.8336255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:36,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43566 samples/s/p 3:21:49 } +2024-07-25 21:48:39,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1524/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 1.8330145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:39,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43625 samples/s/p 3:21:45 } +2024-07-25 21:48:42,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1526/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.8324039e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:42,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43785 samples/s/p 3:21:38 } +2024-07-25 21:48:45,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1528/ 1625], loss: 1.280, per_step_time: 1472ms, lr: 1.8317924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:45,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43347 samples/s/p 3:21:45 } +2024-07-25 21:48:48,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1530/ 1625], loss: 1.245, per_step_time: 1471ms, lr: 1.8311814e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:48,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43573 samples/s/p 3:21:37 } +2024-07-25 21:48:51,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1532/ 1625], loss: 1.274, 
per_step_time: 1471ms, lr: 1.8305704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:51,219 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.43699 samples/s/p 3:21:31 } +2024-07-25 21:48:54,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1534/ 1625], loss: 0.995, per_step_time: 1469ms, lr: 1.8299592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:54,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.4% |████████████████████████ | 5.44326 samples/s/p 3:21:15 } +2024-07-25 21:48:57,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1536/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 1.8293478e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:48:57,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43675 samples/s/p 3:21:26 } +2024-07-25 21:49:00,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1538/ 1625], loss: 1.015, per_step_time: 1471ms, lr: 1.8287366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:00,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43754 samples/s/p 3:21:21 } +2024-07-25 21:49:03,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1540/ 1625], loss: 1.409, per_step_time: 1473ms, lr: 1.8281251e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:03,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43037 samples/s/p 3:21:34 } +2024-07-25 21:49:05,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1542/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 1.8275137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:05,968 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43527 samples/s/p 3:21:21 } +2024-07-25 21:49:08,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1544/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.8269022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:08,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43331 samples/s/p 3:21:22 } +2024-07-25 21:49:11,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1546/ 1625], loss: 1.053, per_step_time: 1472ms, lr: 1.8262908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:11,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43455 samples/s/p 3:21:16 } +2024-07-25 21:49:14,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1548/ 1625], loss: 1.337, per_step_time: 1473ms, lr: 1.8256795e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:14,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43101 samples/s/p 3:21:21 } +2024-07-25 21:49:17,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1550/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 1.8250676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:17,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.5% |████████████████████████ | 5.43219 samples/s/p 3:21:16 } +2024-07-25 21:49:20,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1552/ 1625], loss: 0.950, per_step_time: 1470ms, lr: 1.824456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:20,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.44020 
samples/s/p 3:20:55 } +2024-07-25 21:49:23,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1554/ 1625], loss: 1.067, per_step_time: 1471ms, lr: 1.8238445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:23,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43538 samples/s/p 3:21:03 } +2024-07-25 21:49:26,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1556/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 1.8232326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:26,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43401 samples/s/p 3:21:03 } +2024-07-25 21:49:29,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1558/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.8226207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:29,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43213 samples/s/p 3:21:04 } +2024-07-25 21:49:32,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1560/ 1625], loss: 1.035, per_step_time: 1471ms, lr: 1.822009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:32,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43720 samples/s/p 3:20:50 } +2024-07-25 21:49:35,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1562/ 1625], loss: 0.939, per_step_time: 1471ms, lr: 1.8213968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:35,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43617 samples/s/p 3:20:49 } +2024-07-25 21:49:38,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 5/ 10], step:[ 1564/ 1625], loss: 1.295, per_step_time: 1474ms, lr: 1.820785e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:38,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.42663 samples/s/p 3:21:07 } +2024-07-25 21:49:41,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1566/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 1.8201728e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:41,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.43387 samples/s/p 3:20:48 } +2024-07-25 21:49:44,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1568/ 1625], loss: 1.305, per_step_time: 1470ms, lr: 1.8195607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:44,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.6% |████████████████████████ | 5.44139 samples/s/p 3:20:29 } +2024-07-25 21:49:47,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1570/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 1.8189487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:47,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43694 samples/s/p 3:20:36 } +2024-07-25 21:49:50,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1572/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 1.8183366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:50,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43144 samples/s/p 3:20:45 } +2024-07-25 21:49:53,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1574/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.8177245e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:49:53,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43354 samples/s/p 3:20:37 } +2024-07-25 21:49:56,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1576/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 1.8171122e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:56,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43431 samples/s/p 3:20:33 } +2024-07-25 21:49:59,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1578/ 1625], loss: 0.957, per_step_time: 1471ms, lr: 1.8165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:49:59,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43661 samples/s/p 3:20:25 } +2024-07-25 21:50:02,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1580/ 1625], loss: 1.067, per_step_time: 1470ms, lr: 1.8158873e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:02,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.43851 samples/s/p 3:20:18 } +2024-07-25 21:50:04,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1582/ 1625], loss: 1.251, per_step_time: 1470ms, lr: 1.815275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:04,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% |████████████████████████ | 5.44122 samples/s/p 3:20:09 } +2024-07-25 21:50:07,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1584/ 1625], loss: 1.024, per_step_time: 1471ms, lr: 1.8146626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:07,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.7% 
|████████████████████████ | 5.43683 samples/s/p 3:20:15 } +2024-07-25 21:50:10,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1586/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 1.8140501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:10,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43961 samples/s/p 3:20:06 } +2024-07-25 21:50:13,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1588/ 1625], loss: 1.242, per_step_time: 1473ms, lr: 1.8134375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:13,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.42950 samples/s/p 3:20:26 } +2024-07-25 21:50:16,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1590/ 1625], loss: 1.226, per_step_time: 1469ms, lr: 1.8128248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:16,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.44447 samples/s/p 3:19:50 } +2024-07-25 21:50:19,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1592/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 1.8122122e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:19,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43743 samples/s/p 3:20:02 } +2024-07-25 21:50:22,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1594/ 1625], loss: 1.348, per_step_time: 1472ms, lr: 1.8115996e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:22,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43368 samples/s/p 3:20:08 } +2024-07-25 21:50:25,636 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1596/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 1.8109868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:25,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43409 samples/s/p 3:20:04 } +2024-07-25 21:50:28,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1598/ 1625], loss: 1.319, per_step_time: 1471ms, lr: 1.8103741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:28,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43564 samples/s/p 3:19:57 } +2024-07-25 21:50:31,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1600/ 1625], loss: 1.094, per_step_time: 1473ms, lr: 1.8097613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:31,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.8% |████████████████████████ | 5.43093 samples/s/p 3:20:05 } +2024-07-25 21:50:34,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1602/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 1.8091481e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:34,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43547 samples/s/p 3:19:52 } +2024-07-25 21:50:37,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1604/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 1.8085353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:37,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43386 samples/s/p 3:19:52 } +2024-07-25 21:50:40,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1606/ 1625], loss: 1.076, 
per_step_time: 1471ms, lr: 1.8079225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:40,393 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43634 samples/s/p 3:19:44 } +2024-07-25 21:50:43,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1608/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.8073093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:43,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43491 samples/s/p 3:19:44 } +2024-07-25 21:50:46,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1610/ 1625], loss: 1.046, per_step_time: 1470ms, lr: 1.8066961e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:46,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43883 samples/s/p 3:19:33 } +2024-07-25 21:50:49,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1612/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 1.8060831e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:49,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43577 samples/s/p 3:19:36 } +2024-07-25 21:50:52,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1614/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 1.8054698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:52,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43767 samples/s/p 3:19:29 } +2024-07-25 21:50:55,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1616/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.8048568e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:55,144 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 49.9% |████████████████████████ | 5.43314 samples/s/p 3:19:36 } +2024-07-25 21:50:58,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1618/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 1.8042434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:50:58,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.43415 samples/s/p 3:19:31 } +2024-07-25 21:51:01,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1620/ 1625], loss: 1.042, per_step_time: 1470ms, lr: 1.8036299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:01,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.44166 samples/s/p 3:19:12 } +2024-07-25 21:51:03,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1622/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 1.8030169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:03,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.43371 samples/s/p 3:19:26 } +2024-07-25 21:51:06,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 5/ 10], step:[ 1624/ 1625], loss: 0.980, per_step_time: 1470ms, lr: 1.8024031e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:06,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |████████████████████████ | 5.44162 samples/s/p 3:19:06 } +2024-07-25 21:51:09,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 1.80179e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:09,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.43674 samples/s/p 
3:19:14 } +2024-07-25 21:51:12,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 3/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.8011764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:12,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.43581 samples/s/p 3:19:13 } +2024-07-25 21:51:15,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 5/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 1.8005629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:15,794 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.43266 samples/s/p 3:19:17 } +2024-07-25 21:51:18,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 7/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.7999491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:18,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.0% |█████████████████████████ | 5.43724 samples/s/p 3:19:04 } +2024-07-25 21:51:21,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 9/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 1.7993356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:21,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43338 samples/s/p 3:19:09 } +2024-07-25 21:51:24,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 11/ 1625], loss: 1.096, per_step_time: 1470ms, lr: 1.7987217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:24,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.44210 samples/s/p 3:18:47 } +2024-07-25 21:51:27,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], 
step:[ 13/ 1625], loss: 1.056, per_step_time: 1475ms, lr: 1.798108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:27,600 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.42097 samples/s/p 3:19:31 } +2024-07-25 21:51:30,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 15/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 1.7974944e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:30,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43296 samples/s/p 3:19:01 } +2024-07-25 21:51:33,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 17/ 1625], loss: 0.984, per_step_time: 1470ms, lr: 1.7968803e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:33,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43866 samples/s/p 3:18:46 } +2024-07-25 21:51:36,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 19/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 1.7962668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:36,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.42939 samples/s/p 3:19:03 } +2024-07-25 21:51:39,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 21/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 1.7956525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:39,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43835 samples/s/p 3:18:41 } +2024-07-25 21:51:42,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 23/ 1625], loss: 1.355, per_step_time: 1472ms, lr: 1.7950388e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:51:42,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.1% |█████████████████████████ | 5.43453 samples/s/p 3:18:46 } +2024-07-25 21:51:45,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 25/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 1.7944249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:45,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43753 samples/s/p 3:18:37 } +2024-07-25 21:51:48,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 27/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 1.7938106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:48,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43870 samples/s/p 3:18:31 } +2024-07-25 21:51:51,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 29/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 1.7931965e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:51,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43500 samples/s/p 3:18:36 } +2024-07-25 21:51:54,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 31/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 1.7925824e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:54,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43413 samples/s/p 3:18:35 } +2024-07-25 21:51:57,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 33/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.7919681e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:51:57,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% 
|█████████████████████████ | 5.43184 samples/s/p 3:18:37 } +2024-07-25 21:52:00,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 35/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 1.7913539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:00,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43013 samples/s/p 3:18:38 } +2024-07-25 21:52:03,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 37/ 1625], loss: 1.025, per_step_time: 1472ms, lr: 1.7907396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:03,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43122 samples/s/p 3:18:33 } +2024-07-25 21:52:05,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 39/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 1.7901253e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:05,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.2% |█████████████████████████ | 5.43383 samples/s/p 3:18:24 } +2024-07-25 21:52:08,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 41/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 1.789511e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:08,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.43520 samples/s/p 3:18:18 } +2024-07-25 21:52:11,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 43/ 1625], loss: 1.354, per_step_time: 1470ms, lr: 1.7888964e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:11,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.44103 samples/s/p 3:18:03 } +2024-07-25 21:52:14,812 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 45/ 1625], loss: 1.080, per_step_time: 1470ms, lr: 1.788282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:14,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.43986 samples/s/p 3:18:02 } +2024-07-25 21:52:17,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 47/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 1.7876677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:17,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.43375 samples/s/p 3:18:13 } +2024-07-25 21:52:20,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 49/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.787053e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:20,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.43575 samples/s/p 3:18:05 } +2024-07-25 21:52:23,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 51/ 1625], loss: 1.256, per_step_time: 1475ms, lr: 1.7864384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:23,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.42360 samples/s/p 3:18:29 } +2024-07-25 21:52:26,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 53/ 1625], loss: 1.194, per_step_time: 1468ms, lr: 1.7858238e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:26,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.44621 samples/s/p 3:17:37 } +2024-07-25 21:52:29,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 55/ 1625], loss: 1.111, 
per_step_time: 1471ms, lr: 1.7852091e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:29,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.3% |█████████████████████████ | 5.43489 samples/s/p 3:17:58 } +2024-07-25 21:52:32,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 57/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.7845947e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:32,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43601 samples/s/p 3:17:53 } +2024-07-25 21:52:35,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 59/ 1625], loss: 1.319, per_step_time: 1473ms, lr: 1.7839797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:35,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43072 samples/s/p 3:18:02 } +2024-07-25 21:52:38,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 61/ 1625], loss: 1.065, per_step_time: 1473ms, lr: 1.7833649e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:38,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.42890 samples/s/p 3:18:03 } +2024-07-25 21:52:41,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 63/ 1625], loss: 1.351, per_step_time: 1473ms, lr: 1.78275e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:41,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43040 samples/s/p 3:17:56 } +2024-07-25 21:52:44,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 65/ 1625], loss: 1.109, per_step_time: 1470ms, lr: 1.7821352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:44,328 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43905 samples/s/p 3:17:35 } +2024-07-25 21:52:47,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 67/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 1.78152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:47,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43734 samples/s/p 3:17:35 } +2024-07-25 21:52:50,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 69/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 1.7809052e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:50,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43752 samples/s/p 3:17:32 } +2024-07-25 21:52:53,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 71/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 1.7802902e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:53,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.43765 samples/s/p 3:17:29 } +2024-07-25 21:52:56,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 73/ 1625], loss: 1.242, per_step_time: 1482ms, lr: 1.7796752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:56,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.4% |█████████████████████████ | 5.39743 samples/s/p 3:18:54 } +2024-07-25 21:52:59,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 75/ 1625], loss: 0.993, per_step_time: 1470ms, lr: 1.77906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:52:59,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43915 samples/s/p 
3:17:20 } +2024-07-25 21:53:02,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 77/ 1625], loss: 0.873, per_step_time: 1470ms, lr: 1.7784449e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:02,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.44177 samples/s/p 3:17:11 } +2024-07-25 21:53:04,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 79/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 1.7778299e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:04,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43842 samples/s/p 3:17:15 } +2024-07-25 21:53:07,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 81/ 1625], loss: 1.112, per_step_time: 1469ms, lr: 1.7772145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:07,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.44330 samples/s/p 3:17:02 } +2024-07-25 21:53:10,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 83/ 1625], loss: 1.101, per_step_time: 1470ms, lr: 1.7765991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:10,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43887 samples/s/p 3:17:08 } +2024-07-25 21:53:13,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 85/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 1.775984e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:13,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43443 samples/s/p 3:17:15 } +2024-07-25 21:53:16,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], 
step:[ 87/ 1625], loss: 1.158, per_step_time: 1469ms, lr: 1.7753686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:16,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.44284 samples/s/p 3:16:54 } +2024-07-25 21:53:19,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 89/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 1.774753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:19,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.5% |█████████████████████████ | 5.43358 samples/s/p 3:17:11 } +2024-07-25 21:53:22,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 91/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 1.7741377e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:22,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.44198 samples/s/p 3:16:50 } +2024-07-25 21:53:25,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 93/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 1.7735223e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:25,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43421 samples/s/p 3:17:04 } +2024-07-25 21:53:28,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 95/ 1625], loss: 1.079, per_step_time: 1472ms, lr: 1.7729066e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:28,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43214 samples/s/p 3:17:05 } +2024-07-25 21:53:31,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 97/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.772291e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:53:31,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43332 samples/s/p 3:17:00 } +2024-07-25 21:53:34,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 99/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 1.7716755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:34,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43136 samples/s/p 3:17:01 } +2024-07-25 21:53:37,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 101/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.77106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:37,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43695 samples/s/p 3:16:46 } +2024-07-25 21:53:40,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 103/ 1625], loss: 1.210, per_step_time: 1471ms, lr: 1.7704442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:40,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43837 samples/s/p 3:16:40 } +2024-07-25 21:53:43,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 105/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 1.7698285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:43,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.6% |█████████████████████████ | 5.43495 samples/s/p 3:16:45 } +2024-07-25 21:53:46,291 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 107/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 1.7692128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:46,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% 
|█████████████████████████ | 5.43929 samples/s/p 3:16:32 } +2024-07-25 21:53:49,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 109/ 1625], loss: 1.241, per_step_time: 1470ms, lr: 1.768597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:49,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43907 samples/s/p 3:16:30 } +2024-07-25 21:53:52,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 111/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 1.767981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:52,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43430 samples/s/p 3:16:37 } +2024-07-25 21:53:55,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 113/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 1.7673652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:55,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43711 samples/s/p 3:16:28 } +2024-07-25 21:53:58,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 115/ 1625], loss: 1.137, per_step_time: 1473ms, lr: 1.7667493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:53:58,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.42906 samples/s/p 3:16:43 } +2024-07-25 21:54:01,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 117/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 1.7661332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:01,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43117 samples/s/p 3:16:35 } +2024-07-25 21:54:03,999 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 119/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.7655173e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:04,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43363 samples/s/p 3:16:27 } +2024-07-25 21:54:06,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 121/ 1625], loss: 1.184, per_step_time: 1473ms, lr: 1.764901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:06,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.7% |█████████████████████████ | 5.43010 samples/s/p 3:16:32 } +2024-07-25 21:54:09,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 123/ 1625], loss: 1.144, per_step_time: 1473ms, lr: 1.7642853e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:09,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43064 samples/s/p 3:16:27 } +2024-07-25 21:54:12,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 125/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 1.763669e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:12,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43129 samples/s/p 3:16:23 } +2024-07-25 21:54:15,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 127/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 1.7630528e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:15,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43807 samples/s/p 3:16:05 } +2024-07-25 21:54:18,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 129/ 1625], loss: 1.178, 
per_step_time: 1472ms, lr: 1.7624367e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:18,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43159 samples/s/p 3:16:17 } +2024-07-25 21:54:21,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 131/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.7618206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:21,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43124 samples/s/p 3:16:14 } +2024-07-25 21:54:24,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 133/ 1625], loss: 1.187, per_step_time: 1473ms, lr: 1.761204e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:24,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.42945 samples/s/p 3:16:15 } +2024-07-25 21:54:27,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 135/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 1.7605877e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:27,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43293 samples/s/p 3:16:05 } +2024-07-25 21:54:30,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 137/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 1.7599716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:30,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.8% |█████████████████████████ | 5.43157 samples/s/p 3:16:05 } +2024-07-25 21:54:33,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 139/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.759355e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:33,522 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43723 samples/s/p 3:15:50 } +2024-07-25 21:54:36,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 141/ 1625], loss: 1.364, per_step_time: 1471ms, lr: 1.7587385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:36,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43824 samples/s/p 3:15:44 } +2024-07-25 21:54:39,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 143/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.7581222e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:39,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43578 samples/s/p 3:15:47 } +2024-07-25 21:54:42,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 145/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 1.7575056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:42,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43808 samples/s/p 3:15:39 } +2024-07-25 21:54:45,321 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 147/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 1.756889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:45,322 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43558 samples/s/p 3:15:41 } +2024-07-25 21:54:48,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 149/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 1.7562725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:48,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43541 
samples/s/p 3:15:39 } +2024-07-25 21:54:51,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 151/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 1.7556558e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:51,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43543 samples/s/p 3:15:36 } +2024-07-25 21:54:54,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 153/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 1.7550392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:54,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 50.9% |█████████████████████████ | 5.43825 samples/s/p 3:15:27 } +2024-07-25 21:54:57,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 155/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 1.7544224e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:54:57,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43210 samples/s/p 3:15:37 } +2024-07-25 21:55:00,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 157/ 1625], loss: 1.088, per_step_time: 1476ms, lr: 1.7538056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:00,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.41695 samples/s/p 3:16:07 } +2024-07-25 21:55:03,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 159/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 1.753189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:03,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43821 samples/s/p 3:15:18 } +2024-07-25 21:55:05,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 6/ 10], step:[ 161/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.7525721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:05,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43291 samples/s/p 3:15:27 } +2024-07-25 21:55:08,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 163/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 1.7519553e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:08,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43410 samples/s/p 3:15:21 } +2024-07-25 21:55:11,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 165/ 1625], loss: 0.986, per_step_time: 1471ms, lr: 1.7513383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:11,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43743 samples/s/p 3:15:11 } +2024-07-25 21:55:14,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 167/ 1625], loss: 1.230, per_step_time: 1473ms, lr: 1.7507215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:14,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43043 samples/s/p 3:15:23 } +2024-07-25 21:55:17,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 169/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.7501043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:17,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.0% |█████████████████████████ | 5.43317 samples/s/p 3:15:14 } +2024-07-25 21:55:20,744 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 171/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.7494875e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:55:20,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.43398 samples/s/p 3:15:10 } +2024-07-25 21:55:23,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 173/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 1.7488705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:23,695 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.43567 samples/s/p 3:15:03 } +2024-07-25 21:55:26,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 175/ 1625], loss: 1.275, per_step_time: 1469ms, lr: 1.7482535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:26,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.44256 samples/s/p 3:14:45 } +2024-07-25 21:55:29,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 177/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 1.7476359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:29,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.43522 samples/s/p 3:14:58 } +2024-07-25 21:55:32,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 179/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 1.747019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:32,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.42766 samples/s/p 3:15:11 } +2024-07-25 21:55:35,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 181/ 1625], loss: 1.304, per_step_time: 1472ms, lr: 1.7464017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:35,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% 
|█████████████████████████ | 5.43263 samples/s/p 3:14:58 } +2024-07-25 21:55:38,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 183/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 1.7457845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:38,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.43580 samples/s/p 3:14:48 } +2024-07-25 21:55:41,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 185/ 1625], loss: 1.223, per_step_time: 1474ms, lr: 1.7451674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:41,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.1% |█████████████████████████ | 5.42630 samples/s/p 3:15:05 } +2024-07-25 21:55:44,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 187/ 1625], loss: 1.056, per_step_time: 1472ms, lr: 1.74455e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:44,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43266 samples/s/p 3:14:49 } +2024-07-25 21:55:47,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 189/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 1.7439326e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:47,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43729 samples/s/p 3:14:36 } +2024-07-25 21:55:50,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 191/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.7433153e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:50,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43782 samples/s/p 3:14:32 } +2024-07-25 21:55:53,208 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 193/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 1.7426979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:53,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43335 samples/s/p 3:14:38 } +2024-07-25 21:55:56,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 195/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.7420805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:56,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43674 samples/s/p 3:14:28 } +2024-07-25 21:55:59,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 197/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 1.741463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:55:59,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.44029 samples/s/p 3:14:18 } +2024-07-25 21:56:02,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 199/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 1.7408454e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:02,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43524 samples/s/p 3:14:26 } +2024-07-25 21:56:05,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 201/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 1.740228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:05,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.43200 samples/s/p 3:14:30 } +2024-07-25 21:56:07,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 203/ 1625], loss: 1.177, 
per_step_time: 1470ms, lr: 1.7396103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:07,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.2% |█████████████████████████ | 5.44030 samples/s/p 3:14:09 } +2024-07-25 21:56:10,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 205/ 1625], loss: 1.142, per_step_time: 1473ms, lr: 1.7389928e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:10,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.42994 samples/s/p 3:14:28 } +2024-07-25 21:56:13,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 207/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.7383752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:13,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43534 samples/s/p 3:14:14 } +2024-07-25 21:56:16,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 209/ 1625], loss: 1.209, per_step_time: 1471ms, lr: 1.7377573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:16,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43772 samples/s/p 3:14:06 } +2024-07-25 21:56:19,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 211/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 1.7371396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:19,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43135 samples/s/p 3:14:16 } +2024-07-25 21:56:22,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 213/ 1625], loss: 1.324, per_step_time: 1472ms, lr: 1.7365219e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:22,717 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43115 samples/s/p 3:14:14 } +2024-07-25 21:56:25,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 215/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 1.735904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:25,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43297 samples/s/p 3:14:07 } +2024-07-25 21:56:28,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 217/ 1625], loss: 1.055, per_step_time: 1473ms, lr: 1.7352862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:28,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43089 samples/s/p 3:14:08 } +2024-07-25 21:56:31,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 219/ 1625], loss: 1.014, per_step_time: 1472ms, lr: 1.7346685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:31,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.3% |█████████████████████████ | 5.43405 samples/s/p 3:13:59 } +2024-07-25 21:56:34,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 221/ 1625], loss: 1.076, per_step_time: 1473ms, lr: 1.7340506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:34,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.42972 samples/s/p 3:14:05 } +2024-07-25 21:56:37,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 223/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 1.7334327e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:37,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43293 
samples/s/p 3:13:55 } +2024-07-25 21:56:40,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 225/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 1.7328146e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:40,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43928 samples/s/p 3:13:39 } +2024-07-25 21:56:43,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 227/ 1625], loss: 1.229, per_step_time: 1475ms, lr: 1.7321967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:43,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.42341 samples/s/p 3:14:10 } +2024-07-25 21:56:46,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 229/ 1625], loss: 0.899, per_step_time: 1471ms, lr: 1.7315788e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:46,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43490 samples/s/p 3:13:42 } +2024-07-25 21:56:49,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 231/ 1625], loss: 0.989, per_step_time: 1469ms, lr: 1.7309607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:49,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.44319 samples/s/p 3:13:22 } +2024-07-25 21:56:52,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 233/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.7303424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:52,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43740 samples/s/p 3:13:31 } +2024-07-25 21:56:55,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 6/ 10], step:[ 235/ 1625], loss: 1.290, per_step_time: 1470ms, lr: 1.7297245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:55,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.4% |█████████████████████████ | 5.43852 samples/s/p 3:13:26 } +2024-07-25 21:56:58,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 237/ 1625], loss: 1.151, per_step_time: 1470ms, lr: 1.729106e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:56:58,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.44216 samples/s/p 3:13:15 } +2024-07-25 21:57:01,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 239/ 1625], loss: 1.328, per_step_time: 1473ms, lr: 1.728488e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:01,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43061 samples/s/p 3:13:37 } +2024-07-25 21:57:04,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 241/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 1.7278699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:04,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43274 samples/s/p 3:13:29 } +2024-07-25 21:57:06,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 243/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 1.7272516e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:06,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43186 samples/s/p 3:13:28 } +2024-07-25 21:57:09,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 245/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 1.7266331e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 21:57:09,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43942 samples/s/p 3:13:09 } +2024-07-25 21:57:12,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 247/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 1.7260149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:12,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.44078 samples/s/p 3:13:03 } +2024-07-25 21:57:15,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 249/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 1.7253966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:15,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.43777 samples/s/p 3:13:07 } +2024-07-25 21:57:18,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 251/ 1625], loss: 1.072, per_step_time: 1470ms, lr: 1.7247781e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:18,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.5% |█████████████████████████ | 5.44131 samples/s/p 3:12:56 } +2024-07-25 21:57:21,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 253/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 1.7241597e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:21,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43223 samples/s/p 3:13:13 } +2024-07-25 21:57:24,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 255/ 1625], loss: 1.000, per_step_time: 1470ms, lr: 1.7235412e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:24,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% 
|█████████████████████████ | 5.43920 samples/s/p 3:12:55 } +2024-07-25 21:57:27,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 257/ 1625], loss: 1.069, per_step_time: 1474ms, lr: 1.722923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:27,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.42595 samples/s/p 3:13:20 } +2024-07-25 21:57:30,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 259/ 1625], loss: 1.322, per_step_time: 1470ms, lr: 1.7223043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:30,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43993 samples/s/p 3:12:47 } +2024-07-25 21:57:33,535 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 261/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 1.7216857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:33,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43224 samples/s/p 3:13:01 } +2024-07-25 21:57:36,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 263/ 1625], loss: 1.325, per_step_time: 1471ms, lr: 1.7210672e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:36,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43770 samples/s/p 3:12:46 } +2024-07-25 21:57:39,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 265/ 1625], loss: 1.091, per_step_time: 1470ms, lr: 1.7204486e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:39,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43994 samples/s/p 3:12:38 } +2024-07-25 21:57:42,385 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 267/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.7198297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:42,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.6% |█████████████████████████ | 5.43342 samples/s/p 3:12:49 } +2024-07-25 21:57:45,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 269/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 1.7192113e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:45,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43705 samples/s/p 3:12:39 } +2024-07-25 21:57:48,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 271/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 1.7185926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:48,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43387 samples/s/p 3:12:43 } +2024-07-25 21:57:51,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 273/ 1625], loss: 1.273, per_step_time: 1471ms, lr: 1.7179738e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:51,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43836 samples/s/p 3:12:30 } +2024-07-25 21:57:54,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 275/ 1625], loss: 1.379, per_step_time: 1471ms, lr: 1.717355e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:57:54,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43734 samples/s/p 3:12:29 } +2024-07-25 21:57:54,186 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 21:58:30,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 277/ 1625], loss: 1.121, per_step_time: 1469ms, lr: 1.7167362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:30,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.44305 samples/s/p 3:12:14 } +2024-07-25 21:58:32,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 279/ 1625], loss: 1.205, per_step_time: 1473ms, lr: 1.7161175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:32,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.42958 samples/s/p 3:12:40 } +2024-07-25 21:58:35,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 281/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 1.7154985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:36,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43684 samples/s/p 3:12:22 } +2024-07-25 21:58:39,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 283/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 1.7148795e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:39,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.7% |█████████████████████████ | 5.43728 samples/s/p 3:12:18 } +2024-07-25 21:58:42,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 285/ 1625], loss: 0.981, per_step_time: 1470ms, lr: 1.7142607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:42,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.44091 samples/s/p 3:12:07 } +2024-07-25 21:58:45,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], 
step:[ 287/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.7136417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:45,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43207 samples/s/p 3:12:23 } +2024-07-25 21:58:47,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 289/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.7130225e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:47,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43841 samples/s/p 3:12:06 } +2024-07-25 21:58:50,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 291/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 1.7124037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:50,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43342 samples/s/p 3:12:14 } +2024-07-25 21:58:53,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 293/ 1625], loss: 1.123, per_step_time: 1470ms, lr: 1.7117847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:53,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.44060 samples/s/p 3:11:56 } +2024-07-25 21:58:56,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 295/ 1625], loss: 0.973, per_step_time: 1470ms, lr: 1.7111655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:58:56,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43855 samples/s/p 3:11:57 } +2024-07-25 21:58:59,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 297/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 1.7105465e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 21:58:59,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43753 samples/s/p 3:11:57 } +2024-07-25 21:59:02,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 299/ 1625], loss: 0.974, per_step_time: 1472ms, lr: 1.7099273e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:02,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.8% |█████████████████████████ | 5.43478 samples/s/p 3:11:59 } +2024-07-25 21:59:05,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 301/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 1.7093083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:05,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.44061 samples/s/p 3:11:44 } +2024-07-25 21:59:08,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 303/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 1.708689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:08,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43536 samples/s/p 3:11:52 } +2024-07-25 21:59:11,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 305/ 1625], loss: 1.362, per_step_time: 1469ms, lr: 1.7080698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:11,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.44565 samples/s/p 3:11:28 } +2024-07-25 21:59:14,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 307/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 1.7074506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:14,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% 
|█████████████████████████ | 5.43608 samples/s/p 3:11:45 } +2024-07-25 21:59:17,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 309/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.7068312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:17,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43541 samples/s/p 3:11:43 } +2024-07-25 21:59:20,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 311/ 1625], loss: 1.137, per_step_time: 1470ms, lr: 1.7062119e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:20,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43849 samples/s/p 3:11:34 } +2024-07-25 21:59:23,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 313/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 1.7055927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:23,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43707 samples/s/p 3:11:34 } +2024-07-25 21:59:26,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 315/ 1625], loss: 1.022, per_step_time: 1472ms, lr: 1.7049733e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:26,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 51.9% |█████████████████████████ | 5.43215 samples/s/p 3:11:41 } +2024-07-25 21:59:29,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 317/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.704354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:29,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.43259 samples/s/p 3:11:38 } +2024-07-25 21:59:32,238 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 319/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 1.7037344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:32,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.43806 samples/s/p 3:11:23 } +2024-07-25 21:59:35,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 321/ 1625], loss: 1.310, per_step_time: 1474ms, lr: 1.703115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:35,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.42523 samples/s/p 3:11:47 } +2024-07-25 21:59:38,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 323/ 1625], loss: 1.278, per_step_time: 1472ms, lr: 1.7024955e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:38,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |█████████████████████████ | 5.43285 samples/s/p 3:11:28 } +2024-07-25 21:59:41,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 325/ 1625], loss: 1.131, per_step_time: 1470ms, lr: 1.701876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:41,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.43868 samples/s/p 3:11:13 } +2024-07-25 21:59:44,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 327/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.7012564e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:44,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.43563 samples/s/p 3:11:16 } +2024-07-25 21:59:46,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 329/ 1625], loss: 1.033, 
per_step_time: 1470ms, lr: 1.7006369e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:46,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.44019 samples/s/p 3:11:04 } +2024-07-25 21:59:49,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 331/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 1.7000175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:49,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.43330 samples/s/p 3:11:15 } +2024-07-25 21:59:52,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 333/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.6993976e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:52,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.0% |██████████████████████████ | 5.43755 samples/s/p 3:11:03 } +2024-07-25 21:59:55,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 335/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 1.698778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:55,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43756 samples/s/p 3:11:01 } +2024-07-25 21:59:58,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 337/ 1625], loss: 1.244, per_step_time: 1470ms, lr: 1.6981583e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 21:59:58,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.44131 samples/s/p 3:10:50 } +2024-07-25 22:00:01,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 339/ 1625], loss: 1.302, per_step_time: 1471ms, lr: 1.6975388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:01,743 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43627 samples/s/p 3:10:57 } +2024-07-25 22:00:04,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 341/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 1.6969188e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:04,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43772 samples/s/p 3:10:51 } +2024-07-25 22:00:07,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 343/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 1.6962991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:07,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43658 samples/s/p 3:10:51 } +2024-07-25 22:00:10,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 345/ 1625], loss: 1.281, per_step_time: 1470ms, lr: 1.6956794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:10,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43965 samples/s/p 3:10:41 } +2024-07-25 22:00:13,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 347/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.6950595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:13,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43111 samples/s/p 3:10:56 } +2024-07-25 22:00:16,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 349/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.6944396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:16,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.1% |██████████████████████████ | 5.43786 
samples/s/p 3:10:39 } +2024-07-25 22:00:19,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 351/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 1.69382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:19,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43794 samples/s/p 3:10:36 } +2024-07-25 22:00:22,393 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 353/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 1.6932001e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:22,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43347 samples/s/p 3:10:43 } +2024-07-25 22:00:25,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 355/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 1.69258e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:25,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43766 samples/s/p 3:10:31 } +2024-07-25 22:00:28,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 357/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 1.6919603e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:28,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43549 samples/s/p 3:10:33 } +2024-07-25 22:00:31,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 359/ 1625], loss: 1.077, per_step_time: 1471ms, lr: 1.6913402e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:31,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43715 samples/s/p 3:10:26 } +2024-07-25 22:00:34,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 6/ 10], step:[ 361/ 1625], loss: 1.336, per_step_time: 1471ms, lr: 1.6907201e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:34,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43636 samples/s/p 3:10:25 } +2024-07-25 22:00:37,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 363/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 1.6901002e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:37,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43843 samples/s/p 3:10:17 } +2024-07-25 22:00:40,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 365/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.68948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:40,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.2% |██████████████████████████ | 5.43585 samples/s/p 3:10:20 } +2024-07-25 22:00:43,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 367/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 1.68886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:43,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43240 samples/s/p 3:10:24 } +2024-07-25 22:00:45,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 369/ 1625], loss: 1.036, per_step_time: 1471ms, lr: 1.6882399e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:45,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43540 samples/s/p 3:10:15 } +2024-07-25 22:00:48,947 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 371/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.6876196e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:00:48,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43522 samples/s/p 3:10:12 } +2024-07-25 22:00:51,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 373/ 1625], loss: 1.123, per_step_time: 1474ms, lr: 1.6869997e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:51,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.42501 samples/s/p 3:10:31 } +2024-07-25 22:00:54,858 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 375/ 1625], loss: 1.107, per_step_time: 1473ms, lr: 1.6863796e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:54,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.42758 samples/s/p 3:10:23 } +2024-07-25 22:00:57,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 377/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 1.6857595e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:00:57,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43703 samples/s/p 3:10:00 } +2024-07-25 22:01:00,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 379/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 1.685139e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:00,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.3% |██████████████████████████ | 5.43113 samples/s/p 3:10:09 } +2024-07-25 22:01:03,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 381/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.6845188e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:03,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
52.3% |██████████████████████████ | 5.43526 samples/s/p 3:09:58 } +2024-07-25 22:01:06,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 383/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 1.6838985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:06,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43031 samples/s/p 3:10:05 } +2024-07-25 22:01:09,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 385/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 1.6832782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:09,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.42912 samples/s/p 3:10:05 } +2024-07-25 22:01:12,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 387/ 1625], loss: 1.080, per_step_time: 1473ms, lr: 1.682658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:12,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.42798 samples/s/p 3:10:04 } +2024-07-25 22:01:15,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 389/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 1.6820375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:15,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43552 samples/s/p 3:09:45 } +2024-07-25 22:01:18,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 391/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 1.6814174e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:18,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43212 samples/s/p 3:09:50 } +2024-07-25 22:01:21,424 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 393/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 1.6807968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:21,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43886 samples/s/p 3:09:32 } +2024-07-25 22:01:24,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 395/ 1625], loss: 1.084, per_step_time: 1479ms, lr: 1.6801763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:24,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.40632 samples/s/p 3:10:38 } +2024-07-25 22:01:27,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 397/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 1.679556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:27,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.4% |██████████████████████████ | 5.43724 samples/s/p 3:09:30 } +2024-07-25 22:01:30,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 399/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.6789356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:30,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43381 samples/s/p 3:09:34 } +2024-07-25 22:01:33,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 401/ 1625], loss: 1.224, per_step_time: 1475ms, lr: 1.678315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:33,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.42343 samples/s/p 3:09:53 } +2024-07-25 22:01:36,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 403/ 1625], loss: 
1.256, per_step_time: 1470ms, lr: 1.6776945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:36,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43931 samples/s/p 3:09:17 } +2024-07-25 22:01:39,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 405/ 1625], loss: 1.144, per_step_time: 1470ms, lr: 1.6770739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:39,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43959 samples/s/p 3:09:13 } +2024-07-25 22:01:42,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 407/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 1.6764534e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:42,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43407 samples/s/p 3:09:22 } +2024-07-25 22:01:45,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 409/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.6758328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:45,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43548 samples/s/p 3:09:16 } +2024-07-25 22:01:48,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 411/ 1625], loss: 1.214, per_step_time: 1483ms, lr: 1.6752121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:48,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.39128 samples/s/p 3:10:46 } +2024-07-25 22:01:50,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 413/ 1625], loss: 0.987, per_step_time: 1471ms, lr: 1.6745917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:01:50,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.5% |██████████████████████████ | 5.43734 samples/s/p 3:09:06 } +2024-07-25 22:01:53,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 415/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 1.6739708e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:53,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43598 samples/s/p 3:09:06 } +2024-07-25 22:01:56,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 417/ 1625], loss: 1.017, per_step_time: 1470ms, lr: 1.6733502e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:56,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43998 samples/s/p 3:08:55 } +2024-07-25 22:01:59,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 419/ 1625], loss: 1.198, per_step_time: 1473ms, lr: 1.6727296e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:01:59,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.42940 samples/s/p 3:09:14 } +2024-07-25 22:02:02,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 421/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 1.672109e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:02,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43539 samples/s/p 3:08:59 } +2024-07-25 22:02:05,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 423/ 1625], loss: 1.291, per_step_time: 1474ms, lr: 1.671488e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:05,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% 
|██████████████████████████ | 5.42535 samples/s/p 3:09:17 } +2024-07-25 22:02:08,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 425/ 1625], loss: 0.963, per_step_time: 1471ms, lr: 1.6708673e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:08,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43769 samples/s/p 3:08:48 } +2024-07-25 22:02:11,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 427/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 1.6702465e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:11,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43730 samples/s/p 3:08:46 } +2024-07-25 22:02:14,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 429/ 1625], loss: 1.089, per_step_time: 1473ms, lr: 1.6696256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:14,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.6% |██████████████████████████ | 5.43015 samples/s/p 3:08:58 } +2024-07-25 22:02:17,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 431/ 1625], loss: 1.230, per_step_time: 1474ms, lr: 1.6690048e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:17,541 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.42490 samples/s/p 3:09:06 } +2024-07-25 22:02:20,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 433/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.6683838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:20,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43169 samples/s/p 3:08:49 } +2024-07-25 22:02:23,444 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 435/ 1625], loss: 1.030, per_step_time: 1472ms, lr: 1.6677632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:23,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43469 samples/s/p 3:08:39 } +2024-07-25 22:02:26,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 437/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.6671422e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:26,397 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43329 samples/s/p 3:08:39 } +2024-07-25 22:02:29,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 439/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.6665212e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:29,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43173 samples/s/p 3:08:40 } +2024-07-25 22:02:32,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 441/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 1.6659005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:32,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43506 samples/s/p 3:08:30 } +2024-07-25 22:02:35,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 443/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 1.6652793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:35,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43458 samples/s/p 3:08:28 } +2024-07-25 22:02:38,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 445/ 1625], loss: 
1.198, per_step_time: 1471ms, lr: 1.6646582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:38,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.7% |██████████████████████████ | 5.43662 samples/s/p 3:08:21 } +2024-07-25 22:02:41,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 447/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 1.6640375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:41,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43044 samples/s/p 3:08:31 } +2024-07-25 22:02:44,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 449/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.6634163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:44,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43225 samples/s/p 3:08:24 } +2024-07-25 22:02:47,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 451/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 1.6627953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:47,058 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43671 samples/s/p 3:08:12 } +2024-07-25 22:02:50,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 453/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.6621743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:50,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43233 samples/s/p 3:08:18 } +2024-07-25 22:02:52,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 455/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 1.661553e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:02:52,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43531 samples/s/p 3:08:09 } +2024-07-25 22:02:55,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 457/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 1.6609321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:55,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43585 samples/s/p 3:08:05 } +2024-07-25 22:02:58,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 459/ 1625], loss: 1.000, per_step_time: 1472ms, lr: 1.6603108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:02:58,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43343 samples/s/p 3:08:07 } +2024-07-25 22:03:01,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 461/ 1625], loss: 1.101, per_step_time: 1469ms, lr: 1.6596896e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:01,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.44257 samples/s/p 3:07:45 } +2024-07-25 22:03:04,760 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 463/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.6590686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:04,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.8% |██████████████████████████ | 5.43502 samples/s/p 3:07:57 } +2024-07-25 22:03:07,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 465/ 1625], loss: 1.186, per_step_time: 1473ms, lr: 1.6584474e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:07,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% 
|██████████████████████████ | 5.42971 samples/s/p 3:08:06 } +2024-07-25 22:03:10,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 467/ 1625], loss: 0.951, per_step_time: 1472ms, lr: 1.657826e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:10,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43458 samples/s/p 3:07:52 } +2024-07-25 22:03:13,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 469/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 1.6572048e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:13,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43849 samples/s/p 3:07:41 } +2024-07-25 22:03:16,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 471/ 1625], loss: 1.016, per_step_time: 1473ms, lr: 1.6565837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:16,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43040 samples/s/p 3:07:55 } +2024-07-25 22:03:19,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 473/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 1.6559625e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:19,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43182 samples/s/p 3:07:49 } +2024-07-25 22:03:22,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 475/ 1625], loss: 1.308, per_step_time: 1472ms, lr: 1.6553411e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:22,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43362 samples/s/p 3:07:43 } +2024-07-25 22:03:25,422 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 477/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.6547197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:25,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43518 samples/s/p 3:07:37 } +2024-07-25 22:03:28,372 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 479/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 1.6540986e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:28,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 52.9% |██████████████████████████ | 5.43583 samples/s/p 3:07:32 } +2024-07-25 22:03:31,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 481/ 1625], loss: 1.252, per_step_time: 1476ms, lr: 1.653477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:31,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.41699 samples/s/p 3:08:08 } +2024-07-25 22:03:34,286 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 483/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 1.6528556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:34,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43139 samples/s/p 3:07:36 } +2024-07-25 22:03:37,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 485/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 1.6522345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:37,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43426 samples/s/p 3:07:27 } +2024-07-25 22:03:40,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 487/ 1625], loss: 
1.072, per_step_time: 1484ms, lr: 1.651613e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:40,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.39015 samples/s/p 3:08:56 } +2024-07-25 22:03:43,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 489/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 1.6509914e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:43,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43230 samples/s/p 3:07:25 } +2024-07-25 22:03:46,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 491/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 1.6503702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:46,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43684 samples/s/p 3:07:12 } +2024-07-25 22:03:49,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 493/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 1.6497484e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:49,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43973 samples/s/p 3:07:04 } +2024-07-25 22:03:52,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 495/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 1.649127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:52,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.0% |██████████████████████████ | 5.43832 samples/s/p 3:07:04 } +2024-07-25 22:03:54,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 497/ 1625], loss: 1.268, per_step_time: 1471ms, lr: 1.6485055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:54,963 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43673 samples/s/p 3:07:04 } +2024-07-25 22:03:57,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 499/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 1.6478842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:03:57,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43681 samples/s/p 3:07:01 } +2024-07-25 22:04:00,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 501/ 1625], loss: 1.102, per_step_time: 1474ms, lr: 1.6472628e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:00,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.42410 samples/s/p 3:07:24 } +2024-07-25 22:04:03,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 503/ 1625], loss: 1.243, per_step_time: 1470ms, lr: 1.6466409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:03,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43918 samples/s/p 3:06:50 } +2024-07-25 22:04:06,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 505/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 1.6460193e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:06,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43220 samples/s/p 3:07:01 } +2024-07-25 22:04:09,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 507/ 1625], loss: 1.141, per_step_time: 1470ms, lr: 1.645398e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:09,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.44026 
samples/s/p 3:06:42 } +2024-07-25 22:04:12,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 509/ 1625], loss: 1.268, per_step_time: 1472ms, lr: 1.6447762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:12,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43234 samples/s/p 3:06:55 } +2024-07-25 22:04:15,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 511/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 1.6441545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:15,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.1% |██████████████████████████ | 5.43183 samples/s/p 3:06:53 } +2024-07-25 22:04:18,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 513/ 1625], loss: 1.055, per_step_time: 1471ms, lr: 1.6435331e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:18,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43738 samples/s/p 3:06:39 } +2024-07-25 22:04:21,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 515/ 1625], loss: 1.060, per_step_time: 1471ms, lr: 1.6429112e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:21,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43505 samples/s/p 3:06:41 } +2024-07-25 22:04:24,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 517/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 1.6422895e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:24,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43155 samples/s/p 3:06:45 } +2024-07-25 22:04:27,428 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 6/ 10], step:[ 519/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 1.641668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:27,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43146 samples/s/p 3:06:42 } +2024-07-25 22:04:30,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 521/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 1.6410462e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:30,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43468 samples/s/p 3:06:33 } +2024-07-25 22:04:33,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 523/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 1.6404245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:33,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43304 samples/s/p 3:06:33 } +2024-07-25 22:04:36,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 525/ 1625], loss: 1.376, per_step_time: 1473ms, lr: 1.6398028e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:36,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.42766 samples/s/p 3:06:41 } +2024-07-25 22:04:39,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 527/ 1625], loss: 1.008, per_step_time: 1472ms, lr: 1.639181e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:39,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.2% |██████████████████████████ | 5.43118 samples/s/p 3:06:31 } +2024-07-25 22:04:42,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 529/ 1625], loss: 1.129, per_step_time: 1470ms, lr: 1.6385593e-05, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 22:04:42,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.44103 samples/s/p 3:06:08 } +2024-07-25 22:04:45,139 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 531/ 1625], loss: 1.436, per_step_time: 1473ms, lr: 1.6379374e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:45,140 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.43075 samples/s/p 3:06:26 } +2024-07-25 22:04:48,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 533/ 1625], loss: 1.165, per_step_time: 1470ms, lr: 1.6373155e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:48,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.43872 samples/s/p 3:06:07 } +2024-07-25 22:04:51,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 535/ 1625], loss: 1.201, per_step_time: 1471ms, lr: 1.6366937e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:51,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.43826 samples/s/p 3:06:05 } +2024-07-25 22:04:53,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 537/ 1625], loss: 1.072, per_step_time: 1470ms, lr: 1.636072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:53,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.44147 samples/s/p 3:05:55 } +2024-07-25 22:04:56,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 539/ 1625], loss: 1.180, per_step_time: 1470ms, lr: 1.6354501e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:56,934 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 53.3% |██████████████████████████ | 5.43881 samples/s/p 3:05:58 } +2024-07-25 22:04:59,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 541/ 1625], loss: 1.300, per_step_time: 1471ms, lr: 1.6348282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:04:59,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.43559 samples/s/p 3:06:01 } +2024-07-25 22:05:02,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 543/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.6342063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:02,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.3% |██████████████████████████ | 5.43189 samples/s/p 3:06:06 } +2024-07-25 22:05:05,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 545/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 1.6335844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:05,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.44062 samples/s/p 3:05:45 } +2024-07-25 22:05:08,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 547/ 1625], loss: 1.291, per_step_time: 1472ms, lr: 1.6329626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:08,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43199 samples/s/p 3:06:00 } +2024-07-25 22:05:11,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 549/ 1625], loss: 1.330, per_step_time: 1471ms, lr: 1.6323405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:11,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43596 samples/s/p 3:05:49 } +2024-07-25 22:05:14,638 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 551/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 1.6317186e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:14,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43597 samples/s/p 3:05:46 } +2024-07-25 22:05:17,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 553/ 1625], loss: 1.262, per_step_time: 1474ms, lr: 1.6310967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:17,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.42392 samples/s/p 3:06:08 } +2024-07-25 22:05:20,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 555/ 1625], loss: 1.357, per_step_time: 1470ms, lr: 1.6304746e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:20,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43909 samples/s/p 3:05:34 } +2024-07-25 22:05:23,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 557/ 1625], loss: 1.058, per_step_time: 1475ms, lr: 1.6298527e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:23,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.42211 samples/s/p 3:06:06 } +2024-07-25 22:05:26,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 559/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 1.6292306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:26,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.4% |██████████████████████████ | 5.43538 samples/s/p 3:05:35 } +2024-07-25 22:05:29,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 561/ 1625], loss: 
1.229, per_step_time: 1473ms, lr: 1.6286087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:29,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.42803 samples/s/p 3:05:48 } +2024-07-25 22:05:32,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 563/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 1.6279866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:32,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.43518 samples/s/p 3:05:30 } +2024-07-25 22:05:35,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 565/ 1625], loss: 0.905, per_step_time: 1471ms, lr: 1.6273645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:35,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.43626 samples/s/p 3:05:25 } +2024-07-25 22:05:38,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 567/ 1625], loss: 1.168, per_step_time: 1473ms, lr: 1.6267424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:38,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.42843 samples/s/p 3:05:38 } +2024-07-25 22:05:41,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 569/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 1.6261205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:41,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.43277 samples/s/p 3:05:26 } +2024-07-25 22:05:44,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 571/ 1625], loss: 1.005, per_step_time: 1470ms, lr: 1.6254982e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:05:44,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.43855 samples/s/p 3:05:11 } +2024-07-25 22:05:47,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 573/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 1.6248761e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:47,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.44065 samples/s/p 3:05:04 } +2024-07-25 22:05:50,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 575/ 1625], loss: 1.241, per_step_time: 1474ms, lr: 1.6242542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:50,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.5% |██████████████████████████ | 5.42534 samples/s/p 3:05:32 } +2024-07-25 22:05:53,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 577/ 1625], loss: 1.043, per_step_time: 1472ms, lr: 1.623632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:53,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43252 samples/s/p 3:05:15 } +2024-07-25 22:05:55,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 579/ 1625], loss: 1.273, per_step_time: 1472ms, lr: 1.6230098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:55,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43304 samples/s/p 3:05:11 } +2024-07-25 22:05:58,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 581/ 1625], loss: 1.178, per_step_time: 1474ms, lr: 1.6223876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:05:58,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% 
|██████████████████████████ | 5.42718 samples/s/p 3:05:20 } +2024-07-25 22:06:01,877 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 583/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 1.6217655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:01,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43572 samples/s/p 3:04:59 } +2024-07-25 22:06:04,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 585/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 1.6211432e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:04,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43327 samples/s/p 3:05:01 } +2024-07-25 22:06:07,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 587/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.6205211e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:07,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43680 samples/s/p 3:04:51 } +2024-07-25 22:06:10,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 589/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 1.6198988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:10,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43900 samples/s/p 3:04:44 } +2024-07-25 22:06:13,675 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 591/ 1625], loss: 0.934, per_step_time: 1470ms, lr: 1.6192767e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:13,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.44091 samples/s/p 3:04:37 } +2024-07-25 22:06:16,624 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 593/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 1.6186543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:16,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.6% |██████████████████████████ | 5.43839 samples/s/p 3:04:39 } +2024-07-25 22:06:19,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 595/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 1.618032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:19,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43134 samples/s/p 3:04:51 } +2024-07-25 22:06:22,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 597/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 1.6174099e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:22,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.44027 samples/s/p 3:04:30 } +2024-07-25 22:06:25,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 599/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 1.6167876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:25,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43968 samples/s/p 3:04:28 } +2024-07-25 22:06:28,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 601/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 1.6161654e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:28,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43582 samples/s/p 3:04:33 } +2024-07-25 22:06:31,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 603/ 1625], loss: 
1.143, per_step_time: 1472ms, lr: 1.6155429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:31,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43460 samples/s/p 3:04:32 } +2024-07-25 22:06:34,324 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 605/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 1.6149206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:34,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43829 samples/s/p 3:04:22 } +2024-07-25 22:06:37,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 607/ 1625], loss: 1.029, per_step_time: 1472ms, lr: 1.6142983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:37,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43363 samples/s/p 3:04:28 } +2024-07-25 22:06:40,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 609/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 1.6136759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:40,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.7% |██████████████████████████ | 5.43348 samples/s/p 3:04:26 } +2024-07-25 22:06:43,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 611/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.6130536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:43,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.43933 samples/s/p 3:04:11 } +2024-07-25 22:06:46,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 613/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 1.6124313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:06:46,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.43276 samples/s/p 3:04:21 } +2024-07-25 22:06:49,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 615/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 1.6118087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:49,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.44031 samples/s/p 3:04:03 } +2024-07-25 22:06:52,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 617/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.6111862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:52,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.44156 samples/s/p 3:03:58 } +2024-07-25 22:06:54,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 619/ 1625], loss: 1.076, per_step_time: 1475ms, lr: 1.6105641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:54,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.42171 samples/s/p 3:04:35 } +2024-07-25 22:06:57,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 621/ 1625], loss: 1.093, per_step_time: 1473ms, lr: 1.6099417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:06:57,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.42954 samples/s/p 3:04:16 } +2024-07-25 22:07:00,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 623/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 1.609319e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:00,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% 
|██████████████████████████ | 5.43578 samples/s/p 3:04:00 } +2024-07-25 22:07:03,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 625/ 1625], loss: 1.006, per_step_time: 1472ms, lr: 1.6086968e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:03,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.8% |██████████████████████████ | 5.43421 samples/s/p 3:04:01 } +2024-07-25 22:07:06,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 627/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 1.6080743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:06,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43517 samples/s/p 3:03:56 } +2024-07-25 22:07:09,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 629/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.6074518e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:09,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43240 samples/s/p 3:03:58 } +2024-07-25 22:07:12,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 631/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 1.6068294e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:12,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43332 samples/s/p 3:03:54 } +2024-07-25 22:07:15,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 633/ 1625], loss: 1.459, per_step_time: 1472ms, lr: 1.606207e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:15,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43388 samples/s/p 3:03:50 } +2024-07-25 22:07:18,596 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 635/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 1.6055847e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:18,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43212 samples/s/p 3:03:50 } +2024-07-25 22:07:21,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 637/ 1625], loss: 1.307, per_step_time: 1475ms, lr: 1.6049618e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:21,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.42126 samples/s/p 3:04:09 } +2024-07-25 22:07:24,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 639/ 1625], loss: 0.981, per_step_time: 1473ms, lr: 1.6043394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:24,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.42973 samples/s/p 3:03:49 } +2024-07-25 22:07:27,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 641/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 1.603717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:27,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 53.9% |██████████████████████████ | 5.43598 samples/s/p 3:03:34 } +2024-07-25 22:07:30,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 643/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.6030945e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:30,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.43489 samples/s/p 3:03:33 } +2024-07-25 22:07:33,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 645/ 1625], loss: 
1.152, per_step_time: 1473ms, lr: 1.6024716e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:33,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.43102 samples/s/p 3:03:38 } +2024-07-25 22:07:36,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 647/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.6018494e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:36,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.43383 samples/s/p 3:03:29 } +2024-07-25 22:07:39,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 649/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.6012267e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:39,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |██████████████████████████ | 5.43168 samples/s/p 3:03:30 } +2024-07-25 22:07:42,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 651/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 1.600604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:42,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.43374 samples/s/p 3:03:23 } +2024-07-25 22:07:45,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 653/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 1.5999816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:45,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.43176 samples/s/p 3:03:24 } +2024-07-25 22:07:48,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 655/ 1625], loss: 1.053, per_step_time: 1470ms, lr: 1.599359e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:07:48,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.44169 samples/s/p 3:03:01 } +2024-07-25 22:07:51,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 657/ 1625], loss: 1.057, per_step_time: 1470ms, lr: 1.5987367e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:51,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.0% |███████████████████████████ | 5.43991 samples/s/p 3:03:02 } +2024-07-25 22:07:54,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 659/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.5981137e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:54,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43142 samples/s/p 3:03:16 } +2024-07-25 22:07:56,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 661/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 1.597491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:56,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.44106 samples/s/p 3:02:54 } +2024-07-25 22:07:59,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 663/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 1.5968686e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:07:59,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43839 samples/s/p 3:02:56 } +2024-07-25 22:08:02,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 665/ 1625], loss: 1.366, per_step_time: 1472ms, lr: 1.596246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:02,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% 
|███████████████████████████ | 5.43419 samples/s/p 3:03:02 } +2024-07-25 22:08:05,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 667/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 1.5956231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:05,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43548 samples/s/p 3:02:56 } +2024-07-25 22:08:08,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 669/ 1625], loss: 0.984, per_step_time: 1471ms, lr: 1.5950009e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:08,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43644 samples/s/p 3:02:51 } +2024-07-25 22:08:11,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 671/ 1625], loss: 1.056, per_step_time: 1470ms, lr: 1.5943782e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:11,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.43939 samples/s/p 3:02:42 } +2024-07-25 22:08:14,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 673/ 1625], loss: 1.216, per_step_time: 1474ms, lr: 1.5937554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:14,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.1% |███████████████████████████ | 5.42723 samples/s/p 3:03:04 } +2024-07-25 22:08:17,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 675/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.5931328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:17,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43802 samples/s/p 3:02:39 } +2024-07-25 22:08:20,571 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 677/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 1.59251e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:20,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43395 samples/s/p 3:02:45 } +2024-07-25 22:08:23,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 679/ 1625], loss: 1.321, per_step_time: 1471ms, lr: 1.5918875e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:23,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43504 samples/s/p 3:02:39 } +2024-07-25 22:08:26,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 681/ 1625], loss: 1.239, per_step_time: 1470ms, lr: 1.5912645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:26,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43859 samples/s/p 3:02:29 } +2024-07-25 22:08:29,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 683/ 1625], loss: 1.316, per_step_time: 1471ms, lr: 1.5906418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:29,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43636 samples/s/p 3:02:31 } +2024-07-25 22:08:32,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 685/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 1.5900194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:32,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43061 samples/s/p 3:02:40 } +2024-07-25 22:08:35,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 687/ 1625], loss: 
1.299, per_step_time: 1471ms, lr: 1.5893967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:35,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43682 samples/s/p 3:02:24 } +2024-07-25 22:08:38,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 689/ 1625], loss: 1.229, per_step_time: 1470ms, lr: 1.5887737e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:38,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.2% |███████████████████████████ | 5.43972 samples/s/p 3:02:15 } +2024-07-25 22:08:41,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 691/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 1.5881511e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:41,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43089 samples/s/p 3:02:30 } +2024-07-25 22:08:44,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 693/ 1625], loss: 0.993, per_step_time: 1471ms, lr: 1.5875283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:44,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43682 samples/s/p 3:02:15 } +2024-07-25 22:08:47,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 695/ 1625], loss: 1.366, per_step_time: 1473ms, lr: 1.5869056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:47,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.42969 samples/s/p 3:02:27 } +2024-07-25 22:08:50,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 697/ 1625], loss: 1.421, per_step_time: 1472ms, lr: 1.586283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:08:50,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43319 samples/s/p 3:02:17 } +2024-07-25 22:08:53,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 699/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 1.5856602e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:53,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43058 samples/s/p 3:02:19 } +2024-07-25 22:08:55,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 701/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 1.5850375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:55,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43372 samples/s/p 3:02:10 } +2024-07-25 22:08:58,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 703/ 1625], loss: 1.276, per_step_time: 1472ms, lr: 1.5844147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:08:58,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43391 samples/s/p 3:02:06 } +2024-07-25 22:09:01,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 705/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 1.5837917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:01,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.3% |███████████████████████████ | 5.43663 samples/s/p 3:01:58 } +2024-07-25 22:09:04,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 707/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 1.583169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:04,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% 
|███████████████████████████ | 5.42805 samples/s/p 3:02:12 } +2024-07-25 22:09:07,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 709/ 1625], loss: 1.204, per_step_time: 1474ms, lr: 1.5825464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:07,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.42508 samples/s/p 3:02:15 } +2024-07-25 22:09:10,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 711/ 1625], loss: 1.307, per_step_time: 1472ms, lr: 1.5819236e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:10,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43190 samples/s/p 3:01:59 } +2024-07-25 22:09:13,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 713/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 1.5813008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:13,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43181 samples/s/p 3:01:56 } +2024-07-25 22:09:16,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 715/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 1.5806778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:16,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43650 samples/s/p 3:01:44 } +2024-07-25 22:09:19,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 717/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.580055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:19,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43527 samples/s/p 3:01:43 } +2024-07-25 22:09:22,556 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 719/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.5794321e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:22,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43336 samples/s/p 3:01:44 } +2024-07-25 22:09:25,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 721/ 1625], loss: 1.109, per_step_time: 1470ms, lr: 1.5788095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:25,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.43863 samples/s/p 3:01:30 } +2024-07-25 22:09:28,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 723/ 1625], loss: 1.309, per_step_time: 1473ms, lr: 1.5781865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:28,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.4% |███████████████████████████ | 5.42935 samples/s/p 3:01:46 } +2024-07-25 22:09:31,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 725/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 1.5775639e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:31,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43459 samples/s/p 3:01:33 } +2024-07-25 22:09:34,361 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 727/ 1625], loss: 1.053, per_step_time: 1472ms, lr: 1.5769408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:34,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43386 samples/s/p 3:01:31 } +2024-07-25 22:09:37,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 729/ 1625], 
loss: 1.188, per_step_time: 1471ms, lr: 1.576318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:37,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43610 samples/s/p 3:01:24 } +2024-07-25 22:09:40,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 731/ 1625], loss: 1.017, per_step_time: 1470ms, lr: 1.5756952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:40,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43887 samples/s/p 3:01:15 } +2024-07-25 22:09:43,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 733/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 1.5750724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:43,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43444 samples/s/p 3:01:21 } +2024-07-25 22:09:46,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 735/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 1.5744496e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:46,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43324 samples/s/p 3:01:21 } +2024-07-25 22:09:49,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 737/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 1.5738266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:49,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43245 samples/s/p 3:01:19 } +2024-07-25 22:09:52,063 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 739/ 1625], loss: 1.012, per_step_time: 1470ms, lr: 1.5732037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:09:52,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.5% |███████████████████████████ | 5.43945 samples/s/p 3:01:02 } +2024-07-25 22:09:55,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 741/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 1.5725807e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:55,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.44058 samples/s/p 3:00:57 } +2024-07-25 22:09:57,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 743/ 1625], loss: 1.132, per_step_time: 1473ms, lr: 1.5719581e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:09:57,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.42996 samples/s/p 3:01:15 } +2024-07-25 22:10:00,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 745/ 1625], loss: 1.328, per_step_time: 1472ms, lr: 1.571335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:00,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.43251 samples/s/p 3:01:07 } +2024-07-25 22:10:03,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 747/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 1.5707124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:03,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.42765 samples/s/p 3:01:14 } +2024-07-25 22:10:06,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 749/ 1625], loss: 1.139, per_step_time: 1470ms, lr: 1.5700893e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:06,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% 
|███████████████████████████ | 5.43875 samples/s/p 3:00:49 } +2024-07-25 22:10:09,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 751/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 1.5694664e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:09,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.43532 samples/s/p 3:00:53 } +2024-07-25 22:10:12,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 753/ 1625], loss: 1.100, per_step_time: 1473ms, lr: 1.5688438e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:12,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.42753 samples/s/p 3:01:06 } +2024-07-25 22:10:15,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 755/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 1.5682208e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:15,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.6% |███████████████████████████ | 5.43492 samples/s/p 3:00:48 } +2024-07-25 22:10:18,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 757/ 1625], loss: 1.340, per_step_time: 1472ms, lr: 1.5675978e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:18,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43121 samples/s/p 3:00:52 } +2024-07-25 22:10:21,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 759/ 1625], loss: 1.211, per_step_time: 1475ms, lr: 1.5669748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:21,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.42274 samples/s/p 3:01:06 } +2024-07-25 22:10:24,537 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 761/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 1.566352e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:24,537 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43785 samples/s/p 3:00:33 } +2024-07-25 22:10:27,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 763/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 1.5657291e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:27,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43694 samples/s/p 3:00:32 } +2024-07-25 22:10:30,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 765/ 1625], loss: 1.094, per_step_time: 1473ms, lr: 1.5651061e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:30,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43048 samples/s/p 3:00:42 } +2024-07-25 22:10:33,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 767/ 1625], loss: 1.163, per_step_time: 1474ms, lr: 1.5644831e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:33,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.42682 samples/s/p 3:00:46 } +2024-07-25 22:10:36,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 769/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 1.5638603e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:36,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43514 samples/s/p 3:00:27 } +2024-07-25 22:10:39,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 771/ 1625], 
loss: 1.200, per_step_time: 1471ms, lr: 1.5632373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:39,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.7% |███████████████████████████ | 5.43611 samples/s/p 3:00:22 } +2024-07-25 22:10:42,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 773/ 1625], loss: 1.164, per_step_time: 1472ms, lr: 1.5626145e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:42,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43457 samples/s/p 3:00:22 } +2024-07-25 22:10:45,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 775/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.5619917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:45,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43584 samples/s/p 3:00:17 } +2024-07-25 22:10:48,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 777/ 1625], loss: 1.204, per_step_time: 1470ms, lr: 1.5613687e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:48,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.44114 samples/s/p 3:00:03 } +2024-07-25 22:10:51,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 779/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 1.5607457e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:51,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43813 samples/s/p 3:00:06 } +2024-07-25 22:10:54,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 781/ 1625], loss: 0.989, per_step_time: 1470ms, lr: 1.5601228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:10:54,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.44003 samples/s/p 2:59:59 } +2024-07-25 22:10:56,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 783/ 1625], loss: 1.234, per_step_time: 1473ms, lr: 1.5594998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:56,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.42762 samples/s/p 3:00:21 } +2024-07-25 22:10:59,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 785/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 1.5588768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:10:59,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43413 samples/s/p 3:00:05 } +2024-07-25 22:11:02,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 787/ 1625], loss: 1.202, per_step_time: 1473ms, lr: 1.5582538e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:02,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.8% |███████████████████████████ | 5.43072 samples/s/p 3:00:09 } +2024-07-25 22:11:05,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 789/ 1625], loss: 1.096, per_step_time: 1470ms, lr: 1.5576308e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:05,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.44104 samples/s/p 2:59:46 } +2024-07-25 22:11:08,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 791/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 1.5570082e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:08,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% 
|███████████████████████████ | 5.43816 samples/s/p 2:59:48 } +2024-07-25 22:11:11,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 793/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 1.5563852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:11,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.44080 samples/s/p 2:59:40 } +2024-07-25 22:11:14,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 795/ 1625], loss: 1.086, per_step_time: 1469ms, lr: 1.5557622e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:14,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.44529 samples/s/p 2:59:28 } +2024-07-25 22:11:17,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 797/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 1.5551394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:17,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.43697 samples/s/p 2:59:42 } +2024-07-25 22:11:20,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 799/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 1.5545163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:20,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.43233 samples/s/p 2:59:48 } +2024-07-25 22:11:23,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 801/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.5538935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:23,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.43661 samples/s/p 2:59:37 } +2024-07-25 22:11:26,496 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 803/ 1625], loss: 1.117, per_step_time: 1473ms, lr: 1.5532705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:26,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 54.9% |███████████████████████████ | 5.43108 samples/s/p 2:59:45 } +2024-07-25 22:11:29,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 805/ 1625], loss: 1.086, per_step_time: 1473ms, lr: 1.5526475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:29,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.42905 samples/s/p 2:59:46 } +2024-07-25 22:11:32,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 807/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 1.5520245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:32,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43662 samples/s/p 2:59:28 } +2024-07-25 22:11:35,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 809/ 1625], loss: 0.976, per_step_time: 1472ms, lr: 1.5514017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:35,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43252 samples/s/p 2:59:33 } +2024-07-25 22:11:38,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 811/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 1.5507787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:38,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43115 samples/s/p 2:59:33 } +2024-07-25 22:11:41,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 813/ 1625], 
loss: 1.128, per_step_time: 1471ms, lr: 1.5501559e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:41,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43531 samples/s/p 2:59:22 } +2024-07-25 22:11:44,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 815/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 1.5495329e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:44,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.44162 samples/s/p 2:59:06 } +2024-07-25 22:11:47,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 817/ 1625], loss: 1.230, per_step_time: 1472ms, lr: 1.5489097e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:47,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43321 samples/s/p 2:59:20 } +2024-07-25 22:11:50,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 819/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 1.5482869e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:50,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.0% |███████████████████████████ | 5.43975 samples/s/p 2:59:04 } +2024-07-25 22:11:53,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 821/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 1.5476639e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:53,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.42970 samples/s/p 2:59:21 } +2024-07-25 22:11:56,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 823/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 1.5470408e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:11:56,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.43614 samples/s/p 2:59:05 } +2024-07-25 22:11:58,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 825/ 1625], loss: 1.386, per_step_time: 1471ms, lr: 1.546418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:11:58,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.43810 samples/s/p 2:58:59 } +2024-07-25 22:12:01,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 827/ 1625], loss: 1.080, per_step_time: 1472ms, lr: 1.5457952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:01,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.43425 samples/s/p 2:59:03 } +2024-07-25 22:12:04,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 829/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 1.545172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:04,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.44184 samples/s/p 2:58:45 } +2024-07-25 22:12:07,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 831/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 1.544549e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:07,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.43986 samples/s/p 2:58:46 } +2024-07-25 22:12:10,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 833/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.5439264e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:10,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% 
|███████████████████████████ | 5.43748 samples/s/p 2:58:48 } +2024-07-25 22:12:13,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 835/ 1625], loss: 1.101, per_step_time: 1472ms, lr: 1.5433032e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:13,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.1% |███████████████████████████ | 5.43139 samples/s/p 2:58:57 } +2024-07-25 22:12:16,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 837/ 1625], loss: 1.278, per_step_time: 1473ms, lr: 1.5426804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:16,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43073 samples/s/p 2:58:55 } +2024-07-25 22:12:19,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 839/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 1.5420575e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:19,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43555 samples/s/p 2:58:43 } +2024-07-25 22:12:22,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 841/ 1625], loss: 1.056, per_step_time: 1472ms, lr: 1.5414344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:22,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43374 samples/s/p 2:58:44 } +2024-07-25 22:12:25,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 843/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 1.5408115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:25,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43545 samples/s/p 2:58:37 } +2024-07-25 22:12:28,464 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 845/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 1.5401885e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:28,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.42991 samples/s/p 2:58:45 } +2024-07-25 22:12:31,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 847/ 1625], loss: 1.219, per_step_time: 1473ms, lr: 1.5395655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:31,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.42941 samples/s/p 2:58:43 } +2024-07-25 22:12:34,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 849/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 1.5389427e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:34,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43564 samples/s/p 2:58:28 } +2024-07-25 22:12:37,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 851/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 1.5383197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:37,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43690 samples/s/p 2:58:23 } +2024-07-25 22:12:40,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 853/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 1.5376969e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:40,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.2% |███████████████████████████ | 5.43525 samples/s/p 2:58:23 } +2024-07-25 22:12:43,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 855/ 1625], 
loss: 1.178, per_step_time: 1468ms, lr: 1.5370739e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:43,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.44609 samples/s/p 2:57:59 } +2024-07-25 22:12:46,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 857/ 1625], loss: 1.029, per_step_time: 1470ms, lr: 1.5364512e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:46,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.44020 samples/s/p 2:58:07 } +2024-07-25 22:12:49,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 859/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 1.535828e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:49,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43639 samples/s/p 2:58:12 } +2024-07-25 22:12:52,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 861/ 1625], loss: 1.289, per_step_time: 1473ms, lr: 1.535205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:52,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43052 samples/s/p 2:58:21 } +2024-07-25 22:12:55,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 863/ 1625], loss: 1.023, per_step_time: 1471ms, lr: 1.5345824e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:12:55,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43565 samples/s/p 2:58:07 } +2024-07-25 22:12:57,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 865/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 1.5339594e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:12:57,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43146 samples/s/p 2:58:13 } +2024-07-25 22:13:00,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 867/ 1625], loss: 1.138, per_step_time: 1473ms, lr: 1.5333366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:00,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.42807 samples/s/p 2:58:16 } +2024-07-25 22:13:03,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 869/ 1625], loss: 1.033, per_step_time: 1470ms, lr: 1.5327136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:03,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.3% |███████████████████████████ | 5.43922 samples/s/p 2:57:52 } +2024-07-25 22:13:06,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 871/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 1.5320908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:06,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.43670 samples/s/p 2:57:54 } +2024-07-25 22:13:09,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 873/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 1.5314678e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:09,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.43594 samples/s/p 2:57:52 } +2024-07-25 22:13:12,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 875/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 1.5308447e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:12,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% 
|███████████████████████████ | 5.43287 samples/s/p 2:57:55 } +2024-07-25 22:13:15,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 877/ 1625], loss: 1.084, per_step_time: 1469ms, lr: 1.5302221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:15,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.44256 samples/s/p 2:57:33 } +2024-07-25 22:13:18,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 879/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 1.529599e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:18,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.44086 samples/s/p 2:57:34 } +2024-07-25 22:13:21,566 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 881/ 1625], loss: 1.128, per_step_time: 1470ms, lr: 1.5289763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:21,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.44013 samples/s/p 2:57:32 } +2024-07-25 22:13:24,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 883/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 1.5283535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:24,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.43887 samples/s/p 2:57:32 } +2024-07-25 22:13:27,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 885/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 1.5277303e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:27,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.4% |███████████████████████████ | 5.43248 samples/s/p 2:57:41 } +2024-07-25 22:13:30,418 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 887/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 1.5271076e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:30,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43441 samples/s/p 2:57:35 } +2024-07-25 22:13:33,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 889/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 1.5264846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:33,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43306 samples/s/p 2:57:34 } +2024-07-25 22:13:36,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 891/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 1.5258617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:36,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43647 samples/s/p 2:57:25 } +2024-07-25 22:13:39,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 893/ 1625], loss: 1.068, per_step_time: 1473ms, lr: 1.525239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:39,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.42815 samples/s/p 2:57:38 } +2024-07-25 22:13:42,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 895/ 1625], loss: 1.454, per_step_time: 1473ms, lr: 1.5246163e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:42,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.42875 samples/s/p 2:57:34 } +2024-07-25 22:13:45,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 897/ 1625], 
loss: 1.099, per_step_time: 1469ms, lr: 1.52399325e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:45,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.44313 samples/s/p 2:57:03 } +2024-07-25 22:13:48,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 899/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 1.5233704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:48,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43091 samples/s/p 2:57:24 } +2024-07-25 22:13:51,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 901/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 1.5227477e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:51,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.5% |███████████████████████████ | 5.43365 samples/s/p 2:57:15 } +2024-07-25 22:13:54,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 903/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 1.5221247e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:54,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43979 samples/s/p 2:57:01 } +2024-07-25 22:13:56,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 905/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 1.5215018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:13:56,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43291 samples/s/p 2:57:11 } +2024-07-25 22:13:59,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 907/ 1625], loss: 1.248, per_step_time: 1473ms, lr: 1.5208791e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 22:13:59,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.42858 samples/s/p 2:57:17 } +2024-07-25 22:14:02,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 909/ 1625], loss: 1.398, per_step_time: 1471ms, lr: 1.5202561e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:02,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43725 samples/s/p 2:56:57 } +2024-07-25 22:14:05,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 911/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 1.5196335e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:05,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43569 samples/s/p 2:56:57 } +2024-07-25 22:14:08,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 913/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 1.5190108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:08,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43659 samples/s/p 2:56:52 } +2024-07-25 22:14:11,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 915/ 1625], loss: 1.169, per_step_time: 1472ms, lr: 1.518388e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:11,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% |███████████████████████████ | 5.43292 samples/s/p 2:56:56 } +2024-07-25 22:14:14,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 917/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.517765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:14,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.6% 
|███████████████████████████ | 5.43686 samples/s/p 2:56:46 } +2024-07-25 22:14:17,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 919/ 1625], loss: 1.329, per_step_time: 1471ms, lr: 1.5171423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:17,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43736 samples/s/p 2:56:42 } +2024-07-25 22:14:20,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 921/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.5165197e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:20,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43460 samples/s/p 2:56:44 } +2024-07-25 22:14:23,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 923/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 1.5158967e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:23,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43204 samples/s/p 2:56:46 } +2024-07-25 22:14:26,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 925/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.5152741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:26,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43619 samples/s/p 2:56:35 } +2024-07-25 22:14:29,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 927/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 1.5146513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:29,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43339 samples/s/p 2:56:38 } +2024-07-25 22:14:32,389 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 929/ 1625], loss: 1.015, per_step_time: 1470ms, lr: 1.5140283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:32,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.44082 samples/s/p 2:56:20 } +2024-07-25 22:14:35,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 931/ 1625], loss: 1.250, per_step_time: 1473ms, lr: 1.5134057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:35,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.42934 samples/s/p 2:56:40 } +2024-07-25 22:14:38,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 933/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 1.512783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:38,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.7% |███████████████████████████ | 5.43514 samples/s/p 2:56:25 } +2024-07-25 22:14:41,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 935/ 1625], loss: 0.977, per_step_time: 1470ms, lr: 1.51216e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:41,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.44204 samples/s/p 2:56:09 } +2024-07-25 22:14:44,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 937/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 1.51153745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:44,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.42854 samples/s/p 2:56:32 } +2024-07-25 22:14:47,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 939/ 1625], loss: 
1.120, per_step_time: 1471ms, lr: 1.5109149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:47,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43742 samples/s/p 2:56:12 } +2024-07-25 22:14:50,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 941/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.510292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:50,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43823 samples/s/p 2:56:08 } +2024-07-25 22:14:53,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 943/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 1.5096692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:53,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.42970 samples/s/p 2:56:21 } +2024-07-25 22:14:56,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 945/ 1625], loss: 1.348, per_step_time: 1473ms, lr: 1.5090467e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:56,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43057 samples/s/p 2:56:17 } +2024-07-25 22:14:58,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 947/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 1.5084238e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:14:58,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43427 samples/s/p 2:56:07 } +2024-07-25 22:15:01,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 949/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 1.5078011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:15:01,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.8% |███████████████████████████ | 5.43795 samples/s/p 2:55:56 } +2024-07-25 22:15:04,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 951/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 1.5071786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:04,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43538 samples/s/p 2:55:58 } +2024-07-25 22:15:07,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 953/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 1.5065557e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:07,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43577 samples/s/p 2:55:55 } +2024-07-25 22:15:10,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 955/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.5059332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:10,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43338 samples/s/p 2:55:56 } +2024-07-25 22:15:13,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 957/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 1.5053105e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:13,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43494 samples/s/p 2:55:50 } +2024-07-25 22:15:16,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 959/ 1625], loss: 0.950, per_step_time: 1471ms, lr: 1.5046878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:16,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% 
|███████████████████████████ | 5.43693 samples/s/p 2:55:44 } +2024-07-25 22:15:19,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 961/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.5040652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:19,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43416 samples/s/p 2:55:46 } +2024-07-25 22:15:22,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 963/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 1.5034426e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:22,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.42816 samples/s/p 2:55:55 } +2024-07-25 22:15:25,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 965/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 1.5028201e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:25,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 55.9% |███████████████████████████ | 5.43583 samples/s/p 2:55:37 } +2024-07-25 22:15:28,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 967/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.5021974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:28,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.43453 samples/s/p 2:55:37 } +2024-07-25 22:15:31,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 969/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 1.5015748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:31,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.43661 samples/s/p 2:55:30 } +2024-07-25 22:15:34,362 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 971/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 1.5009523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:34,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.43740 samples/s/p 2:55:25 } +2024-07-25 22:15:37,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 973/ 1625], loss: 1.243, per_step_time: 1469ms, lr: 1.5003295e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:37,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |███████████████████████████ | 5.44338 samples/s/p 2:55:11 } +2024-07-25 22:15:40,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 975/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 1.499707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:40,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.43230 samples/s/p 2:55:29 } +2024-07-25 22:15:43,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 977/ 1625], loss: 0.963, per_step_time: 1472ms, lr: 1.4990845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:43,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.43372 samples/s/p 2:55:23 } +2024-07-25 22:15:46,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 979/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 1.4984617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:46,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.43414 samples/s/p 2:55:20 } +2024-07-25 22:15:49,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 981/ 1625], 
loss: 1.077, per_step_time: 1471ms, lr: 1.4978394e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:49,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.43574 samples/s/p 2:55:14 } +2024-07-25 22:15:52,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 983/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 1.4972169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:52,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.0% |████████████████████████████ | 5.42934 samples/s/p 2:55:23 } +2024-07-25 22:15:55,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 985/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 1.4965942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:55,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43805 samples/s/p 2:55:03 } +2024-07-25 22:15:57,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 987/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 1.4959717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:15:57,969 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43430 samples/s/p 2:55:08 } +2024-07-25 22:16:00,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 989/ 1625], loss: 1.030, per_step_time: 1472ms, lr: 1.49534935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:00,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43288 samples/s/p 2:55:07 } +2024-07-25 22:16:03,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 991/ 1625], loss: 1.453, per_step_time: 1470ms, lr: 1.4947266e-05, overflow cond: False, loss_scale: 1.0 
+2024-07-25 22:16:03,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.44037 samples/s/p 2:54:50 } +2024-07-25 22:16:06,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 993/ 1625], loss: 0.994, per_step_time: 1472ms, lr: 1.4941042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:06,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43362 samples/s/p 2:55:00 } +2024-07-25 22:16:09,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 995/ 1625], loss: 1.162, per_step_time: 1475ms, lr: 1.4934818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:09,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.42366 samples/s/p 2:55:16 } +2024-07-25 22:16:12,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 997/ 1625], loss: 1.350, per_step_time: 1471ms, lr: 1.4928592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:12,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43714 samples/s/p 2:54:47 } +2024-07-25 22:16:15,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 999/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.4922369e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:15,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.1% |████████████████████████████ | 5.43131 samples/s/p 2:54:56 } +2024-07-25 22:16:18,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1001/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 1.4916144e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:18,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% 
|████████████████████████████ | 5.43392 samples/s/p 2:54:48 } +2024-07-25 22:16:21,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1003/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 1.4909918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:21,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43551 samples/s/p 2:54:42 } +2024-07-25 22:16:24,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1005/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.4903695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:24,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43971 samples/s/p 2:54:31 } +2024-07-25 22:16:27,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1007/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 1.48974705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:27,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43199 samples/s/p 2:54:43 } +2024-07-25 22:16:30,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1009/ 1625], loss: 1.273, per_step_time: 1472ms, lr: 1.4891244e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:30,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43200 samples/s/p 2:54:40 } +2024-07-25 22:16:33,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1011/ 1625], loss: 1.242, per_step_time: 1473ms, lr: 1.4885022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:33,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.42835 samples/s/p 2:54:44 } +2024-07-25 22:16:36,343 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1013/ 1625], loss: 1.160, per_step_time: 1473ms, lr: 1.4878799e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:36,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43010 samples/s/p 2:54:37 } +2024-07-25 22:16:39,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1015/ 1625], loss: 1.013, per_step_time: 1472ms, lr: 1.4872577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:39,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.2% |████████████████████████████ | 5.43213 samples/s/p 2:54:31 } +2024-07-25 22:16:42,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1017/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 1.4866351e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:42,246 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43520 samples/s/p 2:54:22 } +2024-07-25 22:16:45,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1019/ 1625], loss: 1.061, per_step_time: 1470ms, lr: 1.4860129e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:45,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43921 samples/s/p 2:54:11 } +2024-07-25 22:16:48,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1021/ 1625], loss: 0.952, per_step_time: 1471ms, lr: 1.4853906e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:48,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43620 samples/s/p 2:54:14 } +2024-07-25 22:16:51,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1023/ 
1625], loss: 1.159, per_step_time: 1473ms, lr: 1.4847682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:51,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43085 samples/s/p 2:54:21 } +2024-07-25 22:16:54,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1025/ 1625], loss: 1.158, per_step_time: 1470ms, lr: 1.4841458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:54,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.44113 samples/s/p 2:53:59 } +2024-07-25 22:16:56,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1027/ 1625], loss: 1.285, per_step_time: 1473ms, lr: 1.4835237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:56,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43054 samples/s/p 2:54:16 } +2024-07-25 22:16:59,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1029/ 1625], loss: 1.255, per_step_time: 1473ms, lr: 1.4829013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:16:59,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.42947 samples/s/p 2:54:15 } +2024-07-25 22:17:02,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1031/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.4822789e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:02,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.3% |████████████████████████████ | 5.43582 samples/s/p 2:54:00 } +2024-07-25 22:17:05,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1033/ 1625], loss: 1.072, per_step_time: 1470ms, lr: 1.4816568e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:17:05,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43940 samples/s/p 2:53:50 } +2024-07-25 22:17:08,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1035/ 1625], loss: 1.042, per_step_time: 1470ms, lr: 1.4810344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:08,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.44093 samples/s/p 2:53:44 } +2024-07-25 22:17:11,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1037/ 1625], loss: 0.982, per_step_time: 1470ms, lr: 1.4804124e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:11,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43918 samples/s/p 2:53:45 } +2024-07-25 22:17:14,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1039/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.4797901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:14,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43451 samples/s/p 2:53:51 } +2024-07-25 22:17:17,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1041/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 1.4791677e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:17,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.42990 samples/s/p 2:53:57 } +2024-07-25 22:17:20,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1043/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 1.4785456e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:20,604 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43300 samples/s/p 2:53:48 } +2024-07-25 22:17:23,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1045/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 1.4779234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:23,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43847 samples/s/p 2:53:34 } +2024-07-25 22:17:26,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1047/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.4773011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:26,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.4% |████████████████████████████ | 5.43182 samples/s/p 2:53:44 } +2024-07-25 22:17:29,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1049/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 1.4766791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:29,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.43998 samples/s/p 2:53:25 } +2024-07-25 22:17:32,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1051/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 1.4760571e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:32,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.44023 samples/s/p 2:53:22 } +2024-07-25 22:17:35,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1053/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 1.4754348e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:35,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% 
|████████████████████████████ | 5.43205 samples/s/p 2:53:35 } +2024-07-25 22:17:38,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1055/ 1625], loss: 1.296, per_step_time: 1469ms, lr: 1.4748127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:38,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.44314 samples/s/p 2:53:11 } +2024-07-25 22:17:41,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1057/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.4741907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:41,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.43537 samples/s/p 2:53:22 } +2024-07-25 22:17:44,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1059/ 1625], loss: 1.049, per_step_time: 1472ms, lr: 1.4735684e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:44,203 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.43356 samples/s/p 2:53:23 } +2024-07-25 22:17:47,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1061/ 1625], loss: 1.281, per_step_time: 1473ms, lr: 1.4729463e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:47,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.42763 samples/s/p 2:53:31 } +2024-07-25 22:17:50,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1063/ 1625], loss: 1.011, per_step_time: 1472ms, lr: 1.4723245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:50,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.5% |████████████████████████████ | 5.43286 samples/s/p 2:53:18 } +2024-07-25 22:17:53,058 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1065/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 1.4717026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:53,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.43830 samples/s/p 2:53:05 } +2024-07-25 22:17:56,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1067/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 1.4710804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:56,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.43151 samples/s/p 2:53:15 } +2024-07-25 22:17:58,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1069/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 1.4704584e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:17:58,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.44062 samples/s/p 2:52:55 } +2024-07-25 22:18:01,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1071/ 1625], loss: 1.319, per_step_time: 1474ms, lr: 1.4698364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:01,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.42692 samples/s/p 2:53:18 } +2024-07-25 22:18:04,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1073/ 1625], loss: 1.048, per_step_time: 1474ms, lr: 1.4692143e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:04,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.42634 samples/s/p 2:53:16 } +2024-07-25 22:18:07,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1075/ 
1625], loss: 1.139, per_step_time: 1472ms, lr: 1.4685923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:07,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.43153 samples/s/p 2:53:03 } +2024-07-25 22:18:10,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1077/ 1625], loss: 1.056, per_step_time: 1471ms, lr: 1.4679705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:10,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.43697 samples/s/p 2:52:50 } +2024-07-25 22:18:13,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1079/ 1625], loss: 1.306, per_step_time: 1473ms, lr: 1.4673484e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:13,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.6% |████████████████████████████ | 5.42832 samples/s/p 2:53:04 } +2024-07-25 22:18:16,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1081/ 1625], loss: 1.176, per_step_time: 1473ms, lr: 1.4667266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:16,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.42891 samples/s/p 2:52:59 } +2024-07-25 22:18:19,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1083/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.4661047e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:19,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43461 samples/s/p 2:52:46 } +2024-07-25 22:18:22,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1085/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.46548255e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:18:22,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43117 samples/s/p 2:52:49 } +2024-07-25 22:18:25,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1087/ 1625], loss: 1.125, per_step_time: 1473ms, lr: 1.4648608e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:25,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43109 samples/s/p 2:52:46 } +2024-07-25 22:18:28,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1089/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 1.464239e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:28,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43823 samples/s/p 2:52:30 } +2024-07-25 22:18:31,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1091/ 1625], loss: 1.007, per_step_time: 1472ms, lr: 1.4636169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:31,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43223 samples/s/p 2:52:38 } +2024-07-25 22:18:34,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1093/ 1625], loss: 1.229, per_step_time: 1474ms, lr: 1.4629953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:34,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.42682 samples/s/p 2:52:46 } +2024-07-25 22:18:37,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1095/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 1.4623735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:37,344 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.7% |████████████████████████████ | 5.43810 samples/s/p 2:52:21 } +2024-07-25 22:18:40,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1097/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 1.4617516e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:40,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43490 samples/s/p 2:52:24 } +2024-07-25 22:18:43,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1099/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 1.4611298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:43,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43896 samples/s/p 2:52:14 } +2024-07-25 22:18:46,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1101/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 1.46050825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:46,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43881 samples/s/p 2:52:11 } +2024-07-25 22:18:49,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1103/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 1.4598862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:49,144 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43224 samples/s/p 2:52:21 } +2024-07-25 22:18:52,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1105/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.4592645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:52,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% 
|████████████████████████████ | 5.43225 samples/s/p 2:52:18 } +2024-07-25 22:18:55,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1107/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 1.458643e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:55,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43707 samples/s/p 2:52:06 } +2024-07-25 22:18:57,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1109/ 1625], loss: 0.965, per_step_time: 1471ms, lr: 1.45802105e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:18:57,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43571 samples/s/p 2:52:05 } +2024-07-25 22:19:00,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1111/ 1625], loss: 1.025, per_step_time: 1470ms, lr: 1.4573995e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:00,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43927 samples/s/p 2:51:56 } +2024-07-25 22:19:03,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1113/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.4567779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:03,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.8% |████████████████████████████ | 5.43642 samples/s/p 2:51:58 } +2024-07-25 22:19:06,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1115/ 1625], loss: 0.994, per_step_time: 1469ms, lr: 1.456156e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:06,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.44306 samples/s/p 2:51:43 } +2024-07-25 22:19:09,790 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1117/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.4555345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:09,790 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43837 samples/s/p 2:51:48 } +2024-07-25 22:19:12,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1119/ 1625], loss: 1.343, per_step_time: 1471ms, lr: 1.45491285e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:12,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43631 samples/s/p 2:51:49 } +2024-07-25 22:19:15,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1121/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 1.4542915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:15,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43618 samples/s/p 2:51:47 } +2024-07-25 22:19:18,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1123/ 1625], loss: 1.110, per_step_time: 1473ms, lr: 1.4536697e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:18,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43093 samples/s/p 2:51:54 } +2024-07-25 22:19:21,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1125/ 1625], loss: 1.374, per_step_time: 1473ms, lr: 1.4530483e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:21,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43055 samples/s/p 2:51:52 } +2024-07-25 22:19:24,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1127/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 1.45242675e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:24,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43318 samples/s/p 2:51:44 } +2024-07-25 22:19:27,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1129/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.451805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:27,499 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 56.9% |████████████████████████████ | 5.43448 samples/s/p 2:51:38 } +2024-07-25 22:19:30,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1131/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 1.45118365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:30,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43709 samples/s/p 2:51:30 } +2024-07-25 22:19:33,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1133/ 1625], loss: 1.132, per_step_time: 1473ms, lr: 1.4505621e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:33,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.42762 samples/s/p 2:51:45 } +2024-07-25 22:19:36,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1135/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.4499405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:36,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43299 samples/s/p 2:51:32 } +2024-07-25 22:19:39,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1137/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 1.4493192e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:19:39,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43519 samples/s/p 2:51:25 } +2024-07-25 22:19:42,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1139/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 1.4486979e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:42,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43454 samples/s/p 2:51:23 } +2024-07-25 22:19:45,207 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1141/ 1625], loss: 1.429, per_step_time: 1471ms, lr: 1.4480763e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:45,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43521 samples/s/p 2:51:19 } +2024-07-25 22:19:48,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1143/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.4474548e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:48,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.43658 samples/s/p 2:51:14 } +2024-07-25 22:19:51,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1145/ 1625], loss: 0.981, per_step_time: 1470ms, lr: 1.4468337e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:51,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.0% |████████████████████████████ | 5.44016 samples/s/p 2:51:04 } +2024-07-25 22:19:54,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1147/ 1625], loss: 1.031, per_step_time: 1472ms, lr: 1.4462121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:54,057 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43270 samples/s/p 2:51:15 } +2024-07-25 22:19:57,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1149/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 1.4455908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:57,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43454 samples/s/p 2:51:09 } +2024-07-25 22:19:59,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1151/ 1625], loss: 1.070, per_step_time: 1473ms, lr: 1.4449695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:19:59,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.42741 samples/s/p 2:51:19 } +2024-07-25 22:20:02,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1153/ 1625], loss: 1.078, per_step_time: 1470ms, lr: 1.4443482e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:02,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.44202 samples/s/p 2:50:49 } +2024-07-25 22:20:05,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1155/ 1625], loss: 1.054, per_step_time: 1474ms, lr: 1.443727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:05,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.42705 samples/s/p 2:51:14 } +2024-07-25 22:20:08,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1157/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 1.4431057e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:08,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% 
|████████████████████████████ | 5.43782 samples/s/p 2:50:51 } +2024-07-25 22:20:11,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1159/ 1625], loss: 1.060, per_step_time: 1472ms, lr: 1.4424842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:11,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43281 samples/s/p 2:50:57 } +2024-07-25 22:20:14,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1161/ 1625], loss: 1.329, per_step_time: 1471ms, lr: 1.4418632e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:14,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.1% |████████████████████████████ | 5.43726 samples/s/p 2:50:46 } +2024-07-25 22:20:17,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1163/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 1.441242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:17,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43554 samples/s/p 2:50:46 } +2024-07-25 22:20:20,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1165/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 1.4406206e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:20,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43375 samples/s/p 2:50:47 } +2024-07-25 22:20:23,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1167/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 1.4399996e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:23,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43503 samples/s/p 2:50:41 } +2024-07-25 22:20:26,522 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1169/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 1.4393786e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:26,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43365 samples/s/p 2:50:41 } +2024-07-25 22:20:29,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1171/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 1.4387574e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:29,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43822 samples/s/p 2:50:29 } +2024-07-25 22:20:32,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1173/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.4381362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:32,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43467 samples/s/p 2:50:33 } +2024-07-25 22:20:35,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1175/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 1.4375152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:35,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43166 samples/s/p 2:50:36 } +2024-07-25 22:20:38,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1177/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.4368942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:38,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.2% |████████████████████████████ | 5.43671 samples/s/p 2:50:23 } +2024-07-25 22:20:41,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1179/ 
1625], loss: 1.121, per_step_time: 1472ms, lr: 1.4362731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:41,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43270 samples/s/p 2:50:28 } +2024-07-25 22:20:44,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1181/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 1.435652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:44,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43662 samples/s/p 2:50:18 } +2024-07-25 22:20:47,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1183/ 1625], loss: 1.148, per_step_time: 1474ms, lr: 1.4350312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:47,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.42505 samples/s/p 2:50:36 } +2024-07-25 22:20:50,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1185/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 1.4344101e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:50,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43425 samples/s/p 2:50:16 } +2024-07-25 22:20:53,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1187/ 1625], loss: 1.237, per_step_time: 1475ms, lr: 1.4337891e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:53,093 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.42183 samples/s/p 2:50:37 } +2024-07-25 22:20:56,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1189/ 1625], loss: 1.042, per_step_time: 1471ms, lr: 1.4331683e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 22:20:56,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43691 samples/s/p 2:50:05 } +2024-07-25 22:20:58,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1191/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 1.4325473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:20:58,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43245 samples/s/p 2:50:11 } +2024-07-25 22:21:01,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1193/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.4319266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:01,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.3% |████████████████████████████ | 5.43598 samples/s/p 2:50:01 } +2024-07-25 22:21:04,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1195/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 1.4313056e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:04,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43889 samples/s/p 2:49:53 } +2024-07-25 22:21:07,850 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1197/ 1625], loss: 1.136, per_step_time: 1474ms, lr: 1.43068455e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:07,850 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.42492 samples/s/p 2:50:16 } +2024-07-25 22:21:10,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1199/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.4300639e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:10,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 57.4% |████████████████████████████ | 5.43600 samples/s/p 2:49:52 } +2024-07-25 22:21:13,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1201/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 1.4294431e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:13,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43270 samples/s/p 2:49:56 } +2024-07-25 22:21:16,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1203/ 1625], loss: 0.930, per_step_time: 1471ms, lr: 1.4288221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:16,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43488 samples/s/p 2:49:49 } +2024-07-25 22:21:19,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1205/ 1625], loss: 1.274, per_step_time: 1471ms, lr: 1.4282015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:19,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43758 samples/s/p 2:49:41 } +2024-07-25 22:21:22,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1207/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 1.4275809e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:22,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43293 samples/s/p 2:49:46 } +2024-07-25 22:21:25,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1209/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 1.42696e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:25,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.4% |████████████████████████████ | 5.43253 samples/s/p 2:49:44 } +2024-07-25 22:21:28,507 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1211/ 1625], loss: 1.000, per_step_time: 1470ms, lr: 1.42633935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:28,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43937 samples/s/p 2:49:28 } +2024-07-25 22:21:31,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1213/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 1.4257189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:31,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43870 samples/s/p 2:49:27 } +2024-07-25 22:21:34,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1215/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 1.425098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:34,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43191 samples/s/p 2:49:36 } +2024-07-25 22:21:37,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1217/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 1.4244773e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:37,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43765 samples/s/p 2:49:23 } +2024-07-25 22:21:40,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1219/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.423857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:40,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43621 samples/s/p 2:49:22 } +2024-07-25 22:21:43,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1221/ 
1625], loss: 0.899, per_step_time: 1470ms, lr: 1.4232365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:43,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43879 samples/s/p 2:49:15 } +2024-07-25 22:21:46,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1223/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 1.4226158e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:46,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43198 samples/s/p 2:49:24 } +2024-07-25 22:21:49,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1225/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.4219952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:49,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.5% |████████████████████████████ | 5.43570 samples/s/p 2:49:15 } +2024-07-25 22:21:52,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1227/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.4213749e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:52,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43258 samples/s/p 2:49:17 } +2024-07-25 22:21:55,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1229/ 1625], loss: 1.179, per_step_time: 1473ms, lr: 1.4207542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:21:55,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.42947 samples/s/p 2:49:20 } +2024-07-25 22:21:58,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1231/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 1.4201337e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:21:58,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43699 samples/s/p 2:49:03 } +2024-07-25 22:22:00,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1233/ 1625], loss: 0.931, per_step_time: 1470ms, lr: 1.4195134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:00,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.44071 samples/s/p 2:48:53 } +2024-07-25 22:22:03,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1235/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 1.4188929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:03,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43446 samples/s/p 2:49:02 } +2024-07-25 22:22:06,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1237/ 1625], loss: 1.022, per_step_time: 1471ms, lr: 1.4182727e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:06,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43811 samples/s/p 2:48:52 } +2024-07-25 22:22:09,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1239/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 1.4176523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:09,814 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43963 samples/s/p 2:48:47 } +2024-07-25 22:22:12,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1241/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 1.4170318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:12,763 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43785 samples/s/p 2:48:47 } +2024-07-25 22:22:15,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1243/ 1625], loss: 1.181, per_step_time: 1473ms, lr: 1.4164116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:15,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.6% |████████████████████████████ | 5.43065 samples/s/p 2:48:58 } +2024-07-25 22:22:18,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1245/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.4157913e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:18,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43501 samples/s/p 2:48:46 } +2024-07-25 22:22:21,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1247/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 1.41517085e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:21,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43198 samples/s/p 2:48:49 } +2024-07-25 22:22:24,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1249/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 1.41455075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:24,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43802 samples/s/p 2:48:35 } +2024-07-25 22:22:27,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1251/ 1625], loss: 1.338, per_step_time: 1472ms, lr: 1.4139307e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:27,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% 
|████████████████████████████ | 5.43472 samples/s/p 2:48:38 } +2024-07-25 22:22:30,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1253/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 1.4133103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:30,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43021 samples/s/p 2:48:44 } +2024-07-25 22:22:33,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1255/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 1.4126901e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:33,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43582 samples/s/p 2:48:30 } +2024-07-25 22:22:36,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1257/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 1.4120702e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:36,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43237 samples/s/p 2:48:34 } +2024-07-25 22:22:39,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1259/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.4114499e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:39,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.7% |████████████████████████████ | 5.43365 samples/s/p 2:48:28 } +2024-07-25 22:22:42,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1261/ 1625], loss: 1.102, per_step_time: 1474ms, lr: 1.4108297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:42,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.42609 samples/s/p 2:48:39 } +2024-07-25 22:22:45,235 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1263/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.4102098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:45,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43301 samples/s/p 2:48:24 } +2024-07-25 22:22:48,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1265/ 1625], loss: 1.264, per_step_time: 1471ms, lr: 1.4095896e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:48,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43543 samples/s/p 2:48:16 } +2024-07-25 22:22:51,140 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1267/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 1.4089698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:51,140 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.42844 samples/s/p 2:48:26 } +2024-07-25 22:22:54,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1269/ 1625], loss: 1.280, per_step_time: 1470ms, lr: 1.4083497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:54,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.44166 samples/s/p 2:47:59 } +2024-07-25 22:22:57,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1271/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 1.40773e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:57,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43413 samples/s/p 2:48:10 } +2024-07-25 22:22:59,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1273/ 
1625], loss: 1.070, per_step_time: 1471ms, lr: 1.4071099e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:22:59,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43833 samples/s/p 2:47:59 } +2024-07-25 22:23:02,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1275/ 1625], loss: 1.249, per_step_time: 1471ms, lr: 1.40649e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:02,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.8% |████████████████████████████ | 5.43812 samples/s/p 2:47:57 } +2024-07-25 22:23:05,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1277/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 1.4058703e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:05,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.43429 samples/s/p 2:48:01 } +2024-07-25 22:23:08,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1279/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 1.4052503e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:08,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.43888 samples/s/p 2:47:49 } +2024-07-25 22:23:11,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1281/ 1625], loss: 1.175, per_step_time: 1470ms, lr: 1.4046305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:11,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.43865 samples/s/p 2:47:47 } +2024-07-25 22:23:14,732 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1283/ 1625], loss: 1.002, per_step_time: 1469ms, lr: 1.4040107e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 22:23:14,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.44378 samples/s/p 2:47:34 } +2024-07-25 22:23:17,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1285/ 1625], loss: 1.079, per_step_time: 1470ms, lr: 1.4033908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:17,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.44168 samples/s/p 2:47:35 } +2024-07-25 22:23:20,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1287/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 1.4027712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:20,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.43567 samples/s/p 2:47:43 } +2024-07-25 22:23:23,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1289/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 1.4021515e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:23,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.43228 samples/s/p 2:47:47 } +2024-07-25 22:23:26,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1291/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 1.4015315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:26,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 57.9% |████████████████████████████ | 5.44178 samples/s/p 2:47:26 } +2024-07-25 22:23:29,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1293/ 1625], loss: 1.012, per_step_time: 1473ms, lr: 1.4009121e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:29,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
58.0% |████████████████████████████ | 5.42986 samples/s/p 2:47:45 } +2024-07-25 22:23:32,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1295/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 1.4002926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:32,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.43581 samples/s/p 2:47:31 } +2024-07-25 22:23:35,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1297/ 1625], loss: 1.238, per_step_time: 1470ms, lr: 1.3996728e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:35,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.43965 samples/s/p 2:47:21 } +2024-07-25 22:23:38,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1299/ 1625], loss: 1.187, per_step_time: 1475ms, lr: 1.3990531e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:38,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |████████████████████████████ | 5.42371 samples/s/p 2:47:48 } +2024-07-25 22:23:41,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1301/ 1625], loss: 1.221, per_step_time: 1470ms, lr: 1.3984339e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:41,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.44047 samples/s/p 2:47:14 } +2024-07-25 22:23:44,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1303/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 1.39781405e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:44,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.43907 samples/s/p 2:47:14 } +2024-07-25 
22:23:47,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1305/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.3971946e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:47,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.43275 samples/s/p 2:47:22 } +2024-07-25 22:23:50,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1307/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 1.3965752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:50,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.0% |█████████████████████████████ | 5.43596 samples/s/p 2:47:13 } +2024-07-25 22:23:53,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1309/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 1.3959557e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:53,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43423 samples/s/p 2:47:14 } +2024-07-25 22:23:56,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1311/ 1625], loss: 1.327, per_step_time: 1474ms, lr: 1.3953364e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:56,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.42532 samples/s/p 2:47:27 } +2024-07-25 22:23:58,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1313/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 1.39471695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:23:58,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43751 samples/s/p 2:47:02 } +2024-07-25 22:24:01,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
6/ 10], step:[ 1315/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 1.3940975e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:01,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.44053 samples/s/p 2:46:53 } +2024-07-25 22:24:04,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1317/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 1.3934783e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:04,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43834 samples/s/p 2:46:54 } +2024-07-25 22:24:07,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1319/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 1.3928589e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:07,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43667 samples/s/p 2:46:54 } +2024-07-25 22:24:10,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1321/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 1.3922399e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:10,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43552 samples/s/p 2:46:54 } +2024-07-25 22:24:13,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1323/ 1625], loss: 1.333, per_step_time: 1473ms, lr: 1.3916205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:13,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.1% |█████████████████████████████ | 5.43081 samples/s/p 2:46:59 } +2024-07-25 22:24:16,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1325/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 1.3910014e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:16,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43461 samples/s/p 2:46:49 } +2024-07-25 22:24:19,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1327/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.3903823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:19,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43263 samples/s/p 2:46:50 } +2024-07-25 22:24:22,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1329/ 1625], loss: 1.335, per_step_time: 1470ms, lr: 1.3897629e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:22,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.44145 samples/s/p 2:46:31 } +2024-07-25 22:24:25,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1331/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 1.3891439e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:25,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43512 samples/s/p 2:46:40 } +2024-07-25 22:24:28,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1333/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 1.3885248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:28,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43487 samples/s/p 2:46:37 } +2024-07-25 22:24:31,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1335/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 1.38790565e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:31,446 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43845 samples/s/p 2:46:28 } +2024-07-25 22:24:34,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1337/ 1625], loss: 1.012, per_step_time: 1472ms, lr: 1.3872867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:34,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43227 samples/s/p 2:46:36 } +2024-07-25 22:24:37,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1339/ 1625], loss: 1.116, per_step_time: 1470ms, lr: 1.3866679e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:37,347 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.2% |█████████████████████████████ | 5.43891 samples/s/p 2:46:21 } +2024-07-25 22:24:40,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1341/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 1.3860487e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:40,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43168 samples/s/p 2:46:31 } +2024-07-25 22:24:43,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1343/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.3854297e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:43,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43565 samples/s/p 2:46:21 } +2024-07-25 22:24:46,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1345/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 1.384811e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:46,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% 
|█████████████████████████████ | 5.43612 samples/s/p 2:46:17 } +2024-07-25 22:24:49,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1347/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 1.3841919e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:49,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43553 samples/s/p 2:46:15 } +2024-07-25 22:24:52,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1349/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 1.3835732e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:52,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43145 samples/s/p 2:46:20 } +2024-07-25 22:24:55,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1351/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 1.3829544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:55,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.44207 samples/s/p 2:45:57 } +2024-07-25 22:24:58,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1353/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 1.38233545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:24:58,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.42828 samples/s/p 2:46:20 } +2024-07-25 22:25:00,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1355/ 1625], loss: 0.868, per_step_time: 1471ms, lr: 1.3817168e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:00,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.3% |█████████████████████████████ | 5.43599 samples/s/p 2:46:03 } +2024-07-25 22:25:03,907 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1357/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.3810981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:03,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43354 samples/s/p 2:46:04 } +2024-07-25 22:25:06,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1359/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 1.3804793e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:06,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43832 samples/s/p 2:45:53 } +2024-07-25 22:25:09,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1361/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 1.3798607e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:09,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43416 samples/s/p 2:45:57 } +2024-07-25 22:25:12,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1363/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 1.3792423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:12,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43742 samples/s/p 2:45:48 } +2024-07-25 22:25:15,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1365/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 1.3786234e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:15,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43832 samples/s/p 2:45:44 } +2024-07-25 22:25:18,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], 
step:[ 1367/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 1.3780049e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:18,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43619 samples/s/p 2:45:45 } +2024-07-25 22:25:21,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1369/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 1.3773865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:21,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43388 samples/s/p 2:45:46 } +2024-07-25 22:25:24,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1371/ 1625], loss: 1.344, per_step_time: 1472ms, lr: 1.376768e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:24,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43226 samples/s/p 2:45:46 } +2024-07-25 22:25:27,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1373/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.3761493e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:27,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.4% |█████████████████████████████ | 5.43285 samples/s/p 2:45:42 } +2024-07-25 22:25:30,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1375/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 1.3755311e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:30,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.42981 samples/s/p 2:45:45 } +2024-07-25 22:25:33,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1377/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 1.3749128e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:25:33,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43193 samples/s/p 2:45:38 } +2024-07-25 22:25:36,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1379/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 1.3742942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:36,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.42920 samples/s/p 2:45:40 } +2024-07-25 22:25:39,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1381/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 1.3736759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:39,324 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43645 samples/s/p 2:45:24 } +2024-07-25 22:25:42,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1383/ 1625], loss: 1.228, per_step_time: 1472ms, lr: 1.3730578e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:42,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43447 samples/s/p 2:45:24 } +2024-07-25 22:25:45,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1385/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 1.3724393e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:45,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43463 samples/s/p 2:45:21 } +2024-07-25 22:25:48,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1387/ 1625], loss: 1.092, per_step_time: 1471ms, lr: 1.371821e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:48,175 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43746 samples/s/p 2:45:13 } +2024-07-25 22:25:51,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1389/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.371203e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:51,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.5% |█████████████████████████████ | 5.43809 samples/s/p 2:45:09 } +2024-07-25 22:25:54,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1391/ 1625], loss: 1.341, per_step_time: 1472ms, lr: 1.3705846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:54,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43406 samples/s/p 2:45:13 } +2024-07-25 22:25:57,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1393/ 1625], loss: 1.158, per_step_time: 1473ms, lr: 1.3699666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:57,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43020 samples/s/p 2:45:17 } +2024-07-25 22:25:59,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1395/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.3693485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:25:59,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43231 samples/s/p 2:45:11 } +2024-07-25 22:26:02,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1397/ 1625], loss: 1.101, per_step_time: 1472ms, lr: 1.3687302e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:02,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% 
|█████████████████████████████ | 5.43433 samples/s/p 2:45:04 } +2024-07-25 22:26:05,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1399/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 1.3681123e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:05,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43462 samples/s/p 2:45:00 } +2024-07-25 22:26:08,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1401/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 1.3674943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:08,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43373 samples/s/p 2:44:59 } +2024-07-25 22:26:11,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1403/ 1625], loss: 1.364, per_step_time: 1473ms, lr: 1.366876e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:11,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.42960 samples/s/p 2:45:04 } +2024-07-25 22:26:14,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1405/ 1625], loss: 0.935, per_step_time: 1470ms, lr: 1.3662583e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:14,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.6% |█████████████████████████████ | 5.43921 samples/s/p 2:44:43 } +2024-07-25 22:26:17,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1407/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 1.3656406e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:17,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43490 samples/s/p 2:44:48 } +2024-07-25 22:26:20,639 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1409/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 1.3650226e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:20,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43387 samples/s/p 2:44:47 } +2024-07-25 22:26:23,587 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1411/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 1.3644046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:23,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43899 samples/s/p 2:44:35 } +2024-07-25 22:26:26,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1413/ 1625], loss: 1.189, per_step_time: 1474ms, lr: 1.363787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:26,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.42666 samples/s/p 2:44:54 } +2024-07-25 22:26:29,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1415/ 1625], loss: 1.102, per_step_time: 1475ms, lr: 1.363169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:29,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.42256 samples/s/p 2:44:59 } +2024-07-25 22:26:32,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1417/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.3625513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:32,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43687 samples/s/p 2:44:30 } +2024-07-25 22:26:35,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1419/ 1625], loss: 1.315, per_step_time: 1471ms, lr: 1.3619338e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:35,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43550 samples/s/p 2:44:29 } +2024-07-25 22:26:38,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1421/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 1.3613162e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:38,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.7% |█████████████████████████████ | 5.43646 samples/s/p 2:44:25 } +2024-07-25 22:26:41,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1423/ 1625], loss: 0.930, per_step_time: 1471ms, lr: 1.3606985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:41,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43797 samples/s/p 2:44:19 } +2024-07-25 22:26:44,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1425/ 1625], loss: 1.023, per_step_time: 1471ms, lr: 1.36008075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:44,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43670 samples/s/p 2:44:18 } +2024-07-25 22:26:47,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1427/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 1.3594635e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:47,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.44138 samples/s/p 2:44:07 } +2024-07-25 22:26:50,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1429/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.3588457e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:26:50,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43124 samples/s/p 2:44:22 } +2024-07-25 22:26:53,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1431/ 1625], loss: 1.165, per_step_time: 1473ms, lr: 1.3582282e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:53,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43086 samples/s/p 2:44:20 } +2024-07-25 22:26:56,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1433/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.3576108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:56,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43560 samples/s/p 2:44:09 } +2024-07-25 22:26:59,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1435/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 1.3569933e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:26:59,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43312 samples/s/p 2:44:10 } +2024-07-25 22:27:01,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1437/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 1.356376e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:01,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.8% |█████████████████████████████ | 5.43578 samples/s/p 2:44:02 } +2024-07-25 22:27:04,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1439/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.35575865e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:04,907 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43567 samples/s/p 2:44:00 } +2024-07-25 22:27:07,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1441/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 1.3551411e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:07,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43141 samples/s/p 2:44:04 } +2024-07-25 22:27:10,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1443/ 1625], loss: 1.201, per_step_time: 1474ms, lr: 1.3545241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:10,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.42446 samples/s/p 2:44:14 } +2024-07-25 22:27:13,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1445/ 1625], loss: 1.307, per_step_time: 1471ms, lr: 1.3539068e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:13,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43843 samples/s/p 2:43:46 } +2024-07-25 22:27:16,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1447/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.3532894e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:16,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43724 samples/s/p 2:43:45 } +2024-07-25 22:27:19,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1449/ 1625], loss: 1.323, per_step_time: 1475ms, lr: 1.3526724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:19,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% 
|█████████████████████████████ | 5.42343 samples/s/p 2:44:07 } +2024-07-25 22:27:22,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1451/ 1625], loss: 1.318, per_step_time: 1471ms, lr: 1.3520554e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:22,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43816 samples/s/p 2:43:38 } +2024-07-25 22:27:25,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1453/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.3514381e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:25,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 58.9% |█████████████████████████████ | 5.43536 samples/s/p 2:43:40 } +2024-07-25 22:27:28,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1455/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.350821e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:28,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43316 samples/s/p 2:43:41 } +2024-07-25 22:27:31,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1457/ 1625], loss: 1.119, per_step_time: 1470ms, lr: 1.3502042e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:31,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43871 samples/s/p 2:43:28 } +2024-07-25 22:27:34,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1459/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 1.349587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:34,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.42952 samples/s/p 2:43:41 } +2024-07-25 22:27:37,381 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1461/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 1.34897e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:37,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.42872 samples/s/p 2:43:40 } +2024-07-25 22:27:40,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1463/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 1.3483533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:40,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43259 samples/s/p 2:43:30 } +2024-07-25 22:27:43,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1465/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 1.3477362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:43,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43777 samples/s/p 2:43:18 } +2024-07-25 22:27:46,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1467/ 1625], loss: 1.072, per_step_time: 1474ms, lr: 1.3471195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:46,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.42539 samples/s/p 2:43:37 } +2024-07-25 22:27:49,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1469/ 1625], loss: 1.321, per_step_time: 1472ms, lr: 1.3465027e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:49,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.0% |█████████████████████████████ | 5.43129 samples/s/p 2:43:23 } +2024-07-25 22:27:52,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1471/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 1.3458862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:52,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.43530 samples/s/p 2:43:13 } +2024-07-25 22:27:55,096 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1473/ 1625], loss: 1.191, per_step_time: 1473ms, lr: 1.3452693e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:55,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.42922 samples/s/p 2:43:21 } +2024-07-25 22:27:58,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1475/ 1625], loss: 1.164, per_step_time: 1473ms, lr: 1.34465245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:27:58,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.42886 samples/s/p 2:43:19 } +2024-07-25 22:28:01,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1477/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 1.344036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:01,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.42956 samples/s/p 2:43:15 } +2024-07-25 22:28:03,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1479/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 1.3434192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:03,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.43533 samples/s/p 2:43:01 } +2024-07-25 22:28:06,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1481/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 1.3428028e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:28:06,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.43653 samples/s/p 2:42:56 } +2024-07-25 22:28:09,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1483/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 1.3421862e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:09,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.43189 samples/s/p 2:43:02 } +2024-07-25 22:28:12,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1485/ 1625], loss: 1.308, per_step_time: 1473ms, lr: 1.3415694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:12,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.1% |█████████████████████████████ | 5.42782 samples/s/p 2:43:06 } +2024-07-25 22:28:15,759 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1487/ 1625], loss: 1.019, per_step_time: 1470ms, lr: 1.3409533e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:15,760 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.44001 samples/s/p 2:42:41 } +2024-07-25 22:28:18,708 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1489/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.3403368e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:18,709 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43838 samples/s/p 2:42:41 } +2024-07-25 22:28:21,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1491/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 1.3397202e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:21,662 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43164 samples/s/p 2:42:50 } +2024-07-25 22:28:24,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1493/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 1.3391041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:24,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43640 samples/s/p 2:42:39 } +2024-07-25 22:28:27,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1495/ 1625], loss: 1.274, per_step_time: 1470ms, lr: 1.3384878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:27,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.44021 samples/s/p 2:42:29 } +2024-07-25 22:28:30,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1497/ 1625], loss: 1.022, per_step_time: 1471ms, lr: 1.3378714e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:30,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43580 samples/s/p 2:42:34 } +2024-07-25 22:28:33,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1499/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 1.33725525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:33,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43988 samples/s/p 2:42:24 } +2024-07-25 22:28:36,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1501/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 1.3366392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:36,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% 
|█████████████████████████████ | 5.43799 samples/s/p 2:42:24 } +2024-07-25 22:28:39,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1503/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 1.3360228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:39,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.2% |█████████████████████████████ | 5.43326 samples/s/p 2:42:30 } +2024-07-25 22:28:42,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1505/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.3354069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:42,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43698 samples/s/p 2:42:20 } +2024-07-25 22:28:45,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1507/ 1625], loss: 1.030, per_step_time: 1469ms, lr: 1.3347908e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:45,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.44420 samples/s/p 2:42:04 } +2024-07-25 22:28:48,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1509/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 1.3341745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:48,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43514 samples/s/p 2:42:18 } +2024-07-25 22:28:51,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1511/ 1625], loss: 1.040, per_step_time: 1473ms, lr: 1.3335588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:51,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.42959 samples/s/p 2:42:25 } +2024-07-25 22:28:54,111 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1513/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.3329428e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:54,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43163 samples/s/p 2:42:18 } +2024-07-25 22:28:57,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1515/ 1625], loss: 1.112, per_step_time: 1470ms, lr: 1.3323266e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:28:57,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43986 samples/s/p 2:42:00 } +2024-07-25 22:29:00,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1517/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.331711e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:00,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43836 samples/s/p 2:42:00 } +2024-07-25 22:29:02,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1519/ 1625], loss: 0.962, per_step_time: 1471ms, lr: 1.3310952e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:02,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.3% |█████████████████████████████ | 5.43839 samples/s/p 2:41:57 } +2024-07-25 22:29:05,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1521/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 1.3304794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:05,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43409 samples/s/p 2:42:02 } +2024-07-25 22:29:08,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1523/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 1.3298636e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:08,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.44164 samples/s/p 2:41:45 } +2024-07-25 22:29:11,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1525/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.329248e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:11,810 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43209 samples/s/p 2:42:00 } +2024-07-25 22:29:14,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1527/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.3286323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:14,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43129 samples/s/p 2:41:58 } +2024-07-25 22:29:17,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1529/ 1625], loss: 1.232, per_step_time: 1470ms, lr: 1.3280165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:17,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.44050 samples/s/p 2:41:39 } +2024-07-25 22:29:20,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1531/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 1.3274011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:20,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43167 samples/s/p 2:41:51 } +2024-07-25 22:29:23,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1533/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 1.3267857e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:29:23,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43390 samples/s/p 2:41:45 } +2024-07-25 22:29:26,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1535/ 1625], loss: 1.312, per_step_time: 1473ms, lr: 1.32617e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:26,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.4% |█████████████████████████████ | 5.43068 samples/s/p 2:41:47 } +2024-07-25 22:29:29,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1537/ 1625], loss: 1.220, per_step_time: 1473ms, lr: 1.3255545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:29,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.42991 samples/s/p 2:41:46 } +2024-07-25 22:29:32,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1539/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.3249392e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:32,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43288 samples/s/p 2:41:37 } +2024-07-25 22:29:35,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1541/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 1.3243237e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:35,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43687 samples/s/p 2:41:27 } +2024-07-25 22:29:38,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1543/ 1625], loss: 1.092, per_step_time: 1470ms, lr: 1.3237083e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:38,372 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.44002 samples/s/p 2:41:19 } +2024-07-25 22:29:41,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1545/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.32309315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:41,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43433 samples/s/p 2:41:26 } +2024-07-25 22:29:44,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1547/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 1.3224778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:44,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43156 samples/s/p 2:41:28 } +2024-07-25 22:29:47,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1549/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.3218627e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:47,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43287 samples/s/p 2:41:23 } +2024-07-25 22:29:50,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1551/ 1625], loss: 1.002, per_step_time: 1472ms, lr: 1.3212475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:50,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.5% |█████████████████████████████ | 5.43376 samples/s/p 2:41:18 } +2024-07-25 22:29:53,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1553/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 1.3206322e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:53,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% 
|█████████████████████████████ | 5.43628 samples/s/p 2:41:11 } +2024-07-25 22:29:56,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1555/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 1.3200172e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:56,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.43537 samples/s/p 2:41:09 } +2024-07-25 22:29:59,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1557/ 1625], loss: 1.169, per_step_time: 1473ms, lr: 1.3194022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:29:59,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.43023 samples/s/p 2:41:16 } +2024-07-25 22:30:01,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1559/ 1625], loss: 1.376, per_step_time: 1474ms, lr: 1.31878705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:01,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.42509 samples/s/p 2:41:22 } +2024-07-25 22:30:04,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1561/ 1625], loss: 1.270, per_step_time: 1473ms, lr: 1.3181722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:04,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.42874 samples/s/p 2:41:12 } +2024-07-25 22:30:07,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1563/ 1625], loss: 1.315, per_step_time: 1470ms, lr: 1.3175575e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:07,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.43874 samples/s/p 2:40:52 } +2024-07-25 22:30:10,847 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1565/ 1625], loss: 1.237, per_step_time: 1473ms, lr: 1.3169424e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:10,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.42755 samples/s/p 2:41:09 } +2024-07-25 22:30:13,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1567/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 1.3163276e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:13,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.6% |█████████████████████████████ | 5.43009 samples/s/p 2:41:01 } +2024-07-25 22:30:16,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1569/ 1625], loss: 0.974, per_step_time: 1472ms, lr: 1.315713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:16,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43241 samples/s/p 2:40:54 } +2024-07-25 22:30:19,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1571/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 1.3150981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:19,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43832 samples/s/p 2:40:41 } +2024-07-25 22:30:22,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1573/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 1.3144833e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:22,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43558 samples/s/p 2:40:43 } +2024-07-25 22:30:25,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 
1575/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.3138689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:25,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43570 samples/s/p 2:40:39 } +2024-07-25 22:30:28,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1577/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.3132543e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:28,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43661 samples/s/p 2:40:35 } +2024-07-25 22:30:31,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1579/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 1.3126396e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:31,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43466 samples/s/p 2:40:35 } +2024-07-25 22:30:34,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1581/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.31202505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:34,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.43200 samples/s/p 2:40:37 } +2024-07-25 22:30:37,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1583/ 1625], loss: 1.098, per_step_time: 1473ms, lr: 1.3114108e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:37,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.7% |█████████████████████████████ | 5.42792 samples/s/p 2:40:41 } +2024-07-25 22:30:40,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1585/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 1.3107961e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:30:40,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43439 samples/s/p 2:40:27 } +2024-07-25 22:30:43,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1587/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 1.3101817e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:43,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43408 samples/s/p 2:40:25 } +2024-07-25 22:30:46,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1589/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 1.3095676e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:46,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43835 samples/s/p 2:40:14 } +2024-07-25 22:30:49,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1591/ 1625], loss: 1.035, per_step_time: 1471ms, lr: 1.30895305e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:49,214 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43594 samples/s/p 2:40:16 } +2024-07-25 22:30:52,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1593/ 1625], loss: 1.059, per_step_time: 1475ms, lr: 1.3083389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:52,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.42245 samples/s/p 2:40:36 } +2024-07-25 22:30:55,123 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1595/ 1625], loss: 1.291, per_step_time: 1472ms, lr: 1.3077247e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:55,124 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43291 samples/s/p 2:40:15 } +2024-07-25 22:30:58,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1597/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 1.3071103e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:30:58,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43430 samples/s/p 2:40:10 } +2024-07-25 22:31:01,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1599/ 1625], loss: 1.297, per_step_time: 1473ms, lr: 1.3064964e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:01,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.8% |█████████████████████████████ | 5.43043 samples/s/p 2:40:13 } +2024-07-25 22:31:03,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1601/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 1.3058823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:03,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43295 samples/s/p 2:40:06 } +2024-07-25 22:31:06,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1603/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 1.30526805e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:06,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.44023 samples/s/p 2:39:50 } +2024-07-25 22:31:09,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1605/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.3046542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:09,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% 
|█████████████████████████████ | 5.43469 samples/s/p 2:39:57 } +2024-07-25 22:31:12,831 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1607/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 1.3040404e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:12,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43344 samples/s/p 2:39:56 } +2024-07-25 22:31:15,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1609/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 1.3034263e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:15,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43280 samples/s/p 2:39:55 } +2024-07-25 22:31:18,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1611/ 1625], loss: 1.346, per_step_time: 1472ms, lr: 1.3028125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:18,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43358 samples/s/p 2:39:50 } +2024-07-25 22:31:21,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1613/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 1.3021988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:21,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43437 samples/s/p 2:39:46 } +2024-07-25 22:31:24,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1615/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 1.301585e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:24,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 59.9% |█████████████████████████████ | 5.43531 samples/s/p 2:39:41 } +2024-07-25 22:31:27,584 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1617/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 1.3009712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:27,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.43980 samples/s/p 2:39:30 } +2024-07-25 22:31:30,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1619/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 1.3003577e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:30,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.42978 samples/s/p 2:39:45 } +2024-07-25 22:31:33,491 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1621/ 1625], loss: 1.197, per_step_time: 1473ms, lr: 1.2997442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:33,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.43044 samples/s/p 2:39:41 } +2024-07-25 22:31:36,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1623/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 1.2991304e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:36,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |█████████████████████████████ | 5.43760 samples/s/p 2:39:25 } +2024-07-25 22:31:39,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 6/ 10], step:[ 1625/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 1.2985169e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:39,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.43102 samples/s/p 2:39:34 } +2024-07-25 22:31:42,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
2/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 1.2979036e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:42,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.43671 samples/s/p 2:39:21 } +2024-07-25 22:31:45,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 4/ 1625], loss: 1.063, per_step_time: 1470ms, lr: 1.29729e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:45,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.43933 samples/s/p 2:39:14 } +2024-07-25 22:31:48,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 6/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 1.2966765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:48,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.43562 samples/s/p 2:39:17 } +2024-07-25 22:31:51,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 8/ 1625], loss: 1.054, per_step_time: 1470ms, lr: 1.2960634e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:51,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.0% |██████████████████████████████ | 5.44061 samples/s/p 2:39:05 } +2024-07-25 22:31:54,140 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 10/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 1.2954499e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:31:54,140 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43745 samples/s/p 2:39:08 } +2024-07-25 22:31:57,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 12/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 1.2948367e-05, overflow cond: False, loss_scale: 
1.0 +2024-07-25 22:31:57,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.44000 samples/s/p 2:39:01 } +2024-07-25 22:32:00,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 14/ 1625], loss: 1.305, per_step_time: 1469ms, lr: 1.2942235e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:00,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.44271 samples/s/p 2:38:53 } +2024-07-25 22:32:02,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 16/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 1.2936102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:02,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43532 samples/s/p 2:39:03 } +2024-07-25 22:32:05,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 18/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.2929972e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:05,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43824 samples/s/p 2:38:55 } +2024-07-25 22:32:08,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 20/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 1.29238415e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:08,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43558 samples/s/p 2:38:57 } +2024-07-25 22:32:11,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 22/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 1.2917709e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:11,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 60.1% |██████████████████████████████ | 5.43250 samples/s/p 2:38:59 } +2024-07-25 22:32:14,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 24/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 1.29115815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:14,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.1% |██████████████████████████████ | 5.43513 samples/s/p 2:38:52 } +2024-07-25 22:32:17,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 26/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 1.2905453e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:17,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43290 samples/s/p 2:38:53 } +2024-07-25 22:32:20,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 28/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 1.2899323e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:20,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43711 samples/s/p 2:38:42 } +2024-07-25 22:32:23,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 30/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.2893195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:23,642 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43382 samples/s/p 2:38:45 } +2024-07-25 22:32:26,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 32/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 1.2887069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:26,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43600 samples/s/p 2:38:38 } +2024-07-25 
22:32:29,545 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 34/ 1625], loss: 1.296, per_step_time: 1473ms, lr: 1.288094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:29,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.42981 samples/s/p 2:38:46 } +2024-07-25 22:32:32,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 36/ 1625], loss: 0.999, per_step_time: 1471ms, lr: 1.28748125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:32,497 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.43494 samples/s/p 2:38:34 } +2024-07-25 22:32:35,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 38/ 1625], loss: 1.306, per_step_time: 1473ms, lr: 1.2868688e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:35,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.42956 samples/s/p 2:38:41 } +2024-07-25 22:32:38,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 40/ 1625], loss: 1.321, per_step_time: 1470ms, lr: 1.286256e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:38,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.2% |██████████████████████████████ | 5.44047 samples/s/p 2:38:19 } +2024-07-25 22:32:41,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 42/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 1.2856436e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:41,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43285 samples/s/p 2:38:29 } +2024-07-25 22:32:44,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 
10], step:[ 44/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.2850312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:44,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43565 samples/s/p 2:38:21 } +2024-07-25 22:32:47,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 46/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.2844189e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:47,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43750 samples/s/p 2:38:15 } +2024-07-25 22:32:50,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 48/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 1.2838063e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:50,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43449 samples/s/p 2:38:17 } +2024-07-25 22:32:53,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 50/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 1.2831941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:32:53,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43004 samples/s/p 2:38:22 } +2024-07-25 22:32:53,156 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 22:33:28,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 52/ 1625], loss: 1.058, per_step_time: 2244ms, lr: 1.2825818e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:28,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 3.56388 samples/s/p 4:01:14 } +2024-07-25 22:33:31,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 54/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.2819694e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:31,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43172 samples/s/p 2:38:13 } +2024-07-25 22:33:34,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 56/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 1.2813573e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:34,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.3% |██████████████████████████████ | 5.43021 samples/s/p 2:38:13 } +2024-07-25 22:33:37,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 58/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 1.2807452e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:37,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43170 samples/s/p 2:38:08 } +2024-07-25 22:33:40,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 60/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 1.280133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:40,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43159 samples/s/p 2:38:05 } +2024-07-25 22:33:43,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 62/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 1.2795211e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:43,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43181 samples/s/p 2:38:01 } +2024-07-25 22:33:46,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 64/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 1.2789093e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:46,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43849 samples/s/p 2:37:47 } +2024-07-25 22:33:49,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 66/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 1.2782971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:49,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43318 samples/s/p 2:37:53 } +2024-07-25 22:33:52,557 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 68/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.2776852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:52,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43253 samples/s/p 2:37:51 } +2024-07-25 22:33:55,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 70/ 1625], loss: 1.314, per_step_time: 1471ms, lr: 1.2770735e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:55,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.43496 samples/s/p 2:37:44 } +2024-07-25 22:33:58,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 72/ 1625], loss: 1.026, per_step_time: 1469ms, lr: 1.2764615e-05, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 22:33:58,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.4% |██████████████████████████████ | 5.44439 samples/s/p 2:37:25 } +2024-07-25 22:34:01,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 74/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 1.2758497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:01,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43692 samples/s/p 2:37:35 } +2024-07-25 22:34:04,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 76/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 1.2752383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:04,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43827 samples/s/p 2:37:30 } +2024-07-25 22:34:07,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 78/ 1625], loss: 1.090, per_step_time: 1474ms, lr: 1.27462645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:07,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.42664 samples/s/p 2:37:47 } +2024-07-25 22:34:10,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 80/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.274015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:10,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43786 samples/s/p 2:37:24 } +2024-07-25 22:34:13,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 82/ 1625], loss: 1.343, per_step_time: 1470ms, lr: 1.27340345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:13,207 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43858 samples/s/p 2:37:20 } +2024-07-25 22:34:16,158 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 84/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 1.2727917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:16,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43291 samples/s/p 2:37:27 } +2024-07-25 22:34:19,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 86/ 1625], loss: 1.037, per_step_time: 1472ms, lr: 1.27218045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:19,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43236 samples/s/p 2:37:25 } +2024-07-25 22:34:22,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 88/ 1625], loss: 1.059, per_step_time: 1471ms, lr: 1.2715691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:22,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.5% |██████████████████████████████ | 5.43487 samples/s/p 2:37:18 } +2024-07-25 22:34:25,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 90/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.27095755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:25,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43263 samples/s/p 2:37:19 } +2024-07-25 22:34:27,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 92/ 1625], loss: 0.967, per_step_time: 1471ms, lr: 1.2703464e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:27,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% 
|██████████████████████████████ | 5.43818 samples/s/p 2:37:06 } +2024-07-25 22:34:30,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 94/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 1.2697354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:30,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43706 samples/s/p 2:37:05 } +2024-07-25 22:34:33,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 96/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.2691242e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:33,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43353 samples/s/p 2:37:08 } +2024-07-25 22:34:36,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 98/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 1.2685128e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:37,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43440 samples/s/p 2:37:04 } +2024-07-25 22:34:40,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 100/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 1.2679019e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:40,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43813 samples/s/p 2:36:54 } +2024-07-25 22:34:43,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 102/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 1.2672909e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:43,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.43254 samples/s/p 2:37:01 } +2024-07-25 22:34:46,165 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 104/ 1625], loss: 0.993, per_step_time: 1470ms, lr: 1.2666797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:46,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.6% |██████████████████████████████ | 5.44038 samples/s/p 2:36:45 } +2024-07-25 22:34:49,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 106/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 1.266069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:49,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43379 samples/s/p 2:36:53 } +2024-07-25 22:34:52,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 108/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 1.2654583e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:52,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43359 samples/s/p 2:36:51 } +2024-07-25 22:34:55,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 110/ 1625], loss: 1.074, per_step_time: 1470ms, lr: 1.2648473e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:55,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43883 samples/s/p 2:36:39 } +2024-07-25 22:34:57,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 112/ 1625], loss: 1.006, per_step_time: 1472ms, lr: 1.2642366e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:34:57,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43195 samples/s/p 2:36:48 } +2024-07-25 22:35:00,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
114/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 1.263626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:00,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43339 samples/s/p 2:36:42 } +2024-07-25 22:35:03,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 116/ 1625], loss: 1.261, per_step_time: 1470ms, lr: 1.2630152e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:03,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43970 samples/s/p 2:36:28 } +2024-07-25 22:35:06,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 118/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 1.2624045e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:06,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.43350 samples/s/p 2:36:36 } +2024-07-25 22:35:09,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 120/ 1625], loss: 1.198, per_step_time: 1473ms, lr: 1.2617941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:09,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.7% |██████████████████████████████ | 5.42850 samples/s/p 2:36:42 } +2024-07-25 22:35:12,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 122/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 1.2611835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:12,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43507 samples/s/p 2:36:27 } +2024-07-25 22:35:15,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 124/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 1.2605732e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:35:15,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43225 samples/s/p 2:36:29 } +2024-07-25 22:35:18,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 126/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 1.2599628e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:18,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43692 samples/s/p 2:36:18 } +2024-07-25 22:35:21,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 128/ 1625], loss: 0.983, per_step_time: 1471ms, lr: 1.2593522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:21,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43585 samples/s/p 2:36:17 } +2024-07-25 22:35:24,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 130/ 1625], loss: 0.971, per_step_time: 1470ms, lr: 1.2587421e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:24,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43999 samples/s/p 2:36:07 } +2024-07-25 22:35:27,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 132/ 1625], loss: 1.032, per_step_time: 1471ms, lr: 1.25813185e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:27,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43635 samples/s/p 2:36:10 } +2024-07-25 22:35:30,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 134/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 1.2575216e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:30,428 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43563 samples/s/p 2:36:09 } +2024-07-25 22:35:33,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 136/ 1625], loss: 0.975, per_step_time: 1472ms, lr: 1.2569116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:33,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43455 samples/s/p 2:36:08 } +2024-07-25 22:35:36,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 138/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.2563017e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:36,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.8% |██████████████████████████████ | 5.43136 samples/s/p 2:36:10 } +2024-07-25 22:35:39,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 140/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 1.2556915e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:39,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43645 samples/s/p 2:35:59 } +2024-07-25 22:35:42,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 142/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 1.2550816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:42,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43972 samples/s/p 2:35:50 } +2024-07-25 22:35:45,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 144/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 1.2544717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:45,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% 
|██████████████████████████████ | 5.43162 samples/s/p 2:36:01 } +2024-07-25 22:35:48,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 146/ 1625], loss: 1.033, per_step_time: 1472ms, lr: 1.2538619e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:48,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43444 samples/s/p 2:35:53 } +2024-07-25 22:35:51,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 148/ 1625], loss: 1.145, per_step_time: 1470ms, lr: 1.2532519e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:51,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43988 samples/s/p 2:35:41 } +2024-07-25 22:35:54,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 150/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 1.2526423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:54,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43147 samples/s/p 2:35:52 } +2024-07-25 22:35:56,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 152/ 1625], loss: 1.047, per_step_time: 1471ms, lr: 1.2520328e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:56,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43478 samples/s/p 2:35:44 } +2024-07-25 22:35:59,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 154/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 1.2514231e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:35:59,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 60.9% |██████████████████████████████ | 5.43365 samples/s/p 2:35:43 } +2024-07-25 22:36:02,887 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 156/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 1.2508134e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:02,887 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43702 samples/s/p 2:35:34 } +2024-07-25 22:36:05,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 158/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 1.2502041e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:05,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43319 samples/s/p 2:35:38 } +2024-07-25 22:36:08,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 160/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.2495944e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:08,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43190 samples/s/p 2:35:37 } +2024-07-25 22:36:11,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 162/ 1625], loss: 1.198, per_step_time: 1470ms, lr: 1.248985e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:11,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43961 samples/s/p 2:35:21 } +2024-07-25 22:36:14,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 164/ 1625], loss: 1.026, per_step_time: 1473ms, lr: 1.2483758e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:14,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.42803 samples/s/p 2:35:38 } +2024-07-25 22:36:17,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
166/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 1.2477663e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:17,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43193 samples/s/p 2:35:28 } +2024-07-25 22:36:20,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 168/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.24715725e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:20,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.43334 samples/s/p 2:35:23 } +2024-07-25 22:36:23,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 170/ 1625], loss: 1.299, per_step_time: 1473ms, lr: 1.2465481e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:23,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.0% |██████████████████████████████ | 5.42783 samples/s/p 2:35:29 } +2024-07-25 22:36:26,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 172/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 1.2459387e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:26,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43170 samples/s/p 2:35:20 } +2024-07-25 22:36:29,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 174/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 1.2453298e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:29,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43432 samples/s/p 2:35:12 } +2024-07-25 22:36:32,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 176/ 1625], loss: 1.009, per_step_time: 1472ms, lr: 1.2447208e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:36:32,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43337 samples/s/p 2:35:11 } +2024-07-25 22:36:35,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 178/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 1.2441116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:35,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.42916 samples/s/p 2:35:15 } +2024-07-25 22:36:38,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 180/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 1.2435029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:38,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43740 samples/s/p 2:34:58 } +2024-07-25 22:36:41,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 182/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.2428942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:41,265 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43324 samples/s/p 2:35:02 } +2024-07-25 22:36:44,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 184/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 1.2422852e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:44,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43592 samples/s/p 2:34:55 } +2024-07-25 22:36:47,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 186/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 1.24167655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:47,166 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.1% |██████████████████████████████ | 5.43519 samples/s/p 2:34:53 } +2024-07-25 22:36:50,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 188/ 1625], loss: 1.239, per_step_time: 1470ms, lr: 1.241068e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:50,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43921 samples/s/p 2:34:43 } +2024-07-25 22:36:53,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 190/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 1.2404592e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:53,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43215 samples/s/p 2:34:52 } +2024-07-25 22:36:56,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 192/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.23985055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:56,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43200 samples/s/p 2:34:50 } +2024-07-25 22:36:58,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 194/ 1625], loss: 1.022, per_step_time: 1471ms, lr: 1.2392423e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:36:58,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43802 samples/s/p 2:34:36 } +2024-07-25 22:37:01,917 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 196/ 1625], loss: 0.987, per_step_time: 1471ms, lr: 1.2386339e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:01,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% 
|██████████████████████████████ | 5.43631 samples/s/p 2:34:36 } +2024-07-25 22:37:04,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 198/ 1625], loss: 1.417, per_step_time: 1473ms, lr: 1.2380254e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:04,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43028 samples/s/p 2:34:44 } +2024-07-25 22:37:07,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 200/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 1.237417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:07,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43728 samples/s/p 2:34:29 } +2024-07-25 22:37:10,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 202/ 1625], loss: 1.109, per_step_time: 1470ms, lr: 1.2368088e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:10,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.2% |██████████████████████████████ | 5.43903 samples/s/p 2:34:23 } +2024-07-25 22:37:13,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 204/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 1.2362005e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:13,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.43138 samples/s/p 2:34:33 } +2024-07-25 22:37:16,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 206/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 1.2355923e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:16,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.43611 samples/s/p 2:34:22 } +2024-07-25 22:37:19,619 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 208/ 1625], loss: 1.164, per_step_time: 1470ms, lr: 1.2349844e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:19,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.44074 samples/s/p 2:34:11 } +2024-07-25 22:37:22,571 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 210/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 1.2343762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:22,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.43341 samples/s/p 2:34:21 } +2024-07-25 22:37:25,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 212/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.2337684e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:25,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.43545 samples/s/p 2:34:14 } +2024-07-25 22:37:28,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 214/ 1625], loss: 1.160, per_step_time: 1474ms, lr: 1.2331604e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:28,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.42585 samples/s/p 2:34:28 } +2024-07-25 22:37:31,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 216/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 1.2325523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:31,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.42998 samples/s/p 2:34:18 } +2024-07-25 22:37:34,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
218/ 1625], loss: 1.169, per_step_time: 1474ms, lr: 1.2319448e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:34,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.3% |██████████████████████████████ | 5.42611 samples/s/p 2:34:21 } +2024-07-25 22:37:37,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 220/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 1.2313371e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:37,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43528 samples/s/p 2:34:03 } +2024-07-25 22:37:40,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 222/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 1.2307292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:40,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.42846 samples/s/p 2:34:11 } +2024-07-25 22:37:43,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 224/ 1625], loss: 0.964, per_step_time: 1483ms, lr: 1.2301216e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:43,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.39224 samples/s/p 2:35:11 } +2024-07-25 22:37:46,218 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 226/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 1.22951415e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:46,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43619 samples/s/p 2:33:52 } +2024-07-25 22:37:49,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 228/ 1625], loss: 1.149, per_step_time: 1469ms, lr: 1.2289065e-05, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 22:37:49,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.44316 samples/s/p 2:33:38 } +2024-07-25 22:37:52,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 230/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 1.2282991e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:52,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43611 samples/s/p 2:33:47 } +2024-07-25 22:37:55,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 232/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 1.2276918e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:55,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43766 samples/s/p 2:33:41 } +2024-07-25 22:37:58,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 234/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 1.2270843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:37:58,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.4% |██████████████████████████████ | 5.43341 samples/s/p 2:33:45 } +2024-07-25 22:38:00,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 236/ 1625], loss: 1.137, per_step_time: 1470ms, lr: 1.2264772e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:00,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.44184 samples/s/p 2:33:28 } +2024-07-25 22:38:03,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 238/ 1625], loss: 1.280, per_step_time: 1472ms, lr: 1.2258699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:03,915 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43260 samples/s/p 2:33:41 } +2024-07-25 22:38:06,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 240/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.2252626e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:06,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43125 samples/s/p 2:33:40 } +2024-07-25 22:38:09,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 242/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 1.2246556e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:09,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43796 samples/s/p 2:33:26 } +2024-07-25 22:38:12,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 244/ 1625], loss: 1.029, per_step_time: 1472ms, lr: 1.2240485e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:12,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43454 samples/s/p 2:33:29 } +2024-07-25 22:38:15,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 246/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 1.2234417e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:15,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43068 samples/s/p 2:33:32 } +2024-07-25 22:38:18,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 248/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.2228347e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:18,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% 
|██████████████████████████████ | 5.43771 samples/s/p 2:33:17 } +2024-07-25 22:38:21,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 250/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 1.222228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:21,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.5% |██████████████████████████████ | 5.43490 samples/s/p 2:33:19 } +2024-07-25 22:38:24,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 252/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 1.2216211e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:24,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43291 samples/s/p 2:33:20 } +2024-07-25 22:38:27,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 254/ 1625], loss: 1.171, per_step_time: 1485ms, lr: 1.2210142e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:27,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.38615 samples/s/p 2:34:37 } +2024-07-25 22:38:30,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 256/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 1.22040765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:30,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43711 samples/s/p 2:33:07 } +2024-07-25 22:38:33,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 258/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 1.2198011e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:33,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43305 samples/s/p 2:33:11 } +2024-07-25 22:38:36,401 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 260/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 1.2191943e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:36,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43797 samples/s/p 2:32:59 } +2024-07-25 22:38:39,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 262/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 1.218588e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:39,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43242 samples/s/p 2:33:06 } +2024-07-25 22:38:42,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 264/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.21798175e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:42,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43651 samples/s/p 2:32:56 } +2024-07-25 22:38:45,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 266/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 1.2173752e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:45,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43012 samples/s/p 2:33:04 } +2024-07-25 22:38:48,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 268/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 1.2167689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:48,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.6% |██████████████████████████████ | 5.43845 samples/s/p 2:32:47 } +2024-07-25 22:38:51,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], 
step:[ 270/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 1.2161628e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:51,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.44151 samples/s/p 2:32:39 } +2024-07-25 22:38:54,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 272/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.2155563e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:54,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43507 samples/s/p 2:32:47 } +2024-07-25 22:38:57,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 274/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 1.2149503e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:38:57,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43151 samples/s/p 2:32:50 } +2024-07-25 22:39:00,006 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 276/ 1625], loss: 1.289, per_step_time: 1471ms, lr: 1.2143444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:00,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43836 samples/s/p 2:32:35 } +2024-07-25 22:39:02,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 278/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.2137382e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:02,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43605 samples/s/p 2:32:36 } +2024-07-25 22:39:05,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 280/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 1.2131324e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:39:05,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43856 samples/s/p 2:32:29 } +2024-07-25 22:39:08,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 282/ 1625], loss: 0.942, per_step_time: 1471ms, lr: 1.2125265e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:08,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43558 samples/s/p 2:32:31 } +2024-07-25 22:39:11,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 284/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 1.2119205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:11,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.7% |██████████████████████████████ | 5.43608 samples/s/p 2:32:27 } +2024-07-25 22:39:14,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 286/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 1.2113149e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:14,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.42761 samples/s/p 2:32:39 } +2024-07-25 22:39:17,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 288/ 1625], loss: 1.149, per_step_time: 1473ms, lr: 1.2107092e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:17,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.42990 samples/s/p 2:32:32 } +2024-07-25 22:39:20,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 290/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 1.2101034e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:20,667 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.43180 samples/s/p 2:32:26 } +2024-07-25 22:39:23,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 292/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 1.209498e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:23,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.43439 samples/s/p 2:32:18 } +2024-07-25 22:39:26,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 294/ 1625], loss: 1.100, per_step_time: 1474ms, lr: 1.2088927e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:26,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.42684 samples/s/p 2:32:28 } +2024-07-25 22:39:29,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 296/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.2082872e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:29,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.43608 samples/s/p 2:32:10 } +2024-07-25 22:39:32,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 298/ 1625], loss: 1.039, per_step_time: 1472ms, lr: 1.2076816e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:32,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% |██████████████████████████████ | 5.43191 samples/s/p 2:32:14 } +2024-07-25 22:39:35,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 300/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 1.20707655e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:35,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.8% 
|██████████████████████████████ | 5.43665 samples/s/p 2:32:03 } +2024-07-25 22:39:38,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 302/ 1625], loss: 1.079, per_step_time: 1471ms, lr: 1.2064713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:38,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.43511 samples/s/p 2:32:02 } +2024-07-25 22:39:41,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 304/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.2058658e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:41,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.43671 samples/s/p 2:31:57 } +2024-07-25 22:39:44,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 306/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 1.2052609e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:44,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.43383 samples/s/p 2:31:59 } +2024-07-25 22:39:47,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 308/ 1625], loss: 1.281, per_step_time: 1473ms, lr: 1.204656e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:47,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.42983 samples/s/p 2:32:02 } +2024-07-25 22:39:50,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 310/ 1625], loss: 1.238, per_step_time: 1469ms, lr: 1.2040508e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:50,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.44238 samples/s/p 2:31:38 } +2024-07-25 22:39:53,129 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 312/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 1.2034459e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:53,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.43710 samples/s/p 2:31:44 } +2024-07-25 22:39:56,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 314/ 1625], loss: 1.315, per_step_time: 1470ms, lr: 1.2028412e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:56,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.43964 samples/s/p 2:31:37 } +2024-07-25 22:39:59,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 316/ 1625], loss: 1.227, per_step_time: 1473ms, lr: 1.2022362e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:39:59,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 61.9% |██████████████████████████████ | 5.42951 samples/s/p 2:31:51 } +2024-07-25 22:40:01,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 318/ 1625], loss: 0.986, per_step_time: 1471ms, lr: 1.2016315e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:01,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.43679 samples/s/p 2:31:36 } +2024-07-25 22:40:04,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 320/ 1625], loss: 1.050, per_step_time: 1470ms, lr: 1.20102695e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:04,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.43979 samples/s/p 2:31:28 } +2024-07-25 22:40:07,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 
322/ 1625], loss: 1.316, per_step_time: 1473ms, lr: 1.2004221e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:07,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.42997 samples/s/p 2:31:42 } +2024-07-25 22:40:10,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 324/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 1.1998178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:10,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |██████████████████████████████ | 5.43199 samples/s/p 2:31:35 } +2024-07-25 22:40:13,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 326/ 1625], loss: 1.243, per_step_time: 1471ms, lr: 1.1992133e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:13,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.43750 samples/s/p 2:31:23 } +2024-07-25 22:40:16,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 328/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.1986087e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:16,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.43539 samples/s/p 2:31:24 } +2024-07-25 22:40:19,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 330/ 1625], loss: 1.036, per_step_time: 1472ms, lr: 1.1980044e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:19,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.43196 samples/s/p 2:31:26 } +2024-07-25 22:40:22,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 332/ 1625], loss: 1.238, per_step_time: 1474ms, lr: 1.1974002e-05, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 22:40:22,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.0% |███████████████████████████████ | 5.42739 samples/s/p 2:31:31 } +2024-07-25 22:40:25,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 334/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.1967958e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:25,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43300 samples/s/p 2:31:19 } +2024-07-25 22:40:28,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 336/ 1625], loss: 1.379, per_step_time: 1472ms, lr: 1.1961917e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:28,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43366 samples/s/p 2:31:15 } +2024-07-25 22:40:31,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 338/ 1625], loss: 0.951, per_step_time: 1471ms, lr: 1.1955879e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:31,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43667 samples/s/p 2:31:07 } +2024-07-25 22:40:34,448 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 340/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.1949837e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:34,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43462 samples/s/p 2:31:07 } +2024-07-25 22:40:37,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 342/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 1.1943797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:37,400 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43475 samples/s/p 2:31:04 } +2024-07-25 22:40:40,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 344/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 1.1937759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:40,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43267 samples/s/p 2:31:05 } +2024-07-25 22:40:43,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 346/ 1625], loss: 1.162, per_step_time: 1473ms, lr: 1.1931721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:43,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43102 samples/s/p 2:31:04 } +2024-07-25 22:40:46,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 348/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.1925681e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:46,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.1% |███████████████████████████████ | 5.43615 samples/s/p 2:30:53 } +2024-07-25 22:40:49,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 350/ 1625], loss: 1.044, per_step_time: 1473ms, lr: 1.1919647e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:49,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.42799 samples/s/p 2:31:04 } +2024-07-25 22:40:52,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 352/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 1.1913612e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:52,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% 
|███████████████████████████████ | 5.43317 samples/s/p 2:30:52 } +2024-07-25 22:40:55,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 354/ 1625], loss: 1.036, per_step_time: 1472ms, lr: 1.1907574e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:55,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43342 samples/s/p 2:30:49 } +2024-07-25 22:40:58,059 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 356/ 1625], loss: 1.104, per_step_time: 1469ms, lr: 1.1901539e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:40:58,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.44233 samples/s/p 2:30:31 } +2024-07-25 22:41:01,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 358/ 1625], loss: 1.109, per_step_time: 1473ms, lr: 1.1895506e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:01,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43049 samples/s/p 2:30:48 } +2024-07-25 22:41:03,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 360/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 1.1889471e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:03,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43711 samples/s/p 2:30:34 } +2024-07-25 22:41:06,912 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 362/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 1.1883438e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:06,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43538 samples/s/p 2:30:34 } +2024-07-25 
22:41:09,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 364/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 1.1877407e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:09,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.2% |███████████████████████████████ | 5.43203 samples/s/p 2:30:36 } +2024-07-25 22:41:12,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 366/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 1.1871373e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:12,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43487 samples/s/p 2:30:29 } +2024-07-25 22:41:15,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 368/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 1.1865344e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:15,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43476 samples/s/p 2:30:26 } +2024-07-25 22:41:18,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 370/ 1625], loss: 1.003, per_step_time: 1472ms, lr: 1.1859313e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:18,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43325 samples/s/p 2:30:25 } +2024-07-25 22:41:21,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 372/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 1.1853283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:21,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43866 samples/s/p 2:30:13 } +2024-07-25 22:41:24,620 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 374/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 1.1847255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:24,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43262 samples/s/p 2:30:21 } +2024-07-25 22:41:27,572 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 376/ 1625], loss: 0.970, per_step_time: 1472ms, lr: 1.1841228e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:27,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43239 samples/s/p 2:30:18 } +2024-07-25 22:41:30,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 378/ 1625], loss: 1.223, per_step_time: 1473ms, lr: 1.1835199e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:30,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.43100 samples/s/p 2:30:17 } +2024-07-25 22:41:33,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 380/ 1625], loss: 1.070, per_step_time: 1473ms, lr: 1.1829171e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:33,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.3% |███████████████████████████████ | 5.42826 samples/s/p 2:30:19 } +2024-07-25 22:41:36,429 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 382/ 1625], loss: 1.006, per_step_time: 1471ms, lr: 1.1823147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:36,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43684 samples/s/p 2:30:02 } +2024-07-25 22:41:39,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 384/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 
1.181712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:39,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.44014 samples/s/p 2:29:53 } +2024-07-25 22:41:42,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 386/ 1625], loss: 1.296, per_step_time: 1471ms, lr: 1.1811094e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:42,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43583 samples/s/p 2:29:58 } +2024-07-25 22:41:45,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 388/ 1625], loss: 1.060, per_step_time: 1468ms, lr: 1.1805072e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:45,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.44621 samples/s/p 2:29:37 } +2024-07-25 22:41:48,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 390/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 1.1799047e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:48,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43324 samples/s/p 2:29:56 } +2024-07-25 22:41:51,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 392/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 1.1793026e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:51,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43628 samples/s/p 2:29:48 } +2024-07-25 22:41:54,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 394/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 1.1787003e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:54,126 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43412 samples/s/p 2:29:49 } +2024-07-25 22:41:57,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 396/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 1.1780983e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:41:57,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43396 samples/s/p 2:29:46 } +2024-07-25 22:42:00,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 398/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.1774961e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:00,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.4% |███████████████████████████████ | 5.43214 samples/s/p 2:29:46 } +2024-07-25 22:42:02,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 400/ 1625], loss: 1.342, per_step_time: 1472ms, lr: 1.1768941e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:02,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43140 samples/s/p 2:29:44 } +2024-07-25 22:42:05,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 402/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 1.17629215e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:05,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43694 samples/s/p 2:29:32 } +2024-07-25 22:42:08,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 404/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.17569025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:08,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% 
|███████████████████████████████ | 5.43509 samples/s/p 2:29:32 } +2024-07-25 22:42:11,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 406/ 1625], loss: 1.292, per_step_time: 1472ms, lr: 1.1750886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:11,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43241 samples/s/p 2:29:34 } +2024-07-25 22:42:14,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 408/ 1625], loss: 1.109, per_step_time: 1469ms, lr: 1.1744868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:14,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.44265 samples/s/p 2:29:14 } +2024-07-25 22:42:17,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 410/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 1.173885e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:17,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.44034 samples/s/p 2:29:15 } +2024-07-25 22:42:20,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 412/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 1.17328345e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:20,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43240 samples/s/p 2:29:25 } +2024-07-25 22:42:23,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 414/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.1726819e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:23,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.5% |███████████████████████████████ | 5.43333 samples/s/p 2:29:20 } +2024-07-25 
22:42:26,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 416/ 1625], loss: 1.134, per_step_time: 1482ms, lr: 1.1720804e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:26,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.39651 samples/s/p 2:30:19 } +2024-07-25 22:42:29,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 418/ 1625], loss: 1.040, per_step_time: 1471ms, lr: 1.1714791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:29,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.43602 samples/s/p 2:29:10 } +2024-07-25 22:42:32,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 420/ 1625], loss: 1.119, per_step_time: 1473ms, lr: 1.1708779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:32,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.42769 samples/s/p 2:29:21 } +2024-07-25 22:42:35,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 422/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 1.1702766e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:35,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.43114 samples/s/p 2:29:12 } +2024-07-25 22:42:38,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 424/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 1.1696753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:38,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.43651 samples/s/p 2:29:01 } +2024-07-25 22:42:41,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 426/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.1690743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:41,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.43367 samples/s/p 2:29:02 } +2024-07-25 22:42:44,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 428/ 1625], loss: 1.312, per_step_time: 1477ms, lr: 1.1684731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:44,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.41612 samples/s/p 2:29:28 } +2024-07-25 22:42:47,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 430/ 1625], loss: 1.188, per_step_time: 1470ms, lr: 1.1678721e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:47,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.6% |███████████████████████████████ | 5.43924 samples/s/p 2:28:47 } +2024-07-25 22:42:50,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 432/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 1.1672715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:50,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43494 samples/s/p 2:28:51 } +2024-07-25 22:42:53,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 434/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.1666704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:53,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43327 samples/s/p 2:28:51 } +2024-07-25 22:42:56,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 436/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 
1.1660698e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:56,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43392 samples/s/p 2:28:47 } +2024-07-25 22:42:59,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 438/ 1625], loss: 1.297, per_step_time: 1472ms, lr: 1.1654692e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:42:59,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43408 samples/s/p 2:28:44 } +2024-07-25 22:43:02,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 440/ 1625], loss: 1.124, per_step_time: 1471ms, lr: 1.16486835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:02,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43553 samples/s/p 2:28:39 } +2024-07-25 22:43:04,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 442/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.164268e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:04,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43772 samples/s/p 2:28:32 } +2024-07-25 22:43:07,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 444/ 1625], loss: 0.998, per_step_time: 1471ms, lr: 1.1636675e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:07,930 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43603 samples/s/p 2:28:32 } +2024-07-25 22:43:10,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 446/ 1625], loss: 1.330, per_step_time: 1472ms, lr: 1.1630674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:10,881 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.7% |███████████████████████████████ | 5.43409 samples/s/p 2:28:32 } +2024-07-25 22:43:13,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 448/ 1625], loss: 1.176, per_step_time: 1472ms, lr: 1.1624667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:13,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43261 samples/s/p 2:28:32 } +2024-07-25 22:43:16,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 450/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 1.1618667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:16,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43339 samples/s/p 2:28:27 } +2024-07-25 22:43:19,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 452/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.1612665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:19,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43500 samples/s/p 2:28:22 } +2024-07-25 22:43:22,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 454/ 1625], loss: 1.051, per_step_time: 1470ms, lr: 1.1606662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:22,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43929 samples/s/p 2:28:12 } +2024-07-25 22:43:25,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 456/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 1.1600662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:25,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% 
|███████████████████████████████ | 5.44052 samples/s/p 2:28:07 } +2024-07-25 22:43:28,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 458/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 1.1594662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:28,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43300 samples/s/p 2:28:16 } +2024-07-25 22:43:31,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 460/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.1588663e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:31,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43775 samples/s/p 2:28:06 } +2024-07-25 22:43:34,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 462/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 1.1582666e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:34,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.8% |███████████████████████████████ | 5.43764 samples/s/p 2:28:03 } +2024-07-25 22:43:37,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 464/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 1.157667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:37,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.44104 samples/s/p 2:27:54 } +2024-07-25 22:43:40,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 466/ 1625], loss: 1.144, per_step_time: 1470ms, lr: 1.1570671e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:40,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.44103 samples/s/p 2:27:51 } +2024-07-25 
22:43:43,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 468/ 1625], loss: 1.305, per_step_time: 1474ms, lr: 1.1564674e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:43,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.42487 samples/s/p 2:28:15 } +2024-07-25 22:43:46,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 470/ 1625], loss: 1.021, per_step_time: 1469ms, lr: 1.1558682e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:46,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.44223 samples/s/p 2:27:44 } +2024-07-25 22:43:49,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 472/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.15526855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:49,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.43270 samples/s/p 2:27:56 } +2024-07-25 22:43:52,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 474/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.1546691e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:52,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.43488 samples/s/p 2:27:50 } +2024-07-25 22:43:55,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 476/ 1625], loss: 1.129, per_step_time: 1473ms, lr: 1.1540699e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:55,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.42968 samples/s/p 2:27:55 } +2024-07-25 22:43:58,088 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 478/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 1.1534705e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:43:58,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 62.9% |███████████████████████████████ | 5.43740 samples/s/p 2:27:40 } +2024-07-25 22:44:01,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 480/ 1625], loss: 1.042, per_step_time: 1471ms, lr: 1.1528715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:01,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43555 samples/s/p 2:27:40 } +2024-07-25 22:44:03,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 482/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 1.1522724e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:03,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43698 samples/s/p 2:27:34 } +2024-07-25 22:44:06,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 484/ 1625], loss: 1.166, per_step_time: 1470ms, lr: 1.1516731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:06,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43983 samples/s/p 2:27:27 } +2024-07-25 22:44:09,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 486/ 1625], loss: 1.041, per_step_time: 1472ms, lr: 1.1510744e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:09,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43360 samples/s/p 2:27:34 } +2024-07-25 22:44:12,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 488/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 
1.1504755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:12,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43921 samples/s/p 2:27:22 } +2024-07-25 22:44:15,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 490/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.1498765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:15,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43270 samples/s/p 2:27:30 } +2024-07-25 22:44:18,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 492/ 1625], loss: 1.266, per_step_time: 1473ms, lr: 1.149278e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:18,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.42868 samples/s/p 2:27:33 } +2024-07-25 22:44:21,696 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 494/ 1625], loss: 1.193, per_step_time: 1473ms, lr: 1.1486794e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:21,696 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.0% |███████████████████████████████ | 5.43036 samples/s/p 2:27:28 } +2024-07-25 22:44:24,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 496/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 1.1480808e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:24,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.43417 samples/s/p 2:27:18 } +2024-07-25 22:44:27,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 498/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 1.1474822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:27,601 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.42866 samples/s/p 2:27:24 } +2024-07-25 22:44:30,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 500/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 1.1468839e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:30,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.42997 samples/s/p 2:27:19 } +2024-07-25 22:44:33,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 502/ 1625], loss: 1.107, per_step_time: 1473ms, lr: 1.1462855e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:33,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.42806 samples/s/p 2:27:19 } +2024-07-25 22:44:36,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 504/ 1625], loss: 1.083, per_step_time: 1473ms, lr: 1.1456871e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:36,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.42918 samples/s/p 2:27:15 } +2024-07-25 22:44:39,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 506/ 1625], loss: 1.135, per_step_time: 1482ms, lr: 1.145089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:39,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.39791 samples/s/p 2:28:03 } +2024-07-25 22:44:42,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 508/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 1.144491e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:42,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% 
|███████████████████████████████ | 5.42910 samples/s/p 2:27:09 } +2024-07-25 22:44:45,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 510/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 1.1438929e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:45,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.1% |███████████████████████████████ | 5.43343 samples/s/p 2:26:59 } +2024-07-25 22:44:48,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 512/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 1.1432948e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:48,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43750 samples/s/p 2:26:49 } +2024-07-25 22:44:51,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 514/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 1.1426971e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:51,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43346 samples/s/p 2:26:53 } +2024-07-25 22:44:54,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 516/ 1625], loss: 1.334, per_step_time: 1470ms, lr: 1.142099e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:54,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.44159 samples/s/p 2:26:37 } +2024-07-25 22:44:57,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 518/ 1625], loss: 1.101, per_step_time: 1469ms, lr: 1.14150125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:44:57,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.44247 samples/s/p 2:26:33 } +2024-07-25 
22:45:00,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 520/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 1.1409037e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:00,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43632 samples/s/p 2:26:40 } +2024-07-25 22:45:03,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 522/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 1.140306e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:03,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43831 samples/s/p 2:26:33 } +2024-07-25 22:45:05,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 524/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.1397086e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:05,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43784 samples/s/p 2:26:31 } +2024-07-25 22:45:08,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 526/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 1.1391111e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:08,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43387 samples/s/p 2:26:35 } +2024-07-25 22:45:11,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 528/ 1625], loss: 1.398, per_step_time: 1471ms, lr: 1.1385136e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:11,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.2% |███████████████████████████████ | 5.43738 samples/s/p 2:26:26 } +2024-07-25 22:45:14,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 530/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 1.1379165e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:14,834 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.44011 samples/s/p 2:26:19 } +2024-07-25 22:45:17,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 532/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 1.1373192e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:17,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.43917 samples/s/p 2:26:17 } +2024-07-25 22:45:20,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 534/ 1625], loss: 1.329, per_step_time: 1471ms, lr: 1.136722e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:20,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.43562 samples/s/p 2:26:20 } +2024-07-25 22:45:23,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 536/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.136125e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:23,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.43310 samples/s/p 2:26:21 } +2024-07-25 22:45:26,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 538/ 1625], loss: 1.158, per_step_time: 1474ms, lr: 1.13552815e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:26,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.42703 samples/s/p 2:26:28 } +2024-07-25 22:45:29,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 540/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 
1.134931e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:29,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.43167 samples/s/p 2:26:18 } +2024-07-25 22:45:32,540 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 542/ 1625], loss: 1.105, per_step_time: 1470ms, lr: 1.1343341e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:32,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.44175 samples/s/p 2:25:58 } +2024-07-25 22:45:35,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 544/ 1625], loss: 1.318, per_step_time: 1472ms, lr: 1.1337375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:35,492 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.3% |███████████████████████████████ | 5.43290 samples/s/p 2:26:10 } +2024-07-25 22:45:38,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 546/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 1.1331409e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:38,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43003 samples/s/p 2:26:11 } +2024-07-25 22:45:41,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 548/ 1625], loss: 1.302, per_step_time: 1471ms, lr: 1.1325442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:41,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43736 samples/s/p 2:25:57 } +2024-07-25 22:45:44,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 550/ 1625], loss: 1.204, per_step_time: 1473ms, lr: 1.13194765e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:44,348 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43108 samples/s/p 2:26:04 } +2024-07-25 22:45:47,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 552/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.1313513e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:47,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43837 samples/s/p 2:25:49 } +2024-07-25 22:45:50,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 554/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 1.13075475e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:50,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43454 samples/s/p 2:25:52 } +2024-07-25 22:45:53,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 556/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 1.1301585e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:53,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.43718 samples/s/p 2:25:45 } +2024-07-25 22:45:56,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 558/ 1625], loss: 1.312, per_step_time: 1473ms, lr: 1.1295624e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:56,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% |███████████████████████████████ | 5.42993 samples/s/p 2:25:54 } +2024-07-25 22:45:59,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 560/ 1625], loss: 1.206, per_step_time: 1472ms, lr: 1.1289661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:45:59,102 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.4% 
|███████████████████████████████ | 5.43306 samples/s/p 2:25:46 } +2024-07-25 22:46:02,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 562/ 1625], loss: 1.105, per_step_time: 1470ms, lr: 1.12837015e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:02,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.44140 samples/s/p 2:25:30 } +2024-07-25 22:46:05,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 564/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 1.1277741e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:05,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43323 samples/s/p 2:25:40 } +2024-07-25 22:46:07,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 566/ 1625], loss: 1.033, per_step_time: 1472ms, lr: 1.127178e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:07,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43322 samples/s/p 2:25:37 } +2024-07-25 22:46:10,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 568/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 1.1265823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:10,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43816 samples/s/p 2:25:26 } +2024-07-25 22:46:13,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 570/ 1625], loss: 1.018, per_step_time: 1471ms, lr: 1.1259866e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:13,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43658 samples/s/p 2:25:26 } +2024-07-25 
22:46:16,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 572/ 1625], loss: 1.291, per_step_time: 1472ms, lr: 1.1253907e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:16,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43455 samples/s/p 2:25:26 } +2024-07-25 22:46:19,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 574/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 1.1247953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:19,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43779 samples/s/p 2:25:18 } +2024-07-25 22:46:22,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 576/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 1.1241998e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:22,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.5% |███████████████████████████████ | 5.43648 samples/s/p 2:25:17 } +2024-07-25 22:46:25,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 578/ 1625], loss: 1.229, per_step_time: 1474ms, lr: 1.1236043e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:25,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.42699 samples/s/p 2:25:29 } +2024-07-25 22:46:28,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 580/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.1230089e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:28,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43449 samples/s/p 2:25:14 } +2024-07-25 22:46:31,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 582/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 1.1224138e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:31,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.42755 samples/s/p 2:25:22 } +2024-07-25 22:46:34,514 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 584/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 1.1218183e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:34,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43552 samples/s/p 2:25:07 } +2024-07-25 22:46:37,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 586/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 1.12122325e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:37,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43159 samples/s/p 2:25:10 } +2024-07-25 22:46:40,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 588/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.12062835e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:40,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43740 samples/s/p 2:24:58 } +2024-07-25 22:46:43,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 590/ 1625], loss: 1.133, per_step_time: 1473ms, lr: 1.1200332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:43,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43101 samples/s/p 2:25:05 } +2024-07-25 22:46:46,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 592/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 
1.1194385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:46,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.6% |███████████████████████████████ | 5.43499 samples/s/p 2:24:56 } +2024-07-25 22:46:49,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 594/ 1625], loss: 0.902, per_step_time: 1469ms, lr: 1.11884365e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:49,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.44500 samples/s/p 2:24:37 } +2024-07-25 22:46:52,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 596/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.118249e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:52,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.43661 samples/s/p 2:24:47 } +2024-07-25 22:46:55,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 598/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 1.1176542e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:55,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.43912 samples/s/p 2:24:40 } +2024-07-25 22:46:58,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 600/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 1.1170596e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:46:58,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.43076 samples/s/p 2:24:51 } +2024-07-25 22:47:01,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 602/ 1625], loss: 1.317, per_step_time: 1474ms, lr: 1.1164652e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:01,074 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.42617 samples/s/p 2:24:55 } +2024-07-25 22:47:04,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 604/ 1625], loss: 1.273, per_step_time: 1473ms, lr: 1.1158707e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:04,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.42999 samples/s/p 2:24:46 } +2024-07-25 22:47:06,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 606/ 1625], loss: 1.083, per_step_time: 1470ms, lr: 1.1152764e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:06,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.43954 samples/s/p 2:24:28 } +2024-07-25 22:47:09,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 608/ 1625], loss: 1.287, per_step_time: 1470ms, lr: 1.1146822e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:09,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.7% |███████████████████████████████ | 5.44057 samples/s/p 2:24:23 } +2024-07-25 22:47:12,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 610/ 1625], loss: 1.255, per_step_time: 1472ms, lr: 1.1140879e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:12,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43193 samples/s/p 2:24:34 } +2024-07-25 22:47:15,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 612/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.1134939e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:15,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% 
|███████████████████████████████ | 5.43681 samples/s/p 2:24:23 } +2024-07-25 22:47:18,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 614/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 1.1128999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:18,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43634 samples/s/p 2:24:21 } +2024-07-25 22:47:21,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 616/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.1123058e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:21,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43301 samples/s/p 2:24:24 } +2024-07-25 22:47:24,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 618/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.111712e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:24,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43330 samples/s/p 2:24:20 } +2024-07-25 22:47:27,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 620/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 1.1111185e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:27,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43318 samples/s/p 2:24:17 } +2024-07-25 22:47:30,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 622/ 1625], loss: 1.071, per_step_time: 1470ms, lr: 1.1105246e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:30,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43881 samples/s/p 2:24:06 } +2024-07-25 
22:47:33,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 624/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 1.109931e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:33,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.8% |███████████████████████████████ | 5.43534 samples/s/p 2:24:08 } +2024-07-25 22:47:36,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 626/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 1.1093375e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:36,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43175 samples/s/p 2:24:11 } +2024-07-25 22:47:39,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 628/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.108744e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:39,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43162 samples/s/p 2:24:08 } +2024-07-25 22:47:42,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 630/ 1625], loss: 0.976, per_step_time: 1470ms, lr: 1.1081505e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:42,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.44184 samples/s/p 2:23:49 } +2024-07-25 22:47:45,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 632/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 1.10755755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:45,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43570 samples/s/p 2:23:56 } +2024-07-25 22:47:48,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 634/ 1625], loss: 1.039, per_step_time: 1472ms, lr: 1.1069641e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:48,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43426 samples/s/p 2:23:55 } +2024-07-25 22:47:51,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 636/ 1625], loss: 1.036, per_step_time: 1471ms, lr: 1.1063711e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:51,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43546 samples/s/p 2:23:50 } +2024-07-25 22:47:54,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 638/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.105778e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:54,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43925 samples/s/p 2:23:41 } +2024-07-25 22:47:57,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 640/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 1.10518495e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:47:57,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 63.9% |███████████████████████████████ | 5.43535 samples/s/p 2:23:45 } +2024-07-25 22:48:00,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 642/ 1625], loss: 1.280, per_step_time: 1472ms, lr: 1.1045922e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:00,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.43229 samples/s/p 2:23:46 } +2024-07-25 22:48:03,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 644/ 1625], loss: 1.153, per_step_time: 1482ms, lr: 
1.1039994e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:03,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.39478 samples/s/p 2:24:43 } +2024-07-25 22:48:06,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 646/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 1.1034069e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:06,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.43454 samples/s/p 2:23:37 } +2024-07-25 22:48:08,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 648/ 1625], loss: 1.085, per_step_time: 1469ms, lr: 1.1028141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:08,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |███████████████████████████████ | 5.44440 samples/s/p 2:23:18 } +2024-07-25 22:48:11,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 650/ 1625], loss: 1.193, per_step_time: 1471ms, lr: 1.1022217e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:11,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43711 samples/s/p 2:23:27 } +2024-07-25 22:48:14,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 652/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 1.1016292e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:14,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43244 samples/s/p 2:23:31 } +2024-07-25 22:48:17,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 654/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 1.10103665e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:17,812 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43014 samples/s/p 2:23:32 } +2024-07-25 22:48:20,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 656/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 1.1004445e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:20,761 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43873 samples/s/p 2:23:16 } +2024-07-25 22:48:23,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 658/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.0998522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:23,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.0% |████████████████████████████████ | 5.43256 samples/s/p 2:23:22 } +2024-07-25 22:48:26,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 660/ 1625], loss: 1.096, per_step_time: 1472ms, lr: 1.09926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:26,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43358 samples/s/p 2:23:18 } +2024-07-25 22:48:29,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 662/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 1.098668e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:29,614 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43827 samples/s/p 2:23:08 } +2024-07-25 22:48:32,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 664/ 1625], loss: 1.258, per_step_time: 1472ms, lr: 1.0980762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:32,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% 
|████████████████████████████████ | 5.43399 samples/s/p 2:23:11 } +2024-07-25 22:48:35,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 666/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 1.0974843e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:35,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43360 samples/s/p 2:23:09 } +2024-07-25 22:48:38,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 668/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.0968924e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:38,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43721 samples/s/p 2:23:00 } +2024-07-25 22:48:41,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 670/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 1.0963008e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:41,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.44065 samples/s/p 2:22:52 } +2024-07-25 22:48:44,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 672/ 1625], loss: 1.151, per_step_time: 1473ms, lr: 1.095709e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:44,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.42994 samples/s/p 2:23:06 } +2024-07-25 22:48:47,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 674/ 1625], loss: 1.031, per_step_time: 1472ms, lr: 1.0951174e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:47,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.1% |████████████████████████████████ | 5.43462 samples/s/p 2:22:56 } +2024-07-25 
22:48:50,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 676/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 1.0945262e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:50,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43637 samples/s/p 2:22:50 } +2024-07-25 22:48:53,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 678/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 1.0939346e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:53,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43662 samples/s/p 2:22:47 } +2024-07-25 22:48:56,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 680/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 1.0933434e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:56,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43372 samples/s/p 2:22:48 } +2024-07-25 22:48:59,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 682/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 1.0927522e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:48:59,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.42958 samples/s/p 2:22:52 } +2024-07-25 22:49:02,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 684/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 1.0921609e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:02,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43535 samples/s/p 2:22:40 } +2024-07-25 22:49:05,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 7/ 10], step:[ 686/ 1625], loss: 1.262, per_step_time: 1473ms, lr: 1.0915701e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:05,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43057 samples/s/p 2:22:44 } +2024-07-25 22:49:07,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 688/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.0909791e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:07,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43264 samples/s/p 2:22:38 } +2024-07-25 22:49:10,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 690/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.0903882e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:10,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.2% |████████████████████████████████ | 5.43630 samples/s/p 2:22:29 } +2024-07-25 22:49:13,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 692/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 1.0897974e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:13,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.44013 samples/s/p 2:22:20 } +2024-07-25 22:49:16,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 694/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.08920685e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:16,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43564 samples/s/p 2:22:25 } +2024-07-25 22:49:19,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 696/ 1625], loss: 1.368, per_step_time: 1472ms, lr: 
1.088616e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:19,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43452 samples/s/p 2:22:23 } +2024-07-25 22:49:22,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 698/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 1.0880255e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:22,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43475 samples/s/p 2:22:20 } +2024-07-25 22:49:25,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 700/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 1.0874353e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:25,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43504 samples/s/p 2:22:17 } +2024-07-25 22:49:28,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 702/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 1.086845e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:28,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43294 samples/s/p 2:22:17 } +2024-07-25 22:49:31,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 704/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.0862545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:31,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43459 samples/s/p 2:22:12 } +2024-07-25 22:49:34,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 706/ 1625], loss: 1.132, per_step_time: 1473ms, lr: 1.0856644e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:34,539 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.3% |████████████████████████████████ | 5.43028 samples/s/p 2:22:15 } +2024-07-25 22:49:37,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 708/ 1625], loss: 1.209, per_step_time: 1473ms, lr: 1.0850745e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:37,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.42928 samples/s/p 2:22:14 } +2024-07-25 22:49:40,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 710/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 1.0844842e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:40,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.43786 samples/s/p 2:21:58 } +2024-07-25 22:49:43,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 712/ 1625], loss: 1.160, per_step_time: 1470ms, lr: 1.0838942e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:43,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.43855 samples/s/p 2:21:54 } +2024-07-25 22:49:46,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 714/ 1625], loss: 1.252, per_step_time: 1473ms, lr: 1.0833046e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:46,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.42840 samples/s/p 2:22:07 } +2024-07-25 22:49:49,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 716/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 1.0827147e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:49,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% 
|████████████████████████████████ | 5.43390 samples/s/p 2:21:55 } +2024-07-25 22:49:52,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 718/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 1.0821252e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:52,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.43676 samples/s/p 2:21:48 } +2024-07-25 22:49:55,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 720/ 1625], loss: 1.165, per_step_time: 1469ms, lr: 1.08153545e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:55,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.44406 samples/s/p 2:21:33 } +2024-07-25 22:49:58,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 722/ 1625], loss: 1.249, per_step_time: 1471ms, lr: 1.0809458e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:49:58,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.4% |████████████████████████████████ | 5.43778 samples/s/p 2:21:40 } +2024-07-25 22:50:01,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 724/ 1625], loss: 1.125, per_step_time: 1473ms, lr: 1.0803566e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:01,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43084 samples/s/p 2:21:48 } +2024-07-25 22:50:04,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 726/ 1625], loss: 0.949, per_step_time: 1472ms, lr: 1.0797673e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:04,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43201 samples/s/p 2:21:43 } +2024-07-25 
22:50:06,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 728/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 1.0791779e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:06,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43413 samples/s/p 2:21:37 } +2024-07-25 22:50:09,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 730/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.0785889e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:09,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43833 samples/s/p 2:21:27 } +2024-07-25 22:50:12,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 732/ 1625], loss: 1.101, per_step_time: 1474ms, lr: 1.0779999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:12,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.42556 samples/s/p 2:21:44 } +2024-07-25 22:50:15,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 734/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.0774107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:15,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43949 samples/s/p 2:21:20 } +2024-07-25 22:50:18,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 736/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 1.0768219e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:18,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.43073 samples/s/p 2:21:30 } +2024-07-25 22:50:21,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 7/ 10], step:[ 738/ 1625], loss: 1.001, per_step_time: 1470ms, lr: 1.0762332e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:21,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.5% |████████████████████████████████ | 5.44049 samples/s/p 2:21:12 } +2024-07-25 22:50:24,703 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 740/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.0756443e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:24,704 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43662 samples/s/p 2:21:15 } +2024-07-25 22:50:27,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 742/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 1.0750557e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:27,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.42925 samples/s/p 2:21:24 } +2024-07-25 22:50:30,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 744/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 1.0744673e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:30,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43666 samples/s/p 2:21:09 } +2024-07-25 22:50:33,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 746/ 1625], loss: 1.217, per_step_time: 1473ms, lr: 1.0738787e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:33,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.42908 samples/s/p 2:21:18 } +2024-07-25 22:50:36,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 748/ 1625], loss: 1.258, per_step_time: 1471ms, lr: 
1.0732904e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:36,514 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43553 samples/s/p 2:21:05 } +2024-07-25 22:50:39,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 750/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.0727022e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:39,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43550 samples/s/p 2:21:02 } +2024-07-25 22:50:42,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 752/ 1625], loss: 1.028, per_step_time: 1472ms, lr: 1.0721141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:42,416 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43352 samples/s/p 2:21:03 } +2024-07-25 22:50:45,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 754/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 1.0715258e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:45,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.6% |████████████████████████████████ | 5.43546 samples/s/p 2:20:57 } +2024-07-25 22:50:48,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 756/ 1625], loss: 0.860, per_step_time: 1470ms, lr: 1.0709378e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:48,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.43895 samples/s/p 2:20:48 } +2024-07-25 22:50:51,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 758/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 1.07035e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:51,270 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.42867 samples/s/p 2:21:01 } +2024-07-25 22:50:54,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 760/ 1625], loss: 1.199, per_step_time: 1469ms, lr: 1.069762e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:54,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.44247 samples/s/p 2:20:37 } +2024-07-25 22:50:57,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 762/ 1625], loss: 1.022, per_step_time: 1473ms, lr: 1.0691743e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:50:57,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.42919 samples/s/p 2:20:55 } +2024-07-25 22:51:00,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 764/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 1.0685868e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:00,124 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.43165 samples/s/p 2:20:48 } +2024-07-25 22:51:03,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 766/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 1.067999e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:03,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.43207 samples/s/p 2:20:44 } +2024-07-25 22:51:06,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 768/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 1.0674116e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:06,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% 
|████████████████████████████████ | 5.42949 samples/s/p 2:20:45 } +2024-07-25 22:51:08,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 770/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 1.0668243e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:08,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.7% |████████████████████████████████ | 5.43154 samples/s/p 2:20:39 } +2024-07-25 22:51:11,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 772/ 1625], loss: 1.199, per_step_time: 1471ms, lr: 1.0662368e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:11,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43778 samples/s/p 2:20:26 } +2024-07-25 22:51:14,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 774/ 1625], loss: 1.005, per_step_time: 1472ms, lr: 1.0656497e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:14,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43194 samples/s/p 2:20:33 } +2024-07-25 22:51:17,837 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 776/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 1.0650628e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:17,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43180 samples/s/p 2:20:30 } +2024-07-25 22:51:20,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 778/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.0644755e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:20,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43827 samples/s/p 2:20:17 } +2024-07-25 
22:51:23,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 780/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 1.0638886e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:23,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43054 samples/s/p 2:20:26 } +2024-07-25 22:51:26,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 782/ 1625], loss: 0.979, per_step_time: 1471ms, lr: 1.0633018e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:26,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43499 samples/s/p 2:20:16 } +2024-07-25 22:51:29,644 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 784/ 1625], loss: 1.250, per_step_time: 1473ms, lr: 1.062715e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:29,644 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43105 samples/s/p 2:20:19 } +2024-07-25 22:51:32,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 786/ 1625], loss: 1.246, per_step_time: 1473ms, lr: 1.0621283e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:32,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43047 samples/s/p 2:20:17 } +2024-07-25 22:51:35,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 788/ 1625], loss: 1.092, per_step_time: 1473ms, lr: 1.0615418e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:35,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.8% |████████████████████████████████ | 5.43016 samples/s/p 2:20:15 } +2024-07-25 22:51:38,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 790/ 1625], loss: 1.063, per_step_time: 1472ms, lr: 1.0609552e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:38,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43445 samples/s/p 2:20:05 } +2024-07-25 22:51:41,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 792/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 1.0603689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:41,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43754 samples/s/p 2:19:57 } +2024-07-25 22:51:44,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 794/ 1625], loss: 1.330, per_step_time: 1473ms, lr: 1.0597825e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:44,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43020 samples/s/p 2:20:06 } +2024-07-25 22:51:47,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 796/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.0591963e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:47,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43247 samples/s/p 2:19:59 } +2024-07-25 22:51:50,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 798/ 1625], loss: 1.408, per_step_time: 1472ms, lr: 1.0586102e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:50,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43300 samples/s/p 2:19:56 } +2024-07-25 22:51:53,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 800/ 1625], loss: 0.949, per_step_time: 1471ms, lr: 
1.0580241e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:53,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43687 samples/s/p 2:19:47 } +2024-07-25 22:51:56,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 802/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 1.0574383e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:56,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43322 samples/s/p 2:19:49 } +2024-07-25 22:51:59,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 804/ 1625], loss: 1.417, per_step_time: 1471ms, lr: 1.0568523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:51:59,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 64.9% |████████████████████████████████ | 5.43713 samples/s/p 2:19:40 } +2024-07-25 22:52:02,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 806/ 1625], loss: 1.361, per_step_time: 1473ms, lr: 1.0562667e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:02,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43105 samples/s/p 2:19:47 } +2024-07-25 22:52:05,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 808/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 1.055681e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:05,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43426 samples/s/p 2:19:39 } +2024-07-25 22:52:08,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 810/ 1625], loss: 0.900, per_step_time: 1470ms, lr: 1.05509525e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:08,013 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43909 samples/s/p 2:19:29 } +2024-07-25 22:52:10,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 812/ 1625], loss: 1.251, per_step_time: 1471ms, lr: 1.0545098e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:10,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43589 samples/s/p 2:19:31 } +2024-07-25 22:52:13,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 814/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 1.0539245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:13,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43241 samples/s/p 2:19:33 } +2024-07-25 22:52:16,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 816/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 1.0533389e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:16,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43709 samples/s/p 2:19:23 } +2024-07-25 22:52:19,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 818/ 1625], loss: 1.343, per_step_time: 1472ms, lr: 1.05275385e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:19,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% |████████████████████████████████ | 5.43402 samples/s/p 2:19:25 } +2024-07-25 22:52:22,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 820/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 1.0521689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:22,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.0% 
|████████████████████████████████ | 5.43846 samples/s/p 2:19:15 } +2024-07-25 22:52:25,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 822/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.0515838e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:25,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43436 samples/s/p 2:19:18 } +2024-07-25 22:52:28,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 824/ 1625], loss: 1.286, per_step_time: 1472ms, lr: 1.0509987e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:28,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43425 samples/s/p 2:19:15 } +2024-07-25 22:52:31,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 826/ 1625], loss: 1.294, per_step_time: 1474ms, lr: 1.0504141e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:31,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.42462 samples/s/p 2:19:27 } +2024-07-25 22:52:34,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 828/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 1.0498291e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:34,576 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43272 samples/s/p 2:19:12 } +2024-07-25 22:52:37,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 830/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 1.0492444e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:37,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43520 samples/s/p 2:19:05 } +2024-07-25 
22:52:40,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 832/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.0486599e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:40,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43452 samples/s/p 2:19:03 } +2024-07-25 22:52:43,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 834/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 1.0480753e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:43,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.43634 samples/s/p 2:18:57 } +2024-07-25 22:52:46,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 836/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.04749115e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:46,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.1% |████████████████████████████████ | 5.44079 samples/s/p 2:18:48 } +2024-07-25 22:52:49,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 838/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 1.0469068e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:49,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43489 samples/s/p 2:18:54 } +2024-07-25 22:52:52,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 840/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.04632245e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:52,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43840 samples/s/p 2:18:45 } +2024-07-25 22:52:55,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 7/ 10], step:[ 842/ 1625], loss: 1.301, per_step_time: 1470ms, lr: 1.0457384e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:55,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.44081 samples/s/p 2:18:39 } +2024-07-25 22:52:58,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 844/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 1.0451544e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:52:58,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.44089 samples/s/p 2:18:36 } +2024-07-25 22:53:01,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 846/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 1.0445704e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:01,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43496 samples/s/p 2:18:42 } +2024-07-25 22:53:04,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 848/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 1.0439867e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:04,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43855 samples/s/p 2:18:33 } +2024-07-25 22:53:07,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 850/ 1625], loss: 1.063, per_step_time: 1469ms, lr: 1.043403e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:07,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.44332 samples/s/p 2:18:23 } +2024-07-25 22:53:09,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 852/ 1625], loss: 1.396, per_step_time: 1472ms, lr: 
1.0428194e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:09,971 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.2% |████████████████████████████████ | 5.43162 samples/s/p 2:18:38 } +2024-07-25 22:53:12,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 854/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.0422356e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:12,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43564 samples/s/p 2:18:29 } +2024-07-25 22:53:15,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 856/ 1625], loss: 1.026, per_step_time: 1470ms, lr: 1.0416523e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:15,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43902 samples/s/p 2:18:21 } +2024-07-25 22:53:18,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 858/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 1.0410689e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:18,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43372 samples/s/p 2:18:26 } +2024-07-25 22:53:21,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 860/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 1.0404857e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:21,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43600 samples/s/p 2:18:20 } +2024-07-25 22:53:24,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 862/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 1.0399025e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:24,720 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43938 samples/s/p 2:18:12 } +2024-07-25 22:53:27,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 864/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.0393195e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:27,670 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43764 samples/s/p 2:18:11 } +2024-07-25 22:53:30,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 866/ 1625], loss: 1.066, per_step_time: 1472ms, lr: 1.03873645e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:30,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43138 samples/s/p 2:18:18 } +2024-07-25 22:53:33,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 868/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 1.0381535e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:33,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.3% |████████████████████████████████ | 5.43454 samples/s/p 2:18:10 } +2024-07-25 22:53:36,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 870/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.03757075e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:36,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.43364 samples/s/p 2:18:09 } +2024-07-25 22:53:39,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 872/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 1.036988e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:39,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% 
|████████████████████████████████ | 5.43804 samples/s/p 2:17:59 } +2024-07-25 22:53:42,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 874/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 1.0364055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:42,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.43767 samples/s/p 2:17:57 } +2024-07-25 22:53:45,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 876/ 1625], loss: 1.165, per_step_time: 1469ms, lr: 1.035823e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:45,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.44327 samples/s/p 2:17:45 } +2024-07-25 22:53:48,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 878/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 1.03524035e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:48,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.43722 samples/s/p 2:17:51 } +2024-07-25 22:53:51,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 880/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 1.0346582e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:51,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.44121 samples/s/p 2:17:42 } +2024-07-25 22:53:54,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 882/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 1.0340759e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:54,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.44124 samples/s/p 2:17:39 } +2024-07-25 
22:53:57,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 884/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 1.0334936e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:53:57,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.4% |████████████████████████████████ | 5.43402 samples/s/p 2:17:47 } +2024-07-25 22:54:00,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 886/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 1.0329118e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:00,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43308 samples/s/p 2:17:46 } +2024-07-25 22:54:03,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 888/ 1625], loss: 1.220, per_step_time: 1473ms, lr: 1.03233e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:03,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43052 samples/s/p 2:17:47 } +2024-07-25 22:54:06,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 890/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 1.031748e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:06,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43234 samples/s/p 2:17:41 } +2024-07-25 22:54:08,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 892/ 1625], loss: 0.970, per_step_time: 1472ms, lr: 1.0311662e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:08,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43128 samples/s/p 2:17:40 } +2024-07-25 22:54:11,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 894/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 1.0305846e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:11,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43134 samples/s/p 2:17:37 } +2024-07-25 22:54:14,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 896/ 1625], loss: 1.133, per_step_time: 1469ms, lr: 1.0300029e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:14,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.44248 samples/s/p 2:17:17 } +2024-07-25 22:54:17,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 898/ 1625], loss: 1.080, per_step_time: 1473ms, lr: 1.0294214e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:17,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.43048 samples/s/p 2:17:32 } +2024-07-25 22:54:20,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 900/ 1625], loss: 1.331, per_step_time: 1473ms, lr: 1.0288402e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:20,784 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.5% |████████████████████████████████ | 5.42799 samples/s/p 2:17:33 } +2024-07-25 22:54:23,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 902/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 1.0282591e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:23,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43692 samples/s/p 2:17:17 } +2024-07-25 22:54:26,681 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 904/ 1625], loss: 1.455, per_step_time: 1469ms, lr: 
1.0276777e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:26,681 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.44254 samples/s/p 2:17:05 } +2024-07-25 22:54:29,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 906/ 1625], loss: 1.311, per_step_time: 1471ms, lr: 1.0270966e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:29,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43572 samples/s/p 2:17:12 } +2024-07-25 22:54:32,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 908/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 1.0265158e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:32,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.44036 samples/s/p 2:17:02 } +2024-07-25 22:54:35,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 910/ 1625], loss: 1.239, per_step_time: 1473ms, lr: 1.0259348e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:35,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.42980 samples/s/p 2:17:16 } +2024-07-25 22:54:38,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 912/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 1.025354e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:38,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43558 samples/s/p 2:17:04 } +2024-07-25 22:54:41,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 914/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 1.0247734e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:41,436 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.43209 samples/s/p 2:17:06 } +2024-07-25 22:54:44,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 916/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 1.0241926e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:44,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.44109 samples/s/p 2:16:50 } +2024-07-25 22:54:47,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 918/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 1.0236123e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:47,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.6% |████████████████████████████████ | 5.44214 samples/s/p 2:16:45 } +2024-07-25 22:54:50,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 920/ 1625], loss: 1.292, per_step_time: 1471ms, lr: 1.0230318e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:50,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43483 samples/s/p 2:16:53 } +2024-07-25 22:54:53,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 922/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 1.0224514e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:53,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43920 samples/s/p 2:16:44 } +2024-07-25 22:54:56,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 924/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 1.0218713e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:56,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% 
|████████████████████████████████ | 5.43207 samples/s/p 2:16:51 } +2024-07-25 22:54:59,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 926/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 1.0212912e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:54:59,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43472 samples/s/p 2:16:45 } +2024-07-25 22:55:02,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 928/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.020711e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:02,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43736 samples/s/p 2:16:38 } +2024-07-25 22:55:05,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 930/ 1625], loss: 1.301, per_step_time: 1471ms, lr: 1.0201312e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:05,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43656 samples/s/p 2:16:36 } +2024-07-25 22:55:07,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 932/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 1.0195516e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:07,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.43778 samples/s/p 2:16:31 } +2024-07-25 22:55:10,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 934/ 1625], loss: 1.258, per_step_time: 1475ms, lr: 1.0189717e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:10,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.7% |████████████████████████████████ | 5.42212 samples/s/p 2:16:52 } +2024-07-25 
22:55:13,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 936/ 1625], loss: 1.214, per_step_time: 1473ms, lr: 1.01839205e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:13,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43095 samples/s/p 2:16:35 } +2024-07-25 22:55:16,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 938/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 1.0178127e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:16,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43402 samples/s/p 2:16:28 } +2024-07-25 22:55:19,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 940/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 1.017233e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:19,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43301 samples/s/p 2:16:26 } +2024-07-25 22:55:22,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 942/ 1625], loss: 1.010, per_step_time: 1471ms, lr: 1.0166537e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:22,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43540 samples/s/p 2:16:20 } +2024-07-25 22:55:25,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 944/ 1625], loss: 1.362, per_step_time: 1473ms, lr: 1.0160747e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:25,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.42975 samples/s/p 2:16:26 } +2024-07-25 22:55:28,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 7/ 10], step:[ 946/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 1.0154953e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:28,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43944 samples/s/p 2:16:08 } +2024-07-25 22:55:31,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 948/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 1.0149164e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:31,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43381 samples/s/p 2:16:14 } +2024-07-25 22:55:34,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 950/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 1.0143374e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:34,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.8% |████████████████████████████████ | 5.43805 samples/s/p 2:16:04 } +2024-07-25 22:55:37,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 952/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 1.0137587e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:37,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43518 samples/s/p 2:16:06 } +2024-07-25 22:55:40,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 954/ 1625], loss: 1.328, per_step_time: 1470ms, lr: 1.0131798e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:40,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.44188 samples/s/p 2:15:53 } +2024-07-25 22:55:43,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 956/ 1625], loss: 1.227, per_step_time: 1473ms, lr: 
1.0126013e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:43,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43047 samples/s/p 2:16:07 } +2024-07-25 22:55:46,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 958/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 1.0120229e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:46,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43825 samples/s/p 2:15:52 } +2024-07-25 22:55:49,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 960/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 1.0114442e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:49,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43562 samples/s/p 2:15:53 } +2024-07-25 22:55:52,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 962/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.0108661e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:52,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43353 samples/s/p 2:15:53 } +2024-07-25 22:55:55,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 964/ 1625], loss: 1.234, per_step_time: 1469ms, lr: 1.0102878e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:55,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.44263 samples/s/p 2:15:37 } +2024-07-25 22:55:58,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 966/ 1625], loss: 1.206, per_step_time: 1471ms, lr: 1.0097095e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:55:58,151 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 65.9% |████████████████████████████████ | 5.43571 samples/s/p 2:15:44 } +2024-07-25 22:56:01,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 968/ 1625], loss: 1.263, per_step_time: 1470ms, lr: 1.0091317e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:01,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.44036 samples/s/p 2:15:34 } +2024-07-25 22:56:04,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 970/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 1.0085536e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:04,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.43364 samples/s/p 2:15:41 } +2024-07-25 22:56:07,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 972/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 1.0079756e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:07,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.43318 samples/s/p 2:15:39 } +2024-07-25 22:56:09,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 974/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.0073981e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:09,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |████████████████████████████████ | 5.43762 samples/s/p 2:15:30 } +2024-07-25 22:56:12,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 976/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 1.00682055e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:12,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% 
|█████████████████████████████████ | 5.43485 samples/s/p 2:15:31 } +2024-07-25 22:56:15,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 978/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 1.0062429e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:15,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.43783 samples/s/p 2:15:23 } +2024-07-25 22:56:18,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 980/ 1625], loss: 0.984, per_step_time: 1472ms, lr: 1.0056654e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:18,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.43435 samples/s/p 2:15:26 } +2024-07-25 22:56:21,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 982/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 1.0050881e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:21,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.0% |█████████████████████████████████ | 5.43178 samples/s/p 2:15:26 } +2024-07-25 22:56:24,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 984/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 1.0045107e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:24,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43519 samples/s/p 2:15:18 } +2024-07-25 22:56:27,658 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 986/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.0039336e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:27,658 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43465 samples/s/p 2:15:16 } 
+2024-07-25 22:56:30,609 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 988/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 1.0033567e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:30,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43361 samples/s/p 2:15:15 } +2024-07-25 22:56:33,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 990/ 1625], loss: 1.237, per_step_time: 1473ms, lr: 1.0027797e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:33,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.42858 samples/s/p 2:15:19 } +2024-07-25 22:56:36,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 992/ 1625], loss: 1.053, per_step_time: 1472ms, lr: 1.00220295e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:36,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43125 samples/s/p 2:15:13 } +2024-07-25 22:56:39,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 994/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 1.00162615e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:39,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43060 samples/s/p 2:15:11 } +2024-07-25 22:56:42,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 996/ 1625], loss: 1.059, per_step_time: 1471ms, lr: 1.00104935e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:42,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43729 samples/s/p 2:14:58 } +2024-07-25 22:56:45,369 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 998/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 1.0004731e-05, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:45,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.1% |█████████████████████████████████ | 5.43655 samples/s/p 2:14:56 } +2024-07-25 22:56:48,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1000/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 9.998966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:48,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43782 samples/s/p 2:14:51 } +2024-07-25 22:56:51,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1002/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 9.993204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:51,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43983 samples/s/p 2:14:45 } +2024-07-25 22:56:54,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1004/ 1625], loss: 1.277, per_step_time: 1471ms, lr: 9.9874405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:54,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43780 samples/s/p 2:14:45 } +2024-07-25 22:56:57,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1006/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 9.981681e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:56:57,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43484 samples/s/p 2:14:47 } +2024-07-25 22:57:00,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
7/ 10], step:[ 1008/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 9.975919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:00,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43254 samples/s/p 2:14:47 } +2024-07-25 22:57:03,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1010/ 1625], loss: 1.025, per_step_time: 1472ms, lr: 9.970159e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:03,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43153 samples/s/p 2:14:46 } +2024-07-25 22:57:06,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1012/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 9.964402e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:06,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43997 samples/s/p 2:14:30 } +2024-07-25 22:57:08,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1014/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 9.958644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:08,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.2% |█████████████████████████████████ | 5.43443 samples/s/p 2:14:35 } +2024-07-25 22:57:11,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1016/ 1625], loss: 1.259, per_step_time: 1471ms, lr: 9.952889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:11,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43814 samples/s/p 2:14:27 } +2024-07-25 22:57:14,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1018/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 
9.9471345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:14,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43591 samples/s/p 2:14:27 } +2024-07-25 22:57:17,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1020/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 9.941381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:17,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43632 samples/s/p 2:14:24 } +2024-07-25 22:57:20,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1022/ 1625], loss: 1.217, per_step_time: 1470ms, lr: 9.935626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:20,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43875 samples/s/p 2:14:17 } +2024-07-25 22:57:23,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1024/ 1625], loss: 1.240, per_step_time: 1472ms, lr: 9.929874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:23,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43299 samples/s/p 2:14:23 } +2024-07-25 22:57:26,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1026/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 9.924124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:26,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43370 samples/s/p 2:14:19 } +2024-07-25 22:57:29,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1028/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 9.918373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:57:29,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43324 samples/s/p 2:14:17 } +2024-07-25 22:57:32,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1030/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 9.9126255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:32,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.3% |█████████████████████████████████ | 5.43707 samples/s/p 2:14:08 } +2024-07-25 22:57:35,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1032/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 9.906877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:35,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43087 samples/s/p 2:14:14 } +2024-07-25 22:57:38,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1034/ 1625], loss: 1.413, per_step_time: 1471ms, lr: 9.901129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:38,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43541 samples/s/p 2:14:05 } +2024-07-25 22:57:41,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1036/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 9.895383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:41,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43839 samples/s/p 2:13:57 } +2024-07-25 22:57:44,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1038/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 9.88964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:44,379 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 66.4% |█████████████████████████████████ | 5.43409 samples/s/p 2:14:01 } +2024-07-25 22:57:47,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1040/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 9.883894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:47,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43432 samples/s/p 2:13:57 } +2024-07-25 22:57:50,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1042/ 1625], loss: 1.234, per_step_time: 1471ms, lr: 9.878152e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:50,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43640 samples/s/p 2:13:51 } +2024-07-25 22:57:53,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1044/ 1625], loss: 1.017, per_step_time: 1472ms, lr: 9.872412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:53,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43357 samples/s/p 2:13:53 } +2024-07-25 22:57:56,186 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1046/ 1625], loss: 1.119, per_step_time: 1473ms, lr: 9.866669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:56,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.42793 samples/s/p 2:13:58 } +2024-07-25 22:57:59,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1048/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 9.860931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:57:59,139 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.4% |█████████████████████████████████ | 5.43298 samples/s/p 
2:13:48 } +2024-07-25 22:58:02,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1050/ 1625], loss: 0.856, per_step_time: 1471ms, lr: 9.855194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:02,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43795 samples/s/p 2:13:37 } +2024-07-25 22:58:05,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1052/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 9.849455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:05,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43803 samples/s/p 2:13:34 } +2024-07-25 22:58:07,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1054/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 9.843717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:07,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43230 samples/s/p 2:13:40 } +2024-07-25 22:58:10,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1056/ 1625], loss: 1.144, per_step_time: 1469ms, lr: 9.837982e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:10,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.44438 samples/s/p 2:13:19 } +2024-07-25 22:58:13,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1058/ 1625], loss: 1.321, per_step_time: 1472ms, lr: 9.83225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:13,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43174 samples/s/p 2:13:35 } +2024-07-25 22:58:16,839 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1060/ 1625], loss: 1.350, per_step_time: 1472ms, lr: 9.826515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:16,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43415 samples/s/p 2:13:28 } +2024-07-25 22:58:19,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1062/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 9.820782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:19,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43268 samples/s/p 2:13:27 } +2024-07-25 22:58:22,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1064/ 1625], loss: 1.202, per_step_time: 1472ms, lr: 9.815052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:22,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.5% |█████████████████████████████████ | 5.43235 samples/s/p 2:13:25 } +2024-07-25 22:58:25,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1066/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 9.8093205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:25,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.44078 samples/s/p 2:13:10 } +2024-07-25 22:58:28,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1068/ 1625], loss: 1.151, per_step_time: 1475ms, lr: 9.803592e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:28,648 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.42372 samples/s/p 2:13:32 } +2024-07-25 22:58:31,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
7/ 10], step:[ 1070/ 1625], loss: 1.212, per_step_time: 1473ms, lr: 9.797865e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:31,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43084 samples/s/p 2:13:18 } +2024-07-25 22:58:34,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1072/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 9.792137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:34,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43804 samples/s/p 2:13:05 } +2024-07-25 22:58:37,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1074/ 1625], loss: 1.028, per_step_time: 1471ms, lr: 9.786411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:37,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43708 samples/s/p 2:13:03 } +2024-07-25 22:58:40,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1076/ 1625], loss: 1.238, per_step_time: 1476ms, lr: 9.780687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:40,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.41882 samples/s/p 2:13:27 } +2024-07-25 22:58:43,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1078/ 1625], loss: 0.977, per_step_time: 1471ms, lr: 9.774961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:43,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43664 samples/s/p 2:12:58 } +2024-07-25 22:58:46,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1080/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 
9.769238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:46,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.6% |█████████████████████████████████ | 5.43707 samples/s/p 2:12:54 } +2024-07-25 22:58:49,310 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1082/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 9.7635175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:49,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.43529 samples/s/p 2:12:54 } +2024-07-25 22:58:52,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1084/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 9.757795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:52,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.43687 samples/s/p 2:12:49 } +2024-07-25 22:58:55,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1086/ 1625], loss: 1.128, per_step_time: 1470ms, lr: 9.752076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:55,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.43962 samples/s/p 2:12:42 } +2024-07-25 22:58:58,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1088/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 9.74636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:58:58,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.44027 samples/s/p 2:12:38 } +2024-07-25 22:59:01,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1090/ 1625], loss: 1.035, per_step_time: 1470ms, lr: 9.74064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
22:59:01,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.44040 samples/s/p 2:12:35 } +2024-07-25 22:59:04,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1092/ 1625], loss: 0.914, per_step_time: 1470ms, lr: 9.734924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:04,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.44142 samples/s/p 2:12:30 } +2024-07-25 22:59:07,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1094/ 1625], loss: 1.004, per_step_time: 1471ms, lr: 9.72921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:07,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.43642 samples/s/p 2:12:35 } +2024-07-25 22:59:09,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1096/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 9.723492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:09,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.7% |█████████████████████████████████ | 5.43495 samples/s/p 2:12:34 } +2024-07-25 22:59:12,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1098/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 9.71778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:12,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.43087 samples/s/p 2:12:37 } +2024-07-25 22:59:15,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1100/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 9.712069e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:15,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 66.8% |█████████████████████████████████ | 5.43449 samples/s/p 2:12:29 } +2024-07-25 22:59:18,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1102/ 1625], loss: 1.088, per_step_time: 1473ms, lr: 9.706359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:18,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.43008 samples/s/p 2:12:32 } +2024-07-25 22:59:21,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1104/ 1625], loss: 1.245, per_step_time: 1474ms, lr: 9.700648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:21,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.42583 samples/s/p 2:12:36 } +2024-07-25 22:59:24,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1106/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 9.694939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:24,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.42931 samples/s/p 2:12:27 } +2024-07-25 22:59:27,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1108/ 1625], loss: 1.100, per_step_time: 1475ms, lr: 9.689233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:27,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.42253 samples/s/p 2:12:34 } +2024-07-25 22:59:30,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1110/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 9.683524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:30,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.43326 samples/s/p 2:12:16 } 
+2024-07-25 22:59:33,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1112/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 9.677818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:33,581 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.8% |█████████████████████████████████ | 5.43478 samples/s/p 2:12:11 } +2024-07-25 22:59:36,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1114/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 9.672114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:36,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43702 samples/s/p 2:12:04 } +2024-07-25 22:59:39,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1116/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 9.66641e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:39,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43684 samples/s/p 2:12:02 } +2024-07-25 22:59:42,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1118/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 9.660708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:42,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43528 samples/s/p 2:12:01 } +2024-07-25 22:59:45,380 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1120/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 9.655007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:45,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43747 samples/s/p 2:11:55 } +2024-07-25 22:59:48,331 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1122/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 9.649304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:48,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43534 samples/s/p 2:11:55 } +2024-07-25 22:59:51,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1124/ 1625], loss: 1.076, per_step_time: 1470ms, lr: 9.643607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:51,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.43888 samples/s/p 2:11:47 } +2024-07-25 22:59:54,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1126/ 1625], loss: 1.224, per_step_time: 1473ms, lr: 9.637908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:54,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.42814 samples/s/p 2:12:00 } +2024-07-25 22:59:57,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1128/ 1625], loss: 1.062, per_step_time: 1474ms, lr: 9.632209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 22:59:57,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 66.9% |█████████████████████████████████ | 5.42693 samples/s/p 2:11:59 } +2024-07-25 23:00:00,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1130/ 1625], loss: 1.277, per_step_time: 1473ms, lr: 9.626515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:00,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43038 samples/s/p 2:11:51 } +2024-07-25 23:00:03,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
7/ 10], step:[ 1132/ 1625], loss: 1.204, per_step_time: 1470ms, lr: 9.620821e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:03,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43967 samples/s/p 2:11:34 } +2024-07-25 23:00:06,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1134/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 9.615126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:06,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43195 samples/s/p 2:11:42 } +2024-07-25 23:00:08,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1136/ 1625], loss: 1.150, per_step_time: 1474ms, lr: 9.609432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:08,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.42723 samples/s/p 2:11:46 } +2024-07-25 23:00:11,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1138/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 9.603742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:11,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43683 samples/s/p 2:11:29 } +2024-07-25 23:00:14,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1140/ 1625], loss: 0.999, per_step_time: 1471ms, lr: 9.5980495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:14,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43787 samples/s/p 2:11:25 } +2024-07-25 23:00:17,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1142/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 
9.592361e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:17,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43542 samples/s/p 2:11:26 } +2024-07-25 23:00:20,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1144/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 9.586673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:20,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.0% |█████████████████████████████████ | 5.43148 samples/s/p 2:11:28 } +2024-07-25 23:00:23,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1146/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 9.580984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:23,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.42943 samples/s/p 2:11:28 } +2024-07-25 23:00:26,704 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1148/ 1625], loss: 1.032, per_step_time: 1471ms, lr: 9.5752985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:26,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.43806 samples/s/p 2:11:13 } +2024-07-25 23:00:29,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1150/ 1625], loss: 1.355, per_step_time: 1470ms, lr: 9.569613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:29,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.43890 samples/s/p 2:11:09 } +2024-07-25 23:00:32,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1152/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 9.563931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:00:32,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.42987 samples/s/p 2:11:19 } +2024-07-25 23:00:35,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1154/ 1625], loss: 1.064, per_step_time: 1469ms, lr: 9.558246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:35,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.44325 samples/s/p 2:10:57 } +2024-07-25 23:00:38,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1156/ 1625], loss: 0.959, per_step_time: 1473ms, lr: 9.552564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:38,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.42976 samples/s/p 2:11:13 } +2024-07-25 23:00:41,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1158/ 1625], loss: 1.231, per_step_time: 1472ms, lr: 9.546885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:41,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.43153 samples/s/p 2:11:08 } +2024-07-25 23:00:44,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1160/ 1625], loss: 1.109, per_step_time: 1473ms, lr: 9.541203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:44,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.1% |█████████████████████████████████ | 5.42977 samples/s/p 2:11:07 } +2024-07-25 23:00:47,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1162/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 9.535527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:47,364 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 67.2% |█████████████████████████████████ | 5.43736 samples/s/p 2:10:53 } +2024-07-25 23:00:50,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1164/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 9.529848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:50,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43392 samples/s/p 2:10:55 } +2024-07-25 23:00:53,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1166/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 9.52417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:53,268 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43123 samples/s/p 2:10:56 } +2024-07-25 23:00:56,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1168/ 1625], loss: 1.204, per_step_time: 1473ms, lr: 9.518497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:56,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.42854 samples/s/p 2:10:57 } +2024-07-25 23:00:59,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1170/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 9.5128225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:00:59,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.44171 samples/s/p 2:10:35 } +2024-07-25 23:01:02,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1172/ 1625], loss: 1.204, per_step_time: 1470ms, lr: 9.507149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:02,119 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43870 samples/s/p 
2:10:37 } +2024-07-25 23:01:05,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1174/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 9.5014775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:05,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43547 samples/s/p 2:10:38 } +2024-07-25 23:01:08,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1176/ 1625], loss: 0.935, per_step_time: 1468ms, lr: 9.495808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:08,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.44600 samples/s/p 2:10:20 } +2024-07-25 23:01:10,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1178/ 1625], loss: 1.361, per_step_time: 1472ms, lr: 9.490135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:10,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.2% |█████████████████████████████████ | 5.43392 samples/s/p 2:10:35 } +2024-07-25 23:01:13,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1180/ 1625], loss: 1.244, per_step_time: 1471ms, lr: 9.484467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:13,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43607 samples/s/p 2:10:29 } +2024-07-25 23:01:16,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1182/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 9.478801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:16,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43515 samples/s/p 2:10:27 } +2024-07-25 23:01:19,821 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1184/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 9.473134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:19,821 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.42965 samples/s/p 2:10:32 } +2024-07-25 23:01:22,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1186/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 9.46747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:22,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43534 samples/s/p 2:10:21 } +2024-07-25 23:01:25,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1188/ 1625], loss: 1.081, per_step_time: 1470ms, lr: 9.461806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:25,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43931 samples/s/p 2:10:12 } +2024-07-25 23:01:28,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1190/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 9.45614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:28,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.43202 samples/s/p 2:10:20 } +2024-07-25 23:01:31,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1192/ 1625], loss: 1.165, per_step_time: 1475ms, lr: 9.450478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:31,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.42338 samples/s/p 2:10:29 } +2024-07-25 23:01:34,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 
10], step:[ 1194/ 1625], loss: 1.241, per_step_time: 1473ms, lr: 9.4448205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:34,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.3% |█████████████████████████████████ | 5.42797 samples/s/p 2:10:20 } +2024-07-25 23:01:37,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1196/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 9.439157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:37,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43701 samples/s/p 2:10:04 } +2024-07-25 23:01:40,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1198/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 9.433498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:40,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43498 samples/s/p 2:10:04 } +2024-07-25 23:01:43,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1200/ 1625], loss: 1.250, per_step_time: 1475ms, lr: 9.427843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:43,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.42266 samples/s/p 2:10:19 } +2024-07-25 23:01:46,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1202/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 9.422187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:46,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43430 samples/s/p 2:09:59 } +2024-07-25 23:01:49,343 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1204/ 1625], loss: 1.308, per_step_time: 1471ms, lr: 
9.416531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:49,344 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43699 samples/s/p 2:09:52 } +2024-07-25 23:01:52,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1206/ 1625], loss: 1.291, per_step_time: 1473ms, lr: 9.410877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:52,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.42846 samples/s/p 2:10:01 } +2024-07-25 23:01:55,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1208/ 1625], loss: 0.939, per_step_time: 1472ms, lr: 9.405225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:55,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43321 samples/s/p 2:09:52 } +2024-07-25 23:01:58,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1210/ 1625], loss: 0.981, per_step_time: 1471ms, lr: 9.399572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:01:58,200 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.4% |█████████████████████████████████ | 5.43562 samples/s/p 2:09:45 } +2024-07-25 23:02:01,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1212/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 9.393922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:01,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43380 samples/s/p 2:09:45 } +2024-07-25 23:02:04,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1214/ 1625], loss: 1.097, per_step_time: 1470ms, lr: 9.388271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:02:04,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.44172 samples/s/p 2:09:31 } +2024-07-25 23:02:07,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1216/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 9.382622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:07,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43447 samples/s/p 2:09:38 } +2024-07-25 23:02:09,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1218/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 9.376975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:09,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.44152 samples/s/p 2:09:25 } +2024-07-25 23:02:12,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1220/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 9.371329e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:12,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43809 samples/s/p 2:09:27 } +2024-07-25 23:02:15,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1222/ 1625], loss: 1.106, per_step_time: 1470ms, lr: 9.365684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:15,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43911 samples/s/p 2:09:23 } +2024-07-25 23:02:18,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1224/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 9.36004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:18,845 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 67.5% |█████████████████████████████████ | 5.43618 samples/s/p 2:09:24 } +2024-07-25 23:02:21,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1226/ 1625], loss: 0.925, per_step_time: 1471ms, lr: 9.354397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:21,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.5% |█████████████████████████████████ | 5.43776 samples/s/p 2:09:19 } +2024-07-25 23:02:24,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1228/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 9.348755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:24,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43964 samples/s/p 2:09:13 } +2024-07-25 23:02:27,689 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1230/ 1625], loss: 0.979, per_step_time: 1469ms, lr: 9.3431145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:27,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.44285 samples/s/p 2:09:05 } +2024-07-25 23:02:30,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1232/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 9.337477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:30,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43965 samples/s/p 2:09:07 } +2024-07-25 23:02:33,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1234/ 1625], loss: 1.056, per_step_time: 1472ms, lr: 9.331837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:33,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43284 samples/s/p 
2:09:14 } +2024-07-25 23:02:36,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1236/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 9.326199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:36,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43233 samples/s/p 2:09:12 } +2024-07-25 23:02:39,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1238/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 9.320565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:39,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43144 samples/s/p 2:09:10 } +2024-07-25 23:02:42,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1240/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 9.314927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:42,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43553 samples/s/p 2:09:01 } +2024-07-25 23:02:45,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1242/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 9.309294e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:45,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.6% |█████████████████████████████████ | 5.43156 samples/s/p 2:09:04 } +2024-07-25 23:02:48,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1244/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 9.303664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:48,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43637 samples/s/p 2:08:54 } +2024-07-25 23:02:51,301 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1246/ 1625], loss: 1.291, per_step_time: 1472ms, lr: 9.29803e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:51,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43320 samples/s/p 2:08:56 } +2024-07-25 23:02:54,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1248/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 9.292402e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:54,251 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43767 samples/s/p 2:08:46 } +2024-07-25 23:02:57,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1250/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 9.286772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:02:57,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43585 samples/s/p 2:08:46 } +2024-07-25 23:03:00,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1252/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 9.281144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:00,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43056 samples/s/p 2:08:51 } +2024-07-25 23:03:03,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1254/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 9.275517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:03,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.43871 samples/s/p 2:08:36 } +2024-07-25 23:03:06,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
7/ 10], step:[ 1256/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 9.269891e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:06,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.44030 samples/s/p 2:08:31 } +2024-07-25 23:03:09,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1258/ 1625], loss: 1.270, per_step_time: 1473ms, lr: 9.264267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:09,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.7% |█████████████████████████████████ | 5.42920 samples/s/p 2:08:44 } +2024-07-25 23:03:11,953 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1260/ 1625], loss: 1.134, per_step_time: 1470ms, lr: 9.258643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:11,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43908 samples/s/p 2:08:27 } +2024-07-25 23:03:14,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1262/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 9.25302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:14,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43154 samples/s/p 2:08:34 } +2024-07-25 23:03:17,855 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1264/ 1625], loss: 1.306, per_step_time: 1470ms, lr: 9.247399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:17,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43884 samples/s/p 2:08:21 } +2024-07-25 23:03:20,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1266/ 1625], loss: 1.116, per_step_time: 1470ms, lr: 
9.2417795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:20,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43989 samples/s/p 2:08:17 } +2024-07-25 23:03:23,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1268/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 9.236161e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:23,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43456 samples/s/p 2:08:21 } +2024-07-25 23:03:26,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1270/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 9.230546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:26,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43397 samples/s/p 2:08:19 } +2024-07-25 23:03:29,654 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1272/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 9.2249265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:29,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43814 samples/s/p 2:08:10 } +2024-07-25 23:03:32,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1274/ 1625], loss: 1.331, per_step_time: 1471ms, lr: 9.21931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:32,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.8% |█████████████████████████████████ | 5.43827 samples/s/p 2:08:07 } +2024-07-25 23:03:35,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1276/ 1625], loss: 1.114, per_step_time: 1473ms, lr: 9.2137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:03:35,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.42778 samples/s/p 2:08:19 } +2024-07-25 23:03:38,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1278/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 9.208084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:38,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43478 samples/s/p 2:08:06 } +2024-07-25 23:03:41,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1280/ 1625], loss: 1.120, per_step_time: 1470ms, lr: 9.202471e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:41,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43965 samples/s/p 2:07:56 } +2024-07-25 23:03:44,408 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1282/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 9.196864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:44,409 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43397 samples/s/p 2:08:02 } +2024-07-25 23:03:47,359 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1284/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 9.191251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:47,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43494 samples/s/p 2:07:57 } +2024-07-25 23:03:50,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1286/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 9.1856455e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:50,311 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 67.9% |█████████████████████████████████ | 5.43375 samples/s/p 2:07:56 } +2024-07-25 23:03:53,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1288/ 1625], loss: 1.146, per_step_time: 1475ms, lr: 9.180038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:53,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.42191 samples/s/p 2:08:10 } +2024-07-25 23:03:56,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1290/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 9.174429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:56,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 67.9% |█████████████████████████████████ | 5.43149 samples/s/p 2:07:53 } +2024-07-25 23:03:59,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1292/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 9.168827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:03:59,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.43215 samples/s/p 2:07:49 } +2024-07-25 23:04:02,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1294/ 1625], loss: 1.087, per_step_time: 1473ms, lr: 9.163223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:02,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.42974 samples/s/p 2:07:50 } +2024-07-25 23:04:05,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1296/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 9.157618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:05,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.43604 samples/s/p 
2:07:38 } +2024-07-25 23:04:08,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1298/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 9.152019e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:08,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |█████████████████████████████████ | 5.43817 samples/s/p 2:07:32 } +2024-07-25 23:04:10,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1300/ 1625], loss: 1.401, per_step_time: 1470ms, lr: 9.146418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:10,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43948 samples/s/p 2:07:27 } +2024-07-25 23:04:13,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1302/ 1625], loss: 1.007, per_step_time: 1472ms, lr: 9.140819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:13,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43395 samples/s/p 2:07:32 } +2024-07-25 23:04:16,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1304/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 9.13522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:16,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43574 samples/s/p 2:07:27 } +2024-07-25 23:04:19,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1306/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 9.129623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:19,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43378 samples/s/p 2:07:26 } +2024-07-25 23:04:22,783 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1308/ 1625], loss: 0.967, per_step_time: 1472ms, lr: 9.124028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:22,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.0% |██████████████████████████████████ | 5.43216 samples/s/p 2:07:26 } +2024-07-25 23:04:25,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1310/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 9.118434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:25,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43990 samples/s/p 2:07:12 } +2024-07-25 23:04:28,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1312/ 1625], loss: 1.311, per_step_time: 1472ms, lr: 9.112841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:28,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43374 samples/s/p 2:07:18 } +2024-07-25 23:04:31,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1314/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 9.107252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:31,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43691 samples/s/p 2:07:10 } +2024-07-25 23:04:34,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1316/ 1625], loss: 1.073, per_step_time: 1472ms, lr: 9.101657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:34,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43321 samples/s/p 2:07:13 } +2024-07-25 23:04:37,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 1318/ 1625], loss: 1.202, per_step_time: 1470ms, lr: 9.0960675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:37,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43869 samples/s/p 2:07:02 } +2024-07-25 23:04:40,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1320/ 1625], loss: 1.109, per_step_time: 1474ms, lr: 9.090482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:40,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.42472 samples/s/p 2:07:19 } +2024-07-25 23:04:43,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1322/ 1625], loss: 1.106, per_step_time: 1472ms, lr: 9.084893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:43,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43426 samples/s/p 2:07:02 } +2024-07-25 23:04:46,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1324/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 9.079306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:46,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.1% |██████████████████████████████████ | 5.43185 samples/s/p 2:07:03 } +2024-07-25 23:04:49,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1326/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 9.073725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:49,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43533 samples/s/p 2:06:55 } +2024-07-25 23:04:52,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1328/ 1625], loss: 1.125, per_step_time: 
1472ms, lr: 9.068137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:52,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43229 samples/s/p 2:06:56 } +2024-07-25 23:04:55,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1330/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 9.062558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:55,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43539 samples/s/p 2:06:49 } +2024-07-25 23:04:58,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1332/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 9.056976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:04:58,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.44091 samples/s/p 2:06:38 } +2024-07-25 23:05:01,145 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1334/ 1625], loss: 1.368, per_step_time: 1472ms, lr: 9.051393e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:01,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43466 samples/s/p 2:06:44 } +2024-07-25 23:05:04,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1336/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 9.045816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:04,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43752 samples/s/p 2:06:37 } +2024-07-25 23:05:07,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1338/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 9.040239e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:05:07,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43099 samples/s/p 2:06:43 } +2024-07-25 23:05:09,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1340/ 1625], loss: 0.975, per_step_time: 1471ms, lr: 9.034659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:10,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.2% |██████████████████████████████████ | 5.43512 samples/s/p 2:06:35 } +2024-07-25 23:05:12,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1342/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 9.029087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:12,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43552 samples/s/p 2:06:31 } +2024-07-25 23:05:15,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1344/ 1625], loss: 1.305, per_step_time: 1472ms, lr: 9.023513e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:15,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43236 samples/s/p 2:06:33 } +2024-07-25 23:05:18,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1346/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 9.017939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:18,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.44102 samples/s/p 2:06:17 } +2024-07-25 23:05:21,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1348/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 9.012367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:21,801 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43562 samples/s/p 2:06:22 } +2024-07-25 23:05:24,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1350/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 9.006797e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:24,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.43713 samples/s/p 2:06:17 } +2024-07-25 23:05:27,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1352/ 1625], loss: 1.252, per_step_time: 1470ms, lr: 9.001227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:27,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.44029 samples/s/p 2:06:10 } +2024-07-25 23:05:30,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1354/ 1625], loss: 1.218, per_step_time: 1474ms, lr: 8.995658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:30,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.42741 samples/s/p 2:06:25 } +2024-07-25 23:05:33,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1356/ 1625], loss: 1.074, per_step_time: 1474ms, lr: 8.990091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:33,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.3% |██████████████████████████████████ | 5.42516 samples/s/p 2:06:25 } +2024-07-25 23:05:36,562 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1358/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 8.984529e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:36,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% 
|██████████████████████████████████ | 5.43233 samples/s/p 2:06:12 } +2024-07-25 23:05:39,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1360/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 8.978961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:39,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.44088 samples/s/p 2:05:57 } +2024-07-25 23:05:42,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1362/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 8.973397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:42,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.43791 samples/s/p 2:05:58 } +2024-07-25 23:05:45,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1364/ 1625], loss: 0.968, per_step_time: 1473ms, lr: 8.967838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:45,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.42751 samples/s/p 2:06:10 } +2024-07-25 23:05:48,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1366/ 1625], loss: 1.122, per_step_time: 1473ms, lr: 8.962274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:48,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.42962 samples/s/p 2:06:04 } +2024-07-25 23:05:51,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1368/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 8.956715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:51,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.43690 samples/s/p 2:05:51 } 
+2024-07-25 23:05:54,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1370/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 8.951159e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:54,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.43797 samples/s/p 2:05:46 } +2024-07-25 23:05:57,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1372/ 1625], loss: 1.034, per_step_time: 1468ms, lr: 8.945599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:05:57,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.4% |██████████████████████████████████ | 5.44735 samples/s/p 2:05:31 } +2024-07-25 23:06:00,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1374/ 1625], loss: 0.906, per_step_time: 1471ms, lr: 8.940045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:00,161 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43725 samples/s/p 2:05:42 } +2024-07-25 23:06:03,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1376/ 1625], loss: 1.126, per_step_time: 1471ms, lr: 8.93449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:03,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43694 samples/s/p 2:05:39 } +2024-07-25 23:06:06,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1378/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 8.928933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:06,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43073 samples/s/p 2:05:45 } +2024-07-25 23:06:09,017 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1380/ 1625], loss: 1.162, per_step_time: 1473ms, lr: 8.923384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:09,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43066 samples/s/p 2:05:42 } +2024-07-25 23:06:11,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1382/ 1625], loss: 1.143, per_step_time: 1474ms, lr: 8.917832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:11,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.42627 samples/s/p 2:05:45 } +2024-07-25 23:06:14,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1384/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 8.912279e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:14,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43174 samples/s/p 2:05:34 } +2024-07-25 23:06:17,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1386/ 1625], loss: 1.258, per_step_time: 1473ms, lr: 8.906733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:17,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.42985 samples/s/p 2:05:34 } +2024-07-25 23:06:20,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1388/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 8.9011855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:20,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.5% |██████████████████████████████████ | 5.43794 samples/s/p 2:05:20 } +2024-07-25 23:06:23,776 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 1390/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 8.8956385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:23,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43898 samples/s/p 2:05:16 } +2024-07-25 23:06:26,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1392/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 8.890093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:26,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43706 samples/s/p 2:05:15 } +2024-07-25 23:06:29,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1394/ 1625], loss: 1.212, per_step_time: 1472ms, lr: 8.884548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:29,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43416 samples/s/p 2:05:16 } +2024-07-25 23:06:32,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1396/ 1625], loss: 1.116, per_step_time: 1471ms, lr: 8.879007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:32,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43574 samples/s/p 2:05:11 } +2024-07-25 23:06:35,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1398/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 8.873465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:35,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.42836 samples/s/p 2:05:19 } +2024-07-25 23:06:38,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1400/ 1625], loss: 1.202, per_step_time: 
1470ms, lr: 8.8679235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:38,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.44046 samples/s/p 2:04:59 } +2024-07-25 23:06:41,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1402/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 8.862388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:41,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.42851 samples/s/p 2:05:12 } +2024-07-25 23:06:44,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1404/ 1625], loss: 1.314, per_step_time: 1472ms, lr: 8.856847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:44,437 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.6% |██████████████████████████████████ | 5.43146 samples/s/p 2:05:05 } +2024-07-25 23:06:47,385 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1406/ 1625], loss: 0.921, per_step_time: 1470ms, lr: 8.851311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:47,385 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.43985 samples/s/p 2:04:51 } +2024-07-25 23:06:50,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1408/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 8.845777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:50,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.43964 samples/s/p 2:04:48 } +2024-07-25 23:06:53,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1410/ 1625], loss: 1.035, per_step_time: 1473ms, lr: 8.840241e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:06:53,289 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.42791 samples/s/p 2:05:01 } +2024-07-25 23:06:56,237 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1412/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 8.834708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:56,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.43842 samples/s/p 2:04:44 } +2024-07-25 23:06:59,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1414/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 8.829178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:06:59,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.42871 samples/s/p 2:04:54 } +2024-07-25 23:07:02,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1416/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 8.823646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:02,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.43711 samples/s/p 2:04:40 } +2024-07-25 23:07:05,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1418/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 8.81812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:05,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.43742 samples/s/p 2:04:37 } +2024-07-25 23:07:08,038 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1420/ 1625], loss: 1.044, per_step_time: 1470ms, lr: 8.81259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:08,039 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.7% |██████████████████████████████████ | 5.44050 samples/s/p 2:04:29 } +2024-07-25 23:07:10,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1422/ 1625], loss: 1.141, per_step_time: 1469ms, lr: 8.80706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:10,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.44224 samples/s/p 2:04:24 } +2024-07-25 23:07:13,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1424/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 8.801538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:13,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43353 samples/s/p 2:04:33 } +2024-07-25 23:07:16,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1426/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 8.796013e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:16,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.44152 samples/s/p 2:04:19 } +2024-07-25 23:07:19,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1428/ 1625], loss: 1.168, per_step_time: 1470ms, lr: 8.79049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:19,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43964 samples/s/p 2:04:19 } +2024-07-25 23:07:22,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1430/ 1625], loss: 1.459, per_step_time: 1470ms, lr: 8.7849685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:22,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% 
|██████████████████████████████████ | 5.43941 samples/s/p 2:04:16 } +2024-07-25 23:07:25,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1432/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 8.779447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:25,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43772 samples/s/p 2:04:16 } +2024-07-25 23:07:28,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1434/ 1625], loss: 1.256, per_step_time: 1473ms, lr: 8.773927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:28,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.42996 samples/s/p 2:04:23 } +2024-07-25 23:07:31,638 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1436/ 1625], loss: 1.156, per_step_time: 1473ms, lr: 8.76841e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:31,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43010 samples/s/p 2:04:20 } +2024-07-25 23:07:34,590 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1438/ 1625], loss: 1.058, per_step_time: 1471ms, lr: 8.762892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:34,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.8% |██████████████████████████████████ | 5.43502 samples/s/p 2:04:10 } +2024-07-25 23:07:37,541 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1440/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 8.757377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:37,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43387 samples/s/p 2:04:09 } 
+2024-07-25 23:07:40,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1442/ 1625], loss: 1.114, per_step_time: 1473ms, lr: 8.751863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:40,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43098 samples/s/p 2:04:10 } +2024-07-25 23:07:43,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1444/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 8.746349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:43,446 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43317 samples/s/p 2:04:04 } +2024-07-25 23:07:46,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1446/ 1625], loss: 1.224, per_step_time: 1471ms, lr: 8.740837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:46,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43711 samples/s/p 2:03:56 } +2024-07-25 23:07:49,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1448/ 1625], loss: 1.171, per_step_time: 1473ms, lr: 8.7353255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:49,349 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43051 samples/s/p 2:04:02 } +2024-07-25 23:07:52,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1450/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 8.729817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:07:52,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43671 samples/s/p 2:03:50 } +2024-07-25 23:07:52,300 - 
mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-25 23:08:28,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1452/ 1625], loss: 1.025, per_step_time: 1838ms, lr: 8.724312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:28,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 4.35254 samples/s/p 2:34:38 } +2024-07-25 23:08:31,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1454/ 1625], loss: 1.010, per_step_time: 1472ms, lr: 8.718801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:31,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 68.9% |██████████████████████████████████ | 5.43242 samples/s/p 2:03:50 } +2024-07-25 23:08:34,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1456/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 8.713299e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:34,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.42792 samples/s/p 2:03:54 } +2024-07-25 23:08:37,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1458/ 1625], loss: 1.152, per_step_time: 1470ms, lr: 8.707794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:37,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.44151 samples/s/p 2:03:32 } +2024-07-25 23:08:40,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1460/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 8.702288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:40,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.44022 
samples/s/p 2:03:31 } +2024-07-25 23:08:43,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1462/ 1625], loss: 0.991, per_step_time: 1471ms, lr: 8.696789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:43,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.43755 samples/s/p 2:03:32 } +2024-07-25 23:08:46,497 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1464/ 1625], loss: 1.277, per_step_time: 1478ms, lr: 8.691288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:46,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.41205 samples/s/p 2:04:04 } +2024-07-25 23:08:49,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1466/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 8.685786e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:49,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.43301 samples/s/p 2:03:32 } +2024-07-25 23:08:52,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1468/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 8.680291e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:52,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.43580 samples/s/p 2:03:25 } +2024-07-25 23:08:55,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1470/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 8.674794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:55,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.0% |██████████████████████████████████ | 5.43593 samples/s/p 2:03:22 } +2024-07-25 23:08:58,300 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1472/ 1625], loss: 1.291, per_step_time: 1471ms, lr: 8.669298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:08:58,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43558 samples/s/p 2:03:20 } +2024-07-25 23:09:01,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1474/ 1625], loss: 1.186, per_step_time: 1473ms, lr: 8.663804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:01,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.42883 samples/s/p 2:03:26 } +2024-07-25 23:09:04,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1476/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 8.658311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:04,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43386 samples/s/p 2:03:16 } +2024-07-25 23:09:07,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1478/ 1625], loss: 1.037, per_step_time: 1472ms, lr: 8.652818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:07,158 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43350 samples/s/p 2:03:14 } +2024-07-25 23:09:10,113 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1480/ 1625], loss: 1.177, per_step_time: 1474ms, lr: 8.647328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:10,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.42684 samples/s/p 2:03:20 } +2024-07-25 23:09:13,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 1482/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 8.641839e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:13,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.42807 samples/s/p 2:03:15 } +2024-07-25 23:09:16,019 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1484/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 8.63635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:16,020 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43257 samples/s/p 2:03:06 } +2024-07-25 23:09:18,969 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1486/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 8.630864e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:18,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.1% |██████████████████████████████████ | 5.43614 samples/s/p 2:02:58 } +2024-07-25 23:09:21,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1488/ 1625], loss: 0.997, per_step_time: 1471ms, lr: 8.625377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:21,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43570 samples/s/p 2:02:56 } +2024-07-25 23:09:24,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1490/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 8.619893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:24,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43067 samples/s/p 2:03:00 } +2024-07-25 23:09:27,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1492/ 1625], loss: 1.212, per_step_time: 
1470ms, lr: 8.614409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:27,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43851 samples/s/p 2:02:46 } +2024-07-25 23:09:30,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1494/ 1625], loss: 0.945, per_step_time: 1474ms, lr: 8.6089285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:30,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.42485 samples/s/p 2:03:02 } +2024-07-25 23:09:33,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1496/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 8.603447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:33,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43615 samples/s/p 2:02:44 } +2024-07-25 23:09:36,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1498/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 8.597967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:36,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43469 samples/s/p 2:02:43 } +2024-07-25 23:09:39,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1500/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 8.592493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:39,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.44033 samples/s/p 2:02:32 } +2024-07-25 23:09:42,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1502/ 1625], loss: 1.362, per_step_time: 1472ms, lr: 8.587017e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:09:42,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.2% |██████████████████████████████████ | 5.43478 samples/s/p 2:02:37 } +2024-07-25 23:09:45,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1504/ 1625], loss: 1.001, per_step_time: 1471ms, lr: 8.581538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:45,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.43839 samples/s/p 2:02:29 } +2024-07-25 23:09:48,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1506/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 8.576068e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:48,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.43574 samples/s/p 2:02:29 } +2024-07-25 23:09:51,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1508/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 8.570594e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:51,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.43022 samples/s/p 2:02:34 } +2024-07-25 23:09:54,387 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1510/ 1625], loss: 1.236, per_step_time: 1474ms, lr: 8.565119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:54,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.42681 samples/s/p 2:02:36 } +2024-07-25 23:09:57,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1512/ 1625], loss: 1.259, per_step_time: 1473ms, lr: 8.559652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:09:57,342 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.42828 samples/s/p 2:02:31 } +2024-07-25 23:10:00,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1514/ 1625], loss: 0.986, per_step_time: 1469ms, lr: 8.554183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:00,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.44366 samples/s/p 2:02:07 } +2024-07-25 23:10:03,236 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1516/ 1625], loss: 1.075, per_step_time: 1471ms, lr: 8.548715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:03,237 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.43843 samples/s/p 2:02:11 } +2024-07-25 23:10:06,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1518/ 1625], loss: 1.097, per_step_time: 1470ms, lr: 8.543249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:06,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.3% |██████████████████████████████████ | 5.43941 samples/s/p 2:02:07 } +2024-07-25 23:10:09,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1520/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 8.537784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:09,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.44149 samples/s/p 2:02:01 } +2024-07-25 23:10:12,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1522/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 8.532321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:12,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% 
|██████████████████████████████████ | 5.43117 samples/s/p 2:02:12 } +2024-07-25 23:10:15,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1524/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 8.5268575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:15,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43471 samples/s/p 2:02:04 } +2024-07-25 23:10:17,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1526/ 1625], loss: 1.011, per_step_time: 1471ms, lr: 8.521397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:17,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43645 samples/s/p 2:01:59 } +2024-07-25 23:10:20,939 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1528/ 1625], loss: 0.987, per_step_time: 1472ms, lr: 8.515936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:20,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43381 samples/s/p 2:02:00 } +2024-07-25 23:10:23,888 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1530/ 1625], loss: 1.117, per_step_time: 1470ms, lr: 8.5104775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:23,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43904 samples/s/p 2:01:50 } +2024-07-25 23:10:26,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1532/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 8.505021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:26,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43475 samples/s/p 2:01:52 } 
+2024-07-25 23:10:29,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1534/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 8.499564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:29,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.4% |██████████████████████████████████ | 5.43733 samples/s/p 2:01:46 } +2024-07-25 23:10:32,738 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1536/ 1625], loss: 1.032, per_step_time: 1471ms, lr: 8.494109e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:32,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.43833 samples/s/p 2:01:42 } +2024-07-25 23:10:35,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1538/ 1625], loss: 1.328, per_step_time: 1473ms, lr: 8.488656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:35,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.42903 samples/s/p 2:01:51 } +2024-07-25 23:10:38,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1540/ 1625], loss: 1.013, per_step_time: 1470ms, lr: 8.483204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:38,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.43937 samples/s/p 2:01:34 } +2024-07-25 23:10:41,595 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1542/ 1625], loss: 1.068, per_step_time: 1473ms, lr: 8.477753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:41,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.42905 samples/s/p 2:01:45 } +2024-07-25 23:10:44,544 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1544/ 1625], loss: 0.986, per_step_time: 1470ms, lr: 8.472306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:44,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.43968 samples/s/p 2:01:28 } +2024-07-25 23:10:47,499 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1546/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 8.4668545e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:47,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.43440 samples/s/p 2:01:32 } +2024-07-25 23:10:50,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1548/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 8.461408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:50,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.43217 samples/s/p 2:01:32 } +2024-07-25 23:10:53,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1550/ 1625], loss: 1.124, per_step_time: 1482ms, lr: 8.455965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:53,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.5% |██████████████████████████████████ | 5.39587 samples/s/p 2:02:18 } +2024-07-25 23:10:56,377 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1552/ 1625], loss: 1.251, per_step_time: 1473ms, lr: 8.45052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:56,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.42989 samples/s/p 2:01:30 } +2024-07-25 23:10:59,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 7/ 10], step:[ 1554/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 8.445074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:10:59,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43357 samples/s/p 2:01:22 } +2024-07-25 23:11:02,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1556/ 1625], loss: 1.084, per_step_time: 1470ms, lr: 8.439636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:02,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43909 samples/s/p 2:01:11 } +2024-07-25 23:11:05,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1558/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 8.434195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:05,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43639 samples/s/p 2:01:12 } +2024-07-25 23:11:08,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1560/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 8.428756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:08,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43807 samples/s/p 2:01:07 } +2024-07-25 23:11:11,127 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1562/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 8.423317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:11,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43721 samples/s/p 2:01:05 } +2024-07-25 23:11:14,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1564/ 1625], loss: 1.206, per_step_time: 
1471ms, lr: 8.41788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:14,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43575 samples/s/p 2:01:04 } +2024-07-25 23:11:17,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1566/ 1625], loss: 1.008, per_step_time: 1472ms, lr: 8.412446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:17,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43277 samples/s/p 2:01:05 } +2024-07-25 23:11:19,980 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1568/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 8.407012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:19,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.6% |██████████████████████████████████ | 5.43556 samples/s/p 2:00:58 } +2024-07-25 23:11:22,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1570/ 1625], loss: 1.127, per_step_time: 1473ms, lr: 8.401578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:22,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.42895 samples/s/p 2:01:04 } +2024-07-25 23:11:25,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1572/ 1625], loss: 1.227, per_step_time: 1469ms, lr: 8.396148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:25,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.44278 samples/s/p 2:00:43 } +2024-07-25 23:11:28,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1574/ 1625], loss: 1.042, per_step_time: 1470ms, lr: 8.390716e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:11:28,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43868 samples/s/p 2:00:45 } +2024-07-25 23:11:31,779 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1576/ 1625], loss: 1.220, per_step_time: 1470ms, lr: 8.385287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:31,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.44015 samples/s/p 2:00:40 } +2024-07-25 23:11:34,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1578/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 8.37986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:34,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43703 samples/s/p 2:00:42 } +2024-07-25 23:11:37,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1580/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 8.3744335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:37,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43667 samples/s/p 2:00:39 } +2024-07-25 23:11:40,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1582/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 8.369009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:40,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43688 samples/s/p 2:00:36 } +2024-07-25 23:11:43,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1584/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 8.363585e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:43,580 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.7% |██████████████████████████████████ | 5.43359 samples/s/p 2:00:37 } +2024-07-25 23:11:46,539 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1586/ 1625], loss: 1.240, per_step_time: 1475ms, lr: 8.358163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:46,540 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.42139 samples/s/p 2:00:51 } +2024-07-25 23:11:49,489 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1588/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 8.352746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:49,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43641 samples/s/p 2:00:28 } +2024-07-25 23:11:52,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1590/ 1625], loss: 1.150, per_step_time: 1472ms, lr: 8.347323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:52,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43336 samples/s/p 2:00:29 } +2024-07-25 23:11:55,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1592/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 8.3419045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:55,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43206 samples/s/p 2:00:28 } +2024-07-25 23:11:58,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1594/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 8.33649e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:11:58,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% 
|██████████████████████████████████ | 5.42976 samples/s/p 2:00:28 } +2024-07-25 23:12:01,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1596/ 1625], loss: 1.240, per_step_time: 1470ms, lr: 8.3310715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:01,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.44011 samples/s/p 2:00:11 } +2024-07-25 23:12:04,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1598/ 1625], loss: 1.150, per_step_time: 1472ms, lr: 8.325661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:04,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43421 samples/s/p 2:00:16 } +2024-07-25 23:12:07,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1600/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 8.320248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:07,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.8% |██████████████████████████████████ | 5.43567 samples/s/p 2:00:11 } +2024-07-25 23:12:10,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1602/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 8.314836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:10,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43680 samples/s/p 2:00:07 } +2024-07-25 23:12:13,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1604/ 1625], loss: 1.067, per_step_time: 1470ms, lr: 8.3094255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:13,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43962 samples/s/p 2:00:00 } 
+2024-07-25 23:12:16,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1606/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 8.304017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:16,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43301 samples/s/p 2:00:06 } +2024-07-25 23:12:19,000 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1608/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 8.298609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:19,000 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43035 samples/s/p 2:00:06 } +2024-07-25 23:12:21,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1610/ 1625], loss: 0.941, per_step_time: 1472ms, lr: 8.293203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:21,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43465 samples/s/p 1:59:58 } +2024-07-25 23:12:24,899 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1612/ 1625], loss: 1.206, per_step_time: 1470ms, lr: 8.287798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:24,899 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.44003 samples/s/p 1:59:48 } +2024-07-25 23:12:27,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1614/ 1625], loss: 1.266, per_step_time: 1477ms, lr: 8.282394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:27,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.41625 samples/s/p 2:00:16 } +2024-07-25 23:12:30,813 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1616/ 1625], loss: 1.116, per_step_time: 1473ms, lr: 8.276991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:30,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 69.9% |██████████████████████████████████ | 5.43099 samples/s/p 1:59:54 } +2024-07-25 23:12:33,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1618/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 8.271591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:33,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.43730 samples/s/p 1:59:42 } +2024-07-25 23:12:36,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1620/ 1625], loss: 1.401, per_step_time: 1471ms, lr: 8.266191e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:36,714 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.43603 samples/s/p 1:59:41 } +2024-07-25 23:12:39,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1622/ 1625], loss: 1.037, per_step_time: 1470ms, lr: 8.260793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:39,663 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.43920 samples/s/p 1:59:34 } +2024-07-25 23:12:42,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 7/ 10], step:[ 1624/ 1625], loss: 1.285, per_step_time: 1474ms, lr: 8.255394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:42,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |██████████████████████████████████ | 5.42377 samples/s/p 1:59:52 } +2024-07-25 23:12:45,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 1/ 1625], loss: 1.079, per_step_time: 1471ms, lr: 8.250003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:45,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.43713 samples/s/p 1:59:31 } +2024-07-25 23:12:48,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 3/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 8.244605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:48,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.43598 samples/s/p 1:59:30 } +2024-07-25 23:12:51,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 5/ 1625], loss: 1.005, per_step_time: 1472ms, lr: 8.239212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:51,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.43347 samples/s/p 1:59:30 } +2024-07-25 23:12:54,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 7/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 8.233824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:54,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.0% |███████████████████████████████████ | 5.44008 samples/s/p 1:59:18 } +2024-07-25 23:12:57,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 9/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 8.2284305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:12:57,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43593 samples/s/p 1:59:21 } +2024-07-25 23:13:00,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 11/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 
8.223042e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:00,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43782 samples/s/p 1:59:15 } +2024-07-25 23:13:03,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 13/ 1625], loss: 1.318, per_step_time: 1471ms, lr: 8.217657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:03,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43782 samples/s/p 1:59:12 } +2024-07-25 23:13:06,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 15/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 8.212267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:06,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43594 samples/s/p 1:59:12 } +2024-07-25 23:13:09,171 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 17/ 1625], loss: 1.058, per_step_time: 1472ms, lr: 8.2068855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:09,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43232 samples/s/p 1:59:14 } +2024-07-25 23:13:12,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 19/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 8.201501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:12,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43690 samples/s/p 1:59:05 } +2024-07-25 23:13:15,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 21/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 8.196116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:13:15,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43691 samples/s/p 1:59:02 } +2024-07-25 23:13:18,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 23/ 1625], loss: 1.287, per_step_time: 1471ms, lr: 8.190739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:18,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.1% |███████████████████████████████████ | 5.43528 samples/s/p 1:59:01 } +2024-07-25 23:13:20,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 25/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 8.185359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:20,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43382 samples/s/p 1:59:00 } +2024-07-25 23:13:23,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 27/ 1625], loss: 1.206, per_step_time: 1470ms, lr: 8.179981e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:23,927 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43904 samples/s/p 1:58:50 } +2024-07-25 23:13:26,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 29/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 8.174604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:26,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43684 samples/s/p 1:58:50 } +2024-07-25 23:13:29,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 31/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 8.169228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:29,829 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 70.2% |███████████████████████████████████ | 5.43396 samples/s/p 1:58:51 } +2024-07-25 23:13:32,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 33/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 8.163854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:32,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43604 samples/s/p 1:58:45 } +2024-07-25 23:13:35,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 35/ 1625], loss: 1.082, per_step_time: 1471ms, lr: 8.158482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:35,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43498 samples/s/p 1:58:44 } +2024-07-25 23:13:38,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 37/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 8.153111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:38,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43471 samples/s/p 1:58:41 } +2024-07-25 23:13:41,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 39/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 8.14774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:41,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.2% |███████████████████████████████████ | 5.43516 samples/s/p 1:58:38 } +2024-07-25 23:13:44,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 41/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 8.1423705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:44,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43580 samples/s/p 
1:58:34 } +2024-07-25 23:13:47,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 43/ 1625], loss: 1.228, per_step_time: 1470ms, lr: 8.1370035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:47,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.44025 samples/s/p 1:58:25 } +2024-07-25 23:13:50,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 45/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 8.13164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:50,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43654 samples/s/p 1:58:27 } +2024-07-25 23:13:53,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 47/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 8.126273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:53,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43475 samples/s/p 1:58:26 } +2024-07-25 23:13:56,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 49/ 1625], loss: 1.120, per_step_time: 1475ms, lr: 8.120909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:56,388 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.42294 samples/s/p 1:58:39 } +2024-07-25 23:13:59,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 51/ 1625], loss: 1.296, per_step_time: 1472ms, lr: 8.11555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:13:59,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43267 samples/s/p 1:58:23 } +2024-07-25 23:14:02,298 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 53/ 1625], loss: 1.118, per_step_time: 1475ms, lr: 8.110187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:02,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.42025 samples/s/p 1:58:37 } +2024-07-25 23:14:05,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 55/ 1625], loss: 1.382, per_step_time: 1471ms, lr: 8.104828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:05,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.3% |███████████████████████████████████ | 5.43576 samples/s/p 1:58:13 } +2024-07-25 23:14:08,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 57/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 8.099473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:08,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43244 samples/s/p 1:58:15 } +2024-07-25 23:14:11,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 59/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 8.094114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:11,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43850 samples/s/p 1:58:04 } +2024-07-25 23:14:14,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 61/ 1625], loss: 1.079, per_step_time: 1470ms, lr: 8.088761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:14,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43943 samples/s/p 1:58:00 } +2024-07-25 23:14:17,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 
8/ 10], step:[ 63/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 8.083408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:17,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43887 samples/s/p 1:57:57 } +2024-07-25 23:14:19,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 65/ 1625], loss: 1.260, per_step_time: 1472ms, lr: 8.078052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:19,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43348 samples/s/p 1:58:02 } +2024-07-25 23:14:22,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 67/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 8.072704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:22,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43867 samples/s/p 1:57:52 } +2024-07-25 23:14:25,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 69/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 8.067355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:25,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43164 samples/s/p 1:57:58 } +2024-07-25 23:14:28,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 71/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 8.062004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:28,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43953 samples/s/p 1:57:45 } +2024-07-25 23:14:31,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 73/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 
8.05666e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:31,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.4% |███████████████████████████████████ | 5.43253 samples/s/p 1:57:51 } +2024-07-25 23:14:34,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 75/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 8.051315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:34,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.43263 samples/s/p 1:57:48 } +2024-07-25 23:14:37,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 77/ 1625], loss: 0.892, per_step_time: 1470ms, lr: 8.0459695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:37,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.44037 samples/s/p 1:57:35 } +2024-07-25 23:14:40,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 79/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 8.040627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:40,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.42810 samples/s/p 1:57:48 } +2024-07-25 23:14:43,614 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 81/ 1625], loss: 1.188, per_step_time: 1475ms, lr: 8.035286e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:43,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.42032 samples/s/p 1:57:55 } +2024-07-25 23:14:46,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 83/ 1625], loss: 0.976, per_step_time: 1473ms, lr: 8.029945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:14:46,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.42963 samples/s/p 1:57:40 } +2024-07-25 23:14:49,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 85/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 8.024606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:49,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.43194 samples/s/p 1:57:34 } +2024-07-25 23:14:52,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 87/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 8.019269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:52,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.43655 samples/s/p 1:57:25 } +2024-07-25 23:14:55,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 89/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 8.013937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:55,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.5% |███████████████████████████████████ | 5.43532 samples/s/p 1:57:24 } +2024-07-25 23:14:58,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 91/ 1625], loss: 0.993, per_step_time: 1472ms, lr: 8.008599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:14:58,374 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43163 samples/s/p 1:57:26 } +2024-07-25 23:15:01,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 93/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 8.003266e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:01,325 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 70.6% |███████████████████████████████████ | 5.43460 samples/s/p 1:57:19 } +2024-07-25 23:15:04,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 95/ 1625], loss: 1.204, per_step_time: 1468ms, lr: 7.997937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:04,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.44680 samples/s/p 1:57:00 } +2024-07-25 23:15:07,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 97/ 1625], loss: 1.009, per_step_time: 1471ms, lr: 7.992605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:07,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43493 samples/s/p 1:57:13 } +2024-07-25 23:15:10,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 99/ 1625], loss: 1.325, per_step_time: 1472ms, lr: 7.987275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:10,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43341 samples/s/p 1:57:12 } +2024-07-25 23:15:13,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 101/ 1625], loss: 0.903, per_step_time: 1473ms, lr: 7.981951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:13,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.42940 samples/s/p 1:57:14 } +2024-07-25 23:15:16,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 103/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 7.976621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:16,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43714 samples/s/p 
1:57:01 } +2024-07-25 23:15:19,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 105/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 7.9713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:19,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.6% |███████████████████████████████████ | 5.43397 samples/s/p 1:57:02 } +2024-07-25 23:15:21,976 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 107/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 7.965976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:21,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43775 samples/s/p 1:56:54 } +2024-07-25 23:15:24,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 109/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 7.960652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:24,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43066 samples/s/p 1:57:00 } +2024-07-25 23:15:27,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 111/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 7.955334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:27,878 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.44120 samples/s/p 1:56:44 } +2024-07-25 23:15:30,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 113/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 7.950014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:30,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43742 samples/s/p 1:56:46 } +2024-07-25 23:15:33,776 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 115/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 7.944696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:33,776 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43887 samples/s/p 1:56:41 } +2024-07-25 23:15:36,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 117/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 7.93938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:36,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43535 samples/s/p 1:56:43 } +2024-07-25 23:15:39,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 119/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 7.934065e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:39,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.43446 samples/s/p 1:56:41 } +2024-07-25 23:15:42,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 121/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 7.928752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:42,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.7% |███████████████████████████████████ | 5.42759 samples/s/p 1:56:47 } +2024-07-25 23:15:45,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 123/ 1625], loss: 1.200, per_step_time: 1470ms, lr: 7.923439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:45,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.44113 samples/s/p 1:56:26 } +2024-07-25 23:15:48,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 125/ 1625], loss: 1.249, per_step_time: 1470ms, lr: 7.918128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:48,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.44012 samples/s/p 1:56:25 } +2024-07-25 23:15:51,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 127/ 1625], loss: 1.352, per_step_time: 1472ms, lr: 7.912819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:51,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43380 samples/s/p 1:56:30 } +2024-07-25 23:15:54,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 129/ 1625], loss: 1.101, per_step_time: 1473ms, lr: 7.907511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:54,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43044 samples/s/p 1:56:31 } +2024-07-25 23:15:57,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 131/ 1625], loss: 1.145, per_step_time: 1473ms, lr: 7.902204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:15:57,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43064 samples/s/p 1:56:28 } +2024-07-25 23:16:00,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 133/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 7.8969015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:00,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43832 samples/s/p 1:56:15 } +2024-07-25 23:16:03,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 135/ 1625], loss: 1.298, per_step_time: 
1471ms, lr: 7.8915955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:03,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43805 samples/s/p 1:56:13 } +2024-07-25 23:16:06,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 137/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 7.886293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:06,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.8% |███████████████████████████████████ | 5.43722 samples/s/p 1:56:11 } +2024-07-25 23:16:09,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 139/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 7.880994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:09,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43490 samples/s/p 1:56:11 } +2024-07-25 23:16:12,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 141/ 1625], loss: 0.940, per_step_time: 1472ms, lr: 7.875692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:12,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43456 samples/s/p 1:56:08 } +2024-07-25 23:16:15,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 143/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 7.870396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:15,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.44055 samples/s/p 1:55:58 } +2024-07-25 23:16:18,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 145/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 7.8651e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:16:18,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.44009 samples/s/p 1:55:55 } +2024-07-25 23:16:20,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 147/ 1625], loss: 1.226, per_step_time: 1473ms, lr: 7.859801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:20,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.42821 samples/s/p 1:56:08 } +2024-07-25 23:16:23,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 149/ 1625], loss: 0.906, per_step_time: 1470ms, lr: 7.85451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:23,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43883 samples/s/p 1:55:51 } +2024-07-25 23:16:26,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 151/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 7.8492185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:26,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43626 samples/s/p 1:55:51 } +2024-07-25 23:16:29,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 153/ 1625], loss: 1.019, per_step_time: 1471ms, lr: 7.843923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:29,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 70.9% |███████████████████████████████████ | 5.43478 samples/s/p 1:55:50 } +2024-07-25 23:16:32,784 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 155/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 7.838637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:32,785 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43946 samples/s/p 1:55:41 } +2024-07-25 23:16:35,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 157/ 1625], loss: 1.018, per_step_time: 1471ms, lr: 7.833349e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:35,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43483 samples/s/p 1:55:44 } +2024-07-25 23:16:38,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 159/ 1625], loss: 1.267, per_step_time: 1471ms, lr: 7.828062e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:38,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43825 samples/s/p 1:55:37 } +2024-07-25 23:16:41,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 161/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 7.822776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:41,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43765 samples/s/p 1:55:35 } +2024-07-25 23:16:44,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 163/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 7.817492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:44,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43384 samples/s/p 1:55:37 } +2024-07-25 23:16:47,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 165/ 1625], loss: 1.167, per_step_time: 1469ms, lr: 7.812209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:47,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% 
|███████████████████████████████████ | 5.44534 samples/s/p 1:55:19 } +2024-07-25 23:16:50,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 167/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 7.806928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:50,481 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43732 samples/s/p 1:55:26 } +2024-07-25 23:16:53,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 169/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 7.801648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:53,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.0% |███████████████████████████████████ | 5.43023 samples/s/p 1:55:33 } +2024-07-25 23:16:56,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 171/ 1625], loss: 1.289, per_step_time: 1471ms, lr: 7.7963705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:56,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.43614 samples/s/p 1:55:22 } +2024-07-25 23:16:59,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 173/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 7.791093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:16:59,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.42942 samples/s/p 1:55:28 } +2024-07-25 23:17:02,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 175/ 1625], loss: 1.149, per_step_time: 1469ms, lr: 7.785818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:02,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.44378 samples/s/p 1:55:06 } 
+2024-07-25 23:17:05,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 177/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 7.780546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:05,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.44128 samples/s/p 1:55:07 } +2024-07-25 23:17:08,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 179/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 7.77527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:08,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.43819 samples/s/p 1:55:08 } +2024-07-25 23:17:11,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 181/ 1625], loss: 1.099, per_step_time: 1470ms, lr: 7.77e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:11,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.44159 samples/s/p 1:55:00 } +2024-07-25 23:17:14,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 183/ 1625], loss: 1.064, per_step_time: 1470ms, lr: 7.764732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:14,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.44021 samples/s/p 1:54:59 } +2024-07-25 23:17:17,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 185/ 1625], loss: 1.031, per_step_time: 1470ms, lr: 7.7594605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:17,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.1% |███████████████████████████████████ | 5.43992 samples/s/p 1:54:57 } +2024-07-25 23:17:19,972 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 187/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 7.754196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:19,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.44016 samples/s/p 1:54:53 } +2024-07-25 23:17:22,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 189/ 1625], loss: 1.061, per_step_time: 1473ms, lr: 7.748931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:22,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43077 samples/s/p 1:55:02 } +2024-07-25 23:17:25,871 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 191/ 1625], loss: 1.170, per_step_time: 1469ms, lr: 7.743663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:25,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.44467 samples/s/p 1:54:42 } +2024-07-25 23:17:28,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 193/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 7.738405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:28,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43022 samples/s/p 1:54:57 } +2024-07-25 23:17:31,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 195/ 1625], loss: 1.033, per_step_time: 1472ms, lr: 7.733143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:31,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43261 samples/s/p 1:54:51 } +2024-07-25 23:17:34,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 197/ 1625], loss: 1.219, per_step_time: 1473ms, lr: 7.72788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:34,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43070 samples/s/p 1:54:51 } +2024-07-25 23:17:37,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 199/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 7.722625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:37,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43814 samples/s/p 1:54:38 } +2024-07-25 23:17:40,632 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 201/ 1625], loss: 1.314, per_step_time: 1472ms, lr: 7.717367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:40,632 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43183 samples/s/p 1:54:43 } +2024-07-25 23:17:43,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 203/ 1625], loss: 1.261, per_step_time: 1472ms, lr: 7.712112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:43,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.2% |███████████████████████████████████ | 5.43420 samples/s/p 1:54:37 } +2024-07-25 23:17:46,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 205/ 1625], loss: 0.943, per_step_time: 1471ms, lr: 7.706858e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:46,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43558 samples/s/p 1:54:33 } +2024-07-25 23:17:49,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 207/ 1625], loss: 1.187, per_step_time: 1472ms, 
lr: 7.701605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:49,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43250 samples/s/p 1:54:34 } +2024-07-25 23:17:52,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 209/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 7.696354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:52,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.42952 samples/s/p 1:54:35 } +2024-07-25 23:17:55,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 211/ 1625], loss: 1.014, per_step_time: 1477ms, lr: 7.691104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:55,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.41421 samples/s/p 1:54:51 } +2024-07-25 23:17:58,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 213/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 7.685856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:17:58,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43323 samples/s/p 1:54:24 } +2024-07-25 23:18:01,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 215/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 7.680609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:01,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.44180 samples/s/p 1:54:10 } +2024-07-25 23:18:04,252 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 217/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 7.675363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:18:04,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43520 samples/s/p 1:54:16 } +2024-07-25 23:18:07,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 219/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 7.67012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:07,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.3% |███████████████████████████████████ | 5.43427 samples/s/p 1:54:14 } +2024-07-25 23:18:10,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 221/ 1625], loss: 1.104, per_step_time: 1470ms, lr: 7.664877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:10,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.43882 samples/s/p 1:54:05 } +2024-07-25 23:18:13,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 223/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 7.659636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:13,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.42910 samples/s/p 1:54:14 } +2024-07-25 23:18:16,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 225/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 7.654396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:16,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.43919 samples/s/p 1:53:59 } +2024-07-25 23:18:19,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 227/ 1625], loss: 0.939, per_step_time: 1471ms, lr: 7.649158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:19,004 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 71.4% |███████████████████████████████████ | 5.43758 samples/s/p 1:53:58 } +2024-07-25 23:18:21,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 229/ 1625], loss: 0.986, per_step_time: 1482ms, lr: 7.643921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:21,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.39494 samples/s/p 1:54:49 } +2024-07-25 23:18:24,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 231/ 1625], loss: 1.192, per_step_time: 1470ms, lr: 7.638689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:24,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.44078 samples/s/p 1:53:48 } +2024-07-25 23:18:27,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 233/ 1625], loss: 1.245, per_step_time: 1470ms, lr: 7.6334545e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:27,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.44055 samples/s/p 1:53:45 } +2024-07-25 23:18:30,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 235/ 1625], loss: 1.165, per_step_time: 1472ms, lr: 7.628219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:30,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.4% |███████████████████████████████████ | 5.43231 samples/s/p 1:53:53 } +2024-07-25 23:18:33,775 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 237/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 7.6229917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:33,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43588 
samples/s/p 1:53:45 } +2024-07-25 23:18:36,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 239/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 7.617762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:36,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43470 samples/s/p 1:53:44 } +2024-07-25 23:18:39,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 241/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 7.6125307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:39,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43289 samples/s/p 1:53:43 } +2024-07-25 23:18:42,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 243/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 7.607307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:42,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43289 samples/s/p 1:53:40 } +2024-07-25 23:18:45,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 245/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 7.602082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:45,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43264 samples/s/p 1:53:38 } +2024-07-25 23:18:48,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 247/ 1625], loss: 1.175, per_step_time: 1470ms, lr: 7.5968583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:48,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43940 samples/s/p 1:53:26 } +2024-07-25 23:18:51,479 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 249/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 7.5916355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:51,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.44015 samples/s/p 1:53:22 } +2024-07-25 23:18:54,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 251/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 7.586415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:54,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.5% |███████████████████████████████████ | 5.43810 samples/s/p 1:53:22 } +2024-07-25 23:18:57,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 253/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 7.581196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:18:57,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43608 samples/s/p 1:53:21 } +2024-07-25 23:19:00,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 255/ 1625], loss: 1.045, per_step_time: 1470ms, lr: 7.575978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:00,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.44111 samples/s/p 1:53:12 } +2024-07-25 23:19:03,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 257/ 1625], loss: 0.994, per_step_time: 1470ms, lr: 7.5707617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:03,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.44064 samples/s/p 1:53:10 } +2024-07-25 23:19:06,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 259/ 1625], loss: 1.027, per_step_time: 1472ms, lr: 7.5655466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:06,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43204 samples/s/p 1:53:18 } +2024-07-25 23:19:09,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 261/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 7.5603334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:09,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43486 samples/s/p 1:53:11 } +2024-07-25 23:19:12,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 263/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 7.555121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:12,126 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43804 samples/s/p 1:53:04 } +2024-07-25 23:19:15,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 265/ 1625], loss: 1.027, per_step_time: 1470ms, lr: 7.54991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:15,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.44000 samples/s/p 1:52:59 } +2024-07-25 23:19:18,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 267/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 7.5447015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:18,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.6% |███████████████████████████████████ | 5.43473 samples/s/p 1:53:03 } +2024-07-25 23:19:20,977 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 269/ 1625], loss: 1.185, per_step_time: 
1472ms, lr: 7.5394933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:20,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43227 samples/s/p 1:53:03 } +2024-07-25 23:19:23,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 271/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 7.5342878e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:23,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43600 samples/s/p 1:52:55 } +2024-07-25 23:19:26,878 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 273/ 1625], loss: 1.193, per_step_time: 1471ms, lr: 7.529083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:26,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43573 samples/s/p 1:52:52 } +2024-07-25 23:19:29,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 275/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 7.5238827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:29,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43882 samples/s/p 1:52:46 } +2024-07-25 23:19:32,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 277/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 7.518678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:32,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43811 samples/s/p 1:52:44 } +2024-07-25 23:19:35,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 279/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 7.513478e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-25 23:19:35,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43562 samples/s/p 1:52:44 } +2024-07-25 23:19:38,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 281/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 7.508282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:38,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43344 samples/s/p 1:52:44 } +2024-07-25 23:19:41,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 283/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 7.5030853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:41,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.7% |███████████████████████████████████ | 5.43765 samples/s/p 1:52:35 } +2024-07-25 23:19:44,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 285/ 1625], loss: 1.018, per_step_time: 1470ms, lr: 7.4978893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:44,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.43969 samples/s/p 1:52:30 } +2024-07-25 23:19:47,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 287/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 7.492694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:47,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.43869 samples/s/p 1:52:28 } +2024-07-25 23:19:50,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 289/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 7.4875015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:50,478 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.43333 samples/s/p 1:52:32 } +2024-07-25 23:19:53,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 291/ 1625], loss: 1.135, per_step_time: 1475ms, lr: 7.4823097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:53,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.42139 samples/s/p 1:52:44 } +2024-07-25 23:19:56,388 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 293/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 7.4771206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:56,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.43112 samples/s/p 1:52:29 } +2024-07-25 23:19:59,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 295/ 1625], loss: 1.119, per_step_time: 1470ms, lr: 7.471932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:19:59,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.44096 samples/s/p 1:52:14 } +2024-07-25 23:20:02,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 297/ 1625], loss: 1.064, per_step_time: 1473ms, lr: 7.4667446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:02,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.8% |███████████████████████████████████ | 5.42845 samples/s/p 1:52:26 } +2024-07-25 23:20:05,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 299/ 1625], loss: 1.055, per_step_time: 1471ms, lr: 7.4615587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:05,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
71.8% |███████████████████████████████████ | 5.43842 samples/s/p 1:52:11 } +2024-07-25 23:20:08,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 301/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 7.456376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:08,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43573 samples/s/p 1:52:11 } +2024-07-25 23:20:11,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 303/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 7.4511927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:11,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43441 samples/s/p 1:52:10 } +2024-07-25 23:20:14,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 305/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 7.446012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:14,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43559 samples/s/p 1:52:06 } +2024-07-25 23:20:17,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 307/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 7.4408326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:17,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.42760 samples/s/p 1:52:12 } +2024-07-25 23:20:20,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 309/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 7.435654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:20,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.42757 samples/s/p 
1:52:10 } +2024-07-25 23:20:22,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 311/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 7.430478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:22,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43752 samples/s/p 1:51:54 } +2024-07-25 23:20:25,900 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 313/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 7.4253053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:25,900 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43766 samples/s/p 1:51:51 } +2024-07-25 23:20:28,848 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 315/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 7.4201294e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:28,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 71.9% |███████████████████████████████████ | 5.43904 samples/s/p 1:51:47 } +2024-07-25 23:20:31,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 317/ 1625], loss: 1.017, per_step_time: 1472ms, lr: 7.4149575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:31,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.43452 samples/s/p 1:51:49 } +2024-07-25 23:20:34,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 319/ 1625], loss: 0.999, per_step_time: 1469ms, lr: 7.4097893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:34,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.44286 samples/s/p 1:51:36 } +2024-07-25 23:20:37,700 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 321/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 7.4046175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:37,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.42993 samples/s/p 1:51:49 } +2024-07-25 23:20:40,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 323/ 1625], loss: 1.174, per_step_time: 1474ms, lr: 7.39945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:40,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |███████████████████████████████████ | 5.42571 samples/s/p 1:51:51 } +2024-07-25 23:20:43,607 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 325/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 7.394287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:43,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43422 samples/s/p 1:51:38 } +2024-07-25 23:20:46,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 327/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 7.389119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:46,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43678 samples/s/p 1:51:32 } +2024-07-25 23:20:49,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 329/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 7.3839587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:49,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43313 samples/s/p 1:51:33 } +2024-07-25 23:20:52,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 8/ 10], step:[ 331/ 1625], loss: 0.983, per_step_time: 1472ms, lr: 7.3787974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:52,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43401 samples/s/p 1:51:29 } +2024-07-25 23:20:55,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 333/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 7.373637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:55,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.0% |████████████████████████████████████ | 5.43310 samples/s/p 1:51:27 } +2024-07-25 23:20:58,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 335/ 1625], loss: 1.035, per_step_time: 1471ms, lr: 7.368479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:20:58,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43520 samples/s/p 1:51:22 } +2024-07-25 23:21:01,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 337/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 7.363322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:01,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43919 samples/s/p 1:51:14 } +2024-07-25 23:21:04,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 339/ 1625], loss: 1.283, per_step_time: 1470ms, lr: 7.3581655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:04,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43872 samples/s/p 1:51:12 } +2024-07-25 23:21:07,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 341/ 1625], loss: 1.095, per_step_time: 
1470ms, lr: 7.353012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:07,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43870 samples/s/p 1:51:09 } +2024-07-25 23:21:10,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 343/ 1625], loss: 1.290, per_step_time: 1473ms, lr: 7.347859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:10,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.42922 samples/s/p 1:51:17 } +2024-07-25 23:21:13,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 345/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 7.342708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:13,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43194 samples/s/p 1:51:11 } +2024-07-25 23:21:16,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 347/ 1625], loss: 1.077, per_step_time: 1469ms, lr: 7.337559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:16,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.44259 samples/s/p 1:50:55 } +2024-07-25 23:21:19,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 349/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 7.3324104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:19,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.1% |████████████████████████████████████ | 5.43160 samples/s/p 1:51:06 } +2024-07-25 23:21:21,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 351/ 1625], loss: 1.164, per_step_time: 1469ms, lr: 7.3272636e-06, overflow cond: False, loss_scale: 
1.0 +2024-07-25 23:21:21,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.44444 samples/s/p 1:50:47 } +2024-07-25 23:21:24,913 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 353/ 1625], loss: 1.048, per_step_time: 1472ms, lr: 7.3221186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:24,913 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.43160 samples/s/p 1:51:00 } +2024-07-25 23:21:27,860 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 355/ 1625], loss: 1.153, per_step_time: 1469ms, lr: 7.3169754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:27,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.44221 samples/s/p 1:50:44 } +2024-07-25 23:21:30,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 357/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 7.311836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:30,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.43407 samples/s/p 1:50:51 } +2024-07-25 23:21:33,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 359/ 1625], loss: 1.053, per_step_time: 1476ms, lr: 7.3066926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:33,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.41983 samples/s/p 1:51:05 } +2024-07-25 23:21:36,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 361/ 1625], loss: 1.032, per_step_time: 1470ms, lr: 7.3015535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:36,719 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.44132 samples/s/p 1:50:36 } +2024-07-25 23:21:39,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 363/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 7.296419e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:39,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.43705 samples/s/p 1:50:38 } +2024-07-25 23:21:42,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 365/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 7.29128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:42,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.2% |████████████████████████████████████ | 5.43546 samples/s/p 1:50:37 } +2024-07-25 23:21:45,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 367/ 1625], loss: 1.058, per_step_time: 1470ms, lr: 7.2861453e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:45,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43901 samples/s/p 1:50:30 } +2024-07-25 23:21:48,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 369/ 1625], loss: 1.043, per_step_time: 1471ms, lr: 7.2810158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:48,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43812 samples/s/p 1:50:28 } +2024-07-25 23:21:51,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 371/ 1625], loss: 1.237, per_step_time: 1469ms, lr: 7.275881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:51,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
72.3% |████████████████████████████████████ | 5.44455 samples/s/p 1:50:17 } +2024-07-25 23:21:54,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 373/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 7.2707544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:54,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43400 samples/s/p 1:50:27 } +2024-07-25 23:21:57,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 375/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 7.2656258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:21:57,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43479 samples/s/p 1:50:23 } +2024-07-25 23:22:00,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 377/ 1625], loss: 1.169, per_step_time: 1469ms, lr: 7.2604957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:00,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.44232 samples/s/p 1:50:11 } +2024-07-25 23:22:03,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 379/ 1625], loss: 1.279, per_step_time: 1472ms, lr: 7.255374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:03,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43308 samples/s/p 1:50:20 } +2024-07-25 23:22:06,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 381/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 7.25025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:06,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.3% |████████████████████████████████████ | 5.43249 
samples/s/p 1:50:17 } +2024-07-25 23:22:09,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 383/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 7.245127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:09,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43717 samples/s/p 1:50:09 } +2024-07-25 23:22:12,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 385/ 1625], loss: 1.039, per_step_time: 1472ms, lr: 7.2400067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:12,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43243 samples/s/p 1:50:12 } +2024-07-25 23:22:15,069 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 387/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 7.2348876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:15,070 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43271 samples/s/p 1:50:08 } +2024-07-25 23:22:18,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 389/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 7.2297703e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:18,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43919 samples/s/p 1:49:58 } +2024-07-25 23:22:20,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 391/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 7.2246526e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:20,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43806 samples/s/p 1:49:56 } +2024-07-25 23:22:23,922 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 393/ 1625], loss: 1.149, per_step_time: 1474ms, lr: 7.219539e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:23,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.42679 samples/s/p 1:50:07 } +2024-07-25 23:22:26,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 395/ 1625], loss: 0.985, per_step_time: 1471ms, lr: 7.214425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:26,873 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43520 samples/s/p 1:49:54 } +2024-07-25 23:22:29,823 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 397/ 1625], loss: 1.323, per_step_time: 1471ms, lr: 7.209314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:29,823 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.4% |████████████████████████████████████ | 5.43619 samples/s/p 1:49:49 } +2024-07-25 23:22:32,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 399/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 7.2042035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:32,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43350 samples/s/p 1:49:50 } +2024-07-25 23:22:35,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 401/ 1625], loss: 1.206, per_step_time: 1475ms, lr: 7.199098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:35,732 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.42336 samples/s/p 1:49:59 } +2024-07-25 23:22:38,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - 
{ Epoch:[ 8/ 10], step:[ 403/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 7.1939876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:38,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43156 samples/s/p 1:49:46 } +2024-07-25 23:22:41,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 405/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 7.1888826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:41,633 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43775 samples/s/p 1:49:36 } +2024-07-25 23:22:44,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 407/ 1625], loss: 1.280, per_step_time: 1471ms, lr: 7.183781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:44,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43693 samples/s/p 1:49:34 } +2024-07-25 23:22:47,536 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 409/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 7.1786762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:47,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43114 samples/s/p 1:49:38 } +2024-07-25 23:22:50,486 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 411/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 7.1735753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:50,486 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43679 samples/s/p 1:49:28 } +2024-07-25 23:22:53,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 413/ 1625], loss: 1.243, 
per_step_time: 1470ms, lr: 7.168479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:53,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.5% |████████████████████████████████████ | 5.43909 samples/s/p 1:49:22 } +2024-07-25 23:22:56,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 415/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 7.163378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:56,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43712 samples/s/p 1:49:22 } +2024-07-25 23:22:59,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 417/ 1625], loss: 1.249, per_step_time: 1470ms, lr: 7.158285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:22:59,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43958 samples/s/p 1:49:16 } +2024-07-25 23:23:02,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 419/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 7.15319e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:02,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43340 samples/s/p 1:49:20 } +2024-07-25 23:23:05,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 421/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 7.148094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:05,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43459 samples/s/p 1:49:16 } +2024-07-25 23:23:08,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 423/ 1625], loss: 1.299, per_step_time: 1470ms, lr: 7.1430045e-06, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 23:23:08,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43944 samples/s/p 1:49:07 } +2024-07-25 23:23:11,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 425/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 7.137915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:11,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43988 samples/s/p 1:49:04 } +2024-07-25 23:23:14,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 427/ 1625], loss: 1.171, per_step_time: 1470ms, lr: 7.1328236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:14,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43859 samples/s/p 1:49:02 } +2024-07-25 23:23:17,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 429/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 7.127739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:17,030 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.6% |████████████████████████████████████ | 5.43747 samples/s/p 1:49:01 } +2024-07-25 23:23:19,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 431/ 1625], loss: 1.294, per_step_time: 1473ms, lr: 7.1226536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:19,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.42973 samples/s/p 1:49:07 } +2024-07-25 23:23:22,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 433/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 7.117569e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:22,933 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.43624 samples/s/p 1:48:56 } +2024-07-25 23:23:25,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 435/ 1625], loss: 1.017, per_step_time: 1471ms, lr: 7.1124873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:25,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.43804 samples/s/p 1:48:51 } +2024-07-25 23:23:28,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 437/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 7.1074064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:28,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.43725 samples/s/p 1:48:49 } +2024-07-25 23:23:31,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 439/ 1625], loss: 1.191, per_step_time: 1469ms, lr: 7.102327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:31,779 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.44228 samples/s/p 1:48:40 } +2024-07-25 23:23:34,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 441/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 7.097249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:34,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.43565 samples/s/p 1:48:45 } +2024-07-25 23:23:37,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 443/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 7.092173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:37,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 72.7% |████████████████████████████████████ | 5.43740 samples/s/p 1:48:40 } +2024-07-25 23:23:40,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 445/ 1625], loss: 1.092, per_step_time: 1473ms, lr: 7.087101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:40,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.7% |████████████████████████████████████ | 5.42887 samples/s/p 1:48:48 } +2024-07-25 23:23:43,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 447/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 7.082025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:43,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43636 samples/s/p 1:48:36 } +2024-07-25 23:23:46,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 449/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 7.076954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:46,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43813 samples/s/p 1:48:31 } +2024-07-25 23:23:49,485 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 451/ 1625], loss: 1.398, per_step_time: 1472ms, lr: 7.0718866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:49,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43300 samples/s/p 1:48:34 } +2024-07-25 23:23:52,436 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 453/ 1625], loss: 1.149, per_step_time: 1471ms, lr: 7.066815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:52,436 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43573 
samples/s/p 1:48:28 } +2024-07-25 23:23:55,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 455/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 7.061751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:55,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43568 samples/s/p 1:48:25 } +2024-07-25 23:23:58,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 457/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 7.0566857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:23:58,336 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43691 samples/s/p 1:48:20 } +2024-07-25 23:24:01,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 459/ 1625], loss: 1.130, per_step_time: 1472ms, lr: 7.0516194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:01,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43206 samples/s/p 1:48:23 } +2024-07-25 23:24:04,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 461/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 7.0465603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:04,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43300 samples/s/p 1:48:19 } +2024-07-25 23:24:07,188 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 463/ 1625], loss: 1.203, per_step_time: 1470ms, lr: 7.0415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:07,189 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.8% |████████████████████████████████████ | 5.43876 samples/s/p 1:48:09 } +2024-07-25 23:24:10,137 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 465/ 1625], loss: 1.064, per_step_time: 1470ms, lr: 7.0364367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:10,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43981 samples/s/p 1:48:05 } +2024-07-25 23:24:13,087 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 467/ 1625], loss: 1.256, per_step_time: 1471ms, lr: 7.0313827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:13,088 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43497 samples/s/p 1:48:08 } +2024-07-25 23:24:16,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 469/ 1625], loss: 1.008, per_step_time: 1472ms, lr: 7.026327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:16,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43213 samples/s/p 1:48:08 } +2024-07-25 23:24:18,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 471/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 7.0212723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:18,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43456 samples/s/p 1:48:02 } +2024-07-25 23:24:21,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 473/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 7.016219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:21,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43559 samples/s/p 1:47:58 } +2024-07-25 23:24:24,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 8/ 10], step:[ 475/ 1625], loss: 1.131, per_step_time: 1470ms, lr: 7.0111682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:24,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43998 samples/s/p 1:47:50 } +2024-07-25 23:24:27,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 477/ 1625], loss: 1.088, per_step_time: 1473ms, lr: 7.0061183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:27,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43092 samples/s/p 1:47:58 } +2024-07-25 23:24:30,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 479/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 7.00107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:30,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 72.9% |████████████████████████████████████ | 5.43366 samples/s/p 1:47:52 } +2024-07-25 23:24:33,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 481/ 1625], loss: 1.001, per_step_time: 1472ms, lr: 6.996024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:33,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43164 samples/s/p 1:47:51 } +2024-07-25 23:24:36,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 483/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 6.9909815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:36,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43108 samples/s/p 1:47:49 } +2024-07-25 23:24:39,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 485/ 1625], loss: 1.283, 
per_step_time: 1474ms, lr: 6.985936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:39,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.42720 samples/s/p 1:47:51 } +2024-07-25 23:24:42,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 487/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 6.980893e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:42,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43376 samples/s/p 1:47:40 } +2024-07-25 23:24:45,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 489/ 1625], loss: 1.295, per_step_time: 1471ms, lr: 6.975856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:45,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43500 samples/s/p 1:47:35 } +2024-07-25 23:24:48,513 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 491/ 1625], loss: 1.066, per_step_time: 1473ms, lr: 6.970814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:48,513 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.42871 samples/s/p 1:47:40 } +2024-07-25 23:24:51,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 493/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 6.965778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:51,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.43389 samples/s/p 1:47:31 } +2024-07-25 23:24:54,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 495/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 6.9607454e-06, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 23:24:54,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.0% |████████████████████████████████████ | 5.42999 samples/s/p 1:47:33 } +2024-07-25 23:24:57,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 497/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 6.955708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:24:57,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43250 samples/s/p 1:47:27 } +2024-07-25 23:25:00,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 499/ 1625], loss: 1.284, per_step_time: 1470ms, lr: 6.950678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:00,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43968 samples/s/p 1:47:15 } +2024-07-25 23:25:03,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 501/ 1625], loss: 0.971, per_step_time: 1472ms, lr: 6.9456473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:03,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43162 samples/s/p 1:47:22 } +2024-07-25 23:25:06,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 503/ 1625], loss: 1.229, per_step_time: 1473ms, lr: 6.9406155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:06,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43004 samples/s/p 1:47:21 } +2024-07-25 23:25:09,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 505/ 1625], loss: 1.149, per_step_time: 1470ms, lr: 6.9355906e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:09,175 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43888 samples/s/p 1:47:07 } +2024-07-25 23:25:12,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 507/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 6.9305643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:12,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43278 samples/s/p 1:47:12 } +2024-07-25 23:25:15,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 509/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 6.9255375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:15,075 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43914 samples/s/p 1:47:01 } +2024-07-25 23:25:18,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 511/ 1625], loss: 1.063, per_step_time: 1471ms, lr: 6.920517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:18,026 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.1% |████████████████████████████████████ | 5.43543 samples/s/p 1:47:03 } +2024-07-25 23:25:20,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 513/ 1625], loss: 1.141, per_step_time: 1476ms, lr: 6.9154958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:20,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.41927 samples/s/p 1:47:19 } +2024-07-25 23:25:23,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 515/ 1625], loss: 1.279, per_step_time: 1472ms, lr: 6.910476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:23,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO 
- 73.2% |████████████████████████████████████ | 5.43148 samples/s/p 1:47:01 } +2024-07-25 23:25:26,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 517/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 6.905458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:26,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43048 samples/s/p 1:47:00 } +2024-07-25 23:25:29,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 519/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 6.900441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:29,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43896 samples/s/p 1:46:47 } +2024-07-25 23:25:32,791 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 521/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 6.8954255e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:32,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43960 samples/s/p 1:46:43 } +2024-07-25 23:25:35,745 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 523/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 6.890413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:35,745 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43002 samples/s/p 1:46:51 } +2024-07-25 23:25:38,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 525/ 1625], loss: 1.388, per_step_time: 1472ms, lr: 6.885401e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:38,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43239 
samples/s/p 1:46:46 } +2024-07-25 23:25:41,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 527/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 6.880391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:41,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.2% |████████████████████████████████████ | 5.43185 samples/s/p 1:46:43 } +2024-07-25 23:25:44,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 529/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 6.8753825e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:44,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43428 samples/s/p 1:46:37 } +2024-07-25 23:25:47,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 531/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 6.870375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:47,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43155 samples/s/p 1:46:38 } +2024-07-25 23:25:50,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 533/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 6.8653726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:50,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43335 samples/s/p 1:46:33 } +2024-07-25 23:25:53,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 535/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 6.860366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:53,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43585 samples/s/p 1:46:27 } +2024-07-25 23:25:56,406 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 537/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 6.8553636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:56,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43509 samples/s/p 1:46:25 } +2024-07-25 23:25:59,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 539/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 6.8503664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:25:59,359 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43313 samples/s/p 1:46:24 } +2024-07-25 23:26:02,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 541/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 6.8453637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:02,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43902 samples/s/p 1:46:14 } +2024-07-25 23:26:05,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 543/ 1625], loss: 1.019, per_step_time: 1471ms, lr: 6.840369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:05,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.3% |████████████████████████████████████ | 5.43829 samples/s/p 1:46:12 } +2024-07-25 23:26:08,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 545/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 6.835374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:08,207 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43674 samples/s/p 1:46:11 } +2024-07-25 23:26:11,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 8/ 10], step:[ 547/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 6.8303757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:11,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43196 samples/s/p 1:46:14 } +2024-07-25 23:26:14,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 549/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 6.825386e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:14,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43579 samples/s/p 1:46:06 } +2024-07-25 23:26:17,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 551/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 6.8203954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:17,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43596 samples/s/p 1:46:03 } +2024-07-25 23:26:20,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 553/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 6.815403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:20,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43275 samples/s/p 1:46:04 } +2024-07-25 23:26:22,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 555/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 6.810418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:22,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43703 samples/s/p 1:45:56 } +2024-07-25 23:26:25,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 557/ 1625], loss: 1.147, 
per_step_time: 1471ms, lr: 6.8054314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:25,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43780 samples/s/p 1:45:52 } +2024-07-25 23:26:28,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 559/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 6.800447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:28,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.4% |████████████████████████████████████ | 5.43422 samples/s/p 1:45:53 } +2024-07-25 23:26:31,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 561/ 1625], loss: 1.121, per_step_time: 1473ms, lr: 6.795464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:31,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.42909 samples/s/p 1:45:56 } +2024-07-25 23:26:34,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 563/ 1625], loss: 1.001, per_step_time: 1471ms, lr: 6.790483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:34,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43488 samples/s/p 1:45:47 } +2024-07-25 23:26:37,720 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 565/ 1625], loss: 1.010, per_step_time: 1472ms, lr: 6.785503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:37,721 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43371 samples/s/p 1:45:45 } +2024-07-25 23:26:40,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 567/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 6.780525e-06, overflow cond: False, 
loss_scale: 1.0 +2024-07-25 23:26:40,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43118 samples/s/p 1:45:45 } +2024-07-25 23:26:43,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 569/ 1625], loss: 1.236, per_step_time: 1472ms, lr: 6.7755473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:43,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43313 samples/s/p 1:45:40 } +2024-07-25 23:26:46,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 571/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 6.770573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:46,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43319 samples/s/p 1:45:37 } +2024-07-25 23:26:49,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 573/ 1625], loss: 1.033, per_step_time: 1472ms, lr: 6.7655997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:49,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43468 samples/s/p 1:45:32 } +2024-07-25 23:26:52,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 575/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 6.7606275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:52,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.5% |████████████████████████████████████ | 5.43556 samples/s/p 1:45:28 } +2024-07-25 23:26:55,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 577/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 6.755657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:55,430 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43451 samples/s/p 1:45:26 } +2024-07-25 23:26:58,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 579/ 1625], loss: 1.231, per_step_time: 1471ms, lr: 6.7506894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:26:58,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43523 samples/s/p 1:45:23 } +2024-07-25 23:27:01,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 581/ 1625], loss: 1.042, per_step_time: 1473ms, lr: 6.7457217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:01,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43008 samples/s/p 1:45:26 } +2024-07-25 23:27:04,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 583/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 6.74076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:04,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.42958 samples/s/p 1:45:23 } +2024-07-25 23:27:07,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 585/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 6.735793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:07,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43427 samples/s/p 1:45:15 } +2024-07-25 23:27:10,190 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 587/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 6.730834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:10,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 
73.6% |████████████████████████████████████ | 5.43570 samples/s/p 1:45:10 } +2024-07-25 23:27:13,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 589/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 6.725873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:13,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43196 samples/s/p 1:45:12 } +2024-07-25 23:27:16,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 591/ 1625], loss: 1.129, per_step_time: 1482ms, lr: 6.720911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:16,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.39672 samples/s/p 1:45:50 } +2024-07-25 23:27:19,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 593/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 6.715957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:19,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.6% |████████████████████████████████████ | 5.43527 samples/s/p 1:45:02 } +2024-07-25 23:27:22,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 595/ 1625], loss: 0.980, per_step_time: 1472ms, lr: 6.7110013e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:22,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43477 samples/s/p 1:45:00 } +2024-07-25 23:27:24,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 597/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 6.7060473e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:24,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43365 
samples/s/p 1:44:58 } +2024-07-25 23:27:27,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 599/ 1625], loss: 1.117, per_step_time: 1470ms, lr: 6.701095e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:27,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43957 samples/s/p 1:44:48 } +2024-07-25 23:27:30,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 601/ 1625], loss: 1.262, per_step_time: 1471ms, lr: 6.6961447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:30,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43760 samples/s/p 1:44:48 } +2024-07-25 23:27:33,813 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 603/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 6.691195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:33,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43915 samples/s/p 1:44:43 } +2024-07-25 23:27:36,763 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 605/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 6.686248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:36,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43589 samples/s/p 1:44:44 } +2024-07-25 23:27:39,713 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 607/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 6.681302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:39,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.43674 samples/s/p 1:44:40 } +2024-07-25 23:27:42,669 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 609/ 1625], loss: 1.108, per_step_time: 1474ms, lr: 6.6763573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:42,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.7% |████████████████████████████████████ | 5.42625 samples/s/p 1:44:49 } +2024-07-25 23:27:45,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 611/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 6.6714156e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:45,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.44056 samples/s/p 1:44:29 } +2024-07-25 23:27:48,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 613/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 6.6664743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:48,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43542 samples/s/p 1:44:32 } +2024-07-25 23:27:51,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 615/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 6.661535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:51,517 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43757 samples/s/p 1:44:27 } +2024-07-25 23:27:54,468 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 617/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 6.6565976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:54,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43481 samples/s/p 1:44:27 } +2024-07-25 23:27:57,420 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 8/ 10], step:[ 619/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 6.651661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:27:57,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43225 samples/s/p 1:44:27 } +2024-07-25 23:28:00,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 621/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 6.646727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:00,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43465 samples/s/p 1:44:22 } +2024-07-25 23:28:03,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 623/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 6.6417933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:03,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43432 samples/s/p 1:44:19 } +2024-07-25 23:28:06,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 625/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 6.6368652e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:06,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.8% |████████████████████████████████████ | 5.43792 samples/s/p 1:44:12 } +2024-07-25 23:28:09,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 627/ 1625], loss: 1.269, per_step_time: 1474ms, lr: 6.631933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:09,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.42447 samples/s/p 1:44:24 } +2024-07-25 23:28:12,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 629/ 1625], loss: 1.024, 
per_step_time: 1471ms, lr: 6.627005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:12,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43701 samples/s/p 1:44:07 } +2024-07-25 23:28:15,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 631/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 6.6220814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:15,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43692 samples/s/p 1:44:04 } +2024-07-25 23:28:18,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 633/ 1625], loss: 1.245, per_step_time: 1473ms, lr: 6.6171565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:18,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.42848 samples/s/p 1:44:11 } +2024-07-25 23:28:21,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 635/ 1625], loss: 1.020, per_step_time: 1471ms, lr: 6.612231e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:21,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43486 samples/s/p 1:44:01 } +2024-07-25 23:28:23,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 637/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 6.6073126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:23,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43449 samples/s/p 1:43:58 } +2024-07-25 23:28:26,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 639/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 6.602392e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 23:28:26,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.43628 samples/s/p 1:43:53 } +2024-07-25 23:28:29,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 641/ 1625], loss: 1.117, per_step_time: 1473ms, lr: 6.5974746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:29,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 73.9% |████████████████████████████████████ | 5.42894 samples/s/p 1:43:59 } +2024-07-25 23:28:32,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 643/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 6.592558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:32,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.43029 samples/s/p 1:43:54 } +2024-07-25 23:28:35,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 645/ 1625], loss: 0.951, per_step_time: 1473ms, lr: 6.587644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:35,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.43048 samples/s/p 1:43:51 } +2024-07-25 23:28:38,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 647/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 6.5827303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:38,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.43524 samples/s/p 1:43:43 } +2024-07-25 23:28:41,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 649/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 6.5778186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:41,699 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |████████████████████████████████████ | 5.43468 samples/s/p 1:43:40 } +2024-07-25 23:28:44,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 651/ 1625], loss: 1.034, per_step_time: 1473ms, lr: 6.5729087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:44,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.43056 samples/s/p 1:43:42 } +2024-07-25 23:28:47,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 653/ 1625], loss: 1.045, per_step_time: 1471ms, lr: 6.5680006e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:47,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.43651 samples/s/p 1:43:32 } +2024-07-25 23:28:50,550 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 655/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 6.5630943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:50,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.43917 samples/s/p 1:43:26 } +2024-07-25 23:28:53,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 657/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 6.5581894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:53,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.0% |█████████████████████████████████████ | 5.43644 samples/s/p 1:43:27 } +2024-07-25 23:28:56,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 659/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 6.5532854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:56,451 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 74.1% |█████████████████████████████████████ | 5.43617 samples/s/p 1:43:24 } +2024-07-25 23:28:59,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 661/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 6.548384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:28:59,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43147 samples/s/p 1:43:26 } +2024-07-25 23:29:02,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 663/ 1625], loss: 1.387, per_step_time: 1473ms, lr: 6.543484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:02,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43029 samples/s/p 1:43:25 } +2024-07-25 23:29:05,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 665/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 6.538586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:05,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43418 samples/s/p 1:43:17 } +2024-07-25 23:29:08,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 667/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 6.533689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:08,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43172 samples/s/p 1:43:17 } +2024-07-25 23:29:11,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 669/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 6.5287973e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:11,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 
5.43593 samples/s/p 1:43:09 } +2024-07-25 23:29:14,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 671/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 6.5239014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:14,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43449 samples/s/p 1:43:08 } +2024-07-25 23:29:17,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 673/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 6.5190097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:17,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.1% |█████████████████████████████████████ | 5.43169 samples/s/p 1:43:08 } +2024-07-25 23:29:20,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 675/ 1625], loss: 1.227, per_step_time: 1471ms, lr: 6.514122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:20,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43511 samples/s/p 1:43:02 } +2024-07-25 23:29:23,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 677/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 6.5092313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:23,016 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43658 samples/s/p 1:42:57 } +2024-07-25 23:29:25,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 679/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 6.5043446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:25,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43789 samples/s/p 1:42:52 } +2024-07-25 23:29:28,918 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 681/ 1625], loss: 1.126, per_step_time: 1472ms, lr: 6.4994624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:28,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43158 samples/s/p 1:42:57 } +2024-07-25 23:29:31,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 683/ 1625], loss: 1.231, per_step_time: 1469ms, lr: 6.4945793e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:31,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.44230 samples/s/p 1:42:42 } +2024-07-25 23:29:34,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 685/ 1625], loss: 1.049, per_step_time: 1473ms, lr: 6.489697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:34,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43029 samples/s/p 1:42:52 } +2024-07-25 23:29:37,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 687/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 6.4848173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:37,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.43430 samples/s/p 1:42:45 } +2024-07-25 23:29:40,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 689/ 1625], loss: 1.051, per_step_time: 1470ms, lr: 6.4799387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:40,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.2% |█████████████████████████████████████ | 5.44014 samples/s/p 1:42:35 } +2024-07-25 23:29:43,665 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 691/ 1625], loss: 1.242, per_step_time: 1470ms, lr: 6.4750616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:43,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.44073 samples/s/p 1:42:32 } +2024-07-25 23:29:46,613 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 693/ 1625], loss: 1.130, per_step_time: 1470ms, lr: 6.470187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:46,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.44138 samples/s/p 1:42:28 } +2024-07-25 23:29:49,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 695/ 1625], loss: 1.346, per_step_time: 1471ms, lr: 6.4653136e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:49,564 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.43508 samples/s/p 1:42:32 } +2024-07-25 23:29:52,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 697/ 1625], loss: 1.194, per_step_time: 1474ms, lr: 6.4604415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:52,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.42664 samples/s/p 1:42:39 } +2024-07-25 23:29:55,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 699/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 6.4555716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:55,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.43541 samples/s/p 1:42:26 } +2024-07-25 23:29:58,421 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 8/ 10], step:[ 701/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 6.450704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:29:58,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.43492 samples/s/p 1:42:23 } +2024-07-25 23:30:01,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 703/ 1625], loss: 1.145, per_step_time: 1474ms, lr: 6.4458363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:01,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.42397 samples/s/p 1:42:33 } +2024-07-25 23:30:04,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 705/ 1625], loss: 1.295, per_step_time: 1472ms, lr: 6.4409714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:04,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.3% |█████████████████████████████████████ | 5.43370 samples/s/p 1:42:19 } +2024-07-25 23:30:07,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 707/ 1625], loss: 1.114, per_step_time: 1473ms, lr: 6.4361084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:07,285 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.42908 samples/s/p 1:42:21 } +2024-07-25 23:30:10,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 709/ 1625], loss: 1.002, per_step_time: 1471ms, lr: 6.4312467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:10,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43695 samples/s/p 1:42:09 } +2024-07-25 23:30:13,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 711/ 1625], loss: 
1.177, per_step_time: 1470ms, lr: 6.426387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:13,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.44098 samples/s/p 1:42:02 } +2024-07-25 23:30:16,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 713/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 6.4215315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:16,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43515 samples/s/p 1:42:06 } +2024-07-25 23:30:19,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 715/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 6.4166716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:19,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43362 samples/s/p 1:42:04 } +2024-07-25 23:30:22,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 717/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 6.4118162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:22,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43456 samples/s/p 1:42:00 } +2024-07-25 23:30:24,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 719/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 6.406966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:24,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43411 samples/s/p 1:41:58 } +2024-07-25 23:30:27,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 721/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 6.4021115e-06, 
overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:27,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.42947 samples/s/p 1:42:00 } +2024-07-25 23:30:30,891 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 723/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 6.397261e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:30,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.4% |█████████████████████████████████████ | 5.43448 samples/s/p 1:41:52 } +2024-07-25 23:30:33,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 725/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 6.3924163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:33,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43481 samples/s/p 1:41:48 } +2024-07-25 23:30:36,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 727/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 6.387567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:36,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43142 samples/s/p 1:41:49 } +2024-07-25 23:30:39,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 729/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 6.382725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:39,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43313 samples/s/p 1:41:44 } +2024-07-25 23:30:42,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 731/ 1625], loss: 1.114, per_step_time: 1472ms, lr: 6.3778816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 
23:30:42,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43127 samples/s/p 1:41:43 } +2024-07-25 23:30:45,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 733/ 1625], loss: 1.059, per_step_time: 1469ms, lr: 6.373039e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:45,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.44336 samples/s/p 1:41:27 } +2024-07-25 23:30:48,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 735/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 6.3682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:48,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43670 samples/s/p 1:41:31 } +2024-07-25 23:30:51,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 737/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 6.363362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:51,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43607 samples/s/p 1:41:29 } +2024-07-25 23:30:54,496 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 739/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 6.358525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:54,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.5% |█████████████████████████████████████ | 5.43727 samples/s/p 1:41:25 } +2024-07-25 23:30:57,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 741/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 6.353691e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:30:57,445 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43737 samples/s/p 1:41:22 } +2024-07-25 23:31:00,396 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 743/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 6.348857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:00,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43556 samples/s/p 1:41:21 } +2024-07-25 23:31:03,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 745/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 6.3440257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:03,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43596 samples/s/p 1:41:18 } +2024-07-25 23:31:06,294 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 747/ 1625], loss: 1.055, per_step_time: 1470ms, lr: 6.3391963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:06,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43910 samples/s/p 1:41:11 } +2024-07-25 23:31:09,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 749/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 6.334368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:09,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43763 samples/s/p 1:41:10 } +2024-07-25 23:31:12,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 751/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 6.3295415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:12,194 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 74.6% |█████████████████████████████████████ | 5.43771 samples/s/p 1:41:07 } +2024-07-25 23:31:15,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 753/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 6.324717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:15,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43464 samples/s/p 1:41:07 } +2024-07-25 23:31:18,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 755/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 6.3198936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:18,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.6% |█████████████████████████████████████ | 5.43417 samples/s/p 1:41:05 } +2024-07-25 23:31:21,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 757/ 1625], loss: 1.036, per_step_time: 1470ms, lr: 6.3150756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:21,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43896 samples/s/p 1:40:57 } +2024-07-25 23:31:23,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 759/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 6.3102534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:23,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43614 samples/s/p 1:40:57 } +2024-07-25 23:31:26,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 761/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 6.3054354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:26,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 
5.43970 samples/s/p 1:40:50 } +2024-07-25 23:31:29,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 763/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 6.3006214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:29,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43385 samples/s/p 1:40:53 } +2024-07-25 23:31:32,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 765/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 6.295804e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:32,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43265 samples/s/p 1:40:52 } +2024-07-25 23:31:35,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 767/ 1625], loss: 1.295, per_step_time: 1472ms, lr: 6.2909953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:35,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43393 samples/s/p 1:40:47 } +2024-07-25 23:31:38,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 769/ 1625], loss: 1.059, per_step_time: 1475ms, lr: 6.2861827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:38,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.42322 samples/s/p 1:40:56 } +2024-07-25 23:31:41,706 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 771/ 1625], loss: 1.341, per_step_time: 1471ms, lr: 6.2813715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:41,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.7% |█████████████████████████████████████ | 5.43547 samples/s/p 1:40:40 } +2024-07-25 23:31:44,656 
- mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 773/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 6.276566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:44,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43707 samples/s/p 1:40:35 } +2024-07-25 23:31:47,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 775/ 1625], loss: 0.939, per_step_time: 1470ms, lr: 6.27176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:47,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.44094 samples/s/p 1:40:28 } +2024-07-25 23:31:50,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 777/ 1625], loss: 1.034, per_step_time: 1472ms, lr: 6.2669537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:50,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43431 samples/s/p 1:40:32 } +2024-07-25 23:31:53,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 779/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 6.262154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:53,508 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43179 samples/s/p 1:40:32 } +2024-07-25 23:31:56,459 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 781/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 6.2573527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:56,459 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43375 samples/s/p 1:40:27 } +2024-07-25 23:31:59,403 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 8/ 10], step:[ 783/ 1625], loss: 1.039, per_step_time: 1468ms, lr: 6.2525532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:31:59,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.44706 samples/s/p 1:40:09 } +2024-07-25 23:32:02,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 785/ 1625], loss: 1.127, per_step_time: 1471ms, lr: 6.2477557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:02,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43596 samples/s/p 1:40:19 } +2024-07-25 23:32:05,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 787/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 6.24296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:05,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.8% |█████████████████████████████████████ | 5.43502 samples/s/p 1:40:17 } +2024-07-25 23:32:08,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 789/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 6.238167e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:08,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43472 samples/s/p 1:40:14 } +2024-07-25 23:32:11,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 791/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 6.2333734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:11,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43668 samples/s/p 1:40:09 } +2024-07-25 23:32:14,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 793/ 1625], loss: 1.232, 
per_step_time: 1472ms, lr: 6.228583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:14,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43401 samples/s/p 1:40:09 } +2024-07-25 23:32:17,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 795/ 1625], loss: 0.987, per_step_time: 1470ms, lr: 6.2237973e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:17,105 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43936 samples/s/p 1:40:00 } +2024-07-25 23:32:20,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 797/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 6.219008e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:20,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.42977 samples/s/p 1:40:08 } +2024-07-25 23:32:23,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 799/ 1625], loss: 1.374, per_step_time: 1471ms, lr: 6.214222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:23,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43710 samples/s/p 1:39:57 } +2024-07-25 23:32:25,957 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 801/ 1625], loss: 1.252, per_step_time: 1470ms, lr: 6.2094405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:25,957 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.43867 samples/s/p 1:39:52 } +2024-07-25 23:32:28,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 803/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 6.2046556e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 23:32:28,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 74.9% |█████████████████████████████████████ | 5.42907 samples/s/p 1:40:00 } +2024-07-25 23:32:31,861 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 805/ 1625], loss: 1.395, per_step_time: 1471ms, lr: 6.1998753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:31,861 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43751 samples/s/p 1:39:48 } +2024-07-25 23:32:34,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 807/ 1625], loss: 1.243, per_step_time: 1474ms, lr: 6.1950996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:34,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.42673 samples/s/p 1:39:56 } +2024-07-25 23:32:37,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 809/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 6.19032e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:37,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43911 samples/s/p 1:39:40 } +2024-07-25 23:32:40,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 811/ 1625], loss: 0.945, per_step_time: 1472ms, lr: 6.1855476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:40,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43244 samples/s/p 1:39:44 } +2024-07-25 23:32:43,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 813/ 1625], loss: 1.260, per_step_time: 1471ms, lr: 6.180774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:43,667 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43630 samples/s/p 1:39:37 } +2024-07-25 23:32:46,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 815/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 6.1759993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:46,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43337 samples/s/p 1:39:37 } +2024-07-25 23:32:49,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 817/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 6.1712317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:49,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43503 samples/s/p 1:39:33 } +2024-07-25 23:32:52,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 819/ 1625], loss: 1.368, per_step_time: 1471ms, lr: 6.1664637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:52,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.0% |█████████████████████████████████████ | 5.43792 samples/s/p 1:39:26 } +2024-07-25 23:32:55,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 821/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 6.1616947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:55,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.43805 samples/s/p 1:39:23 } +2024-07-25 23:32:58,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 823/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 6.1569326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:32:58,418 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 75.1% |█████████████████████████████████████ | 5.43731 samples/s/p 1:39:21 } +2024-07-25 23:33:01,366 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 825/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 6.1521696e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:01,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.43772 samples/s/p 1:39:18 } +2024-07-25 23:33:04,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 827/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 6.1474075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:04,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.43413 samples/s/p 1:39:19 } +2024-07-25 23:33:07,270 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 829/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 6.142649e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:07,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.43226 samples/s/p 1:39:18 } +2024-07-25 23:33:10,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 831/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 6.13789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:10,224 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.43392 samples/s/p 1:39:13 } +2024-07-25 23:33:13,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 833/ 1625], loss: 1.189, per_step_time: 1470ms, lr: 6.1331343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:13,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 
5.43875 samples/s/p 1:39:05 } +2024-07-25 23:33:16,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 835/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 6.128379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:16,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.1% |█████████████████████████████████████ | 5.44098 samples/s/p 1:39:00 } +2024-07-25 23:33:19,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 837/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 6.1236265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:19,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43548 samples/s/p 1:39:03 } +2024-07-25 23:33:22,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 839/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 6.118878e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:22,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43573 samples/s/p 1:38:59 } +2024-07-25 23:33:24,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 841/ 1625], loss: 1.097, per_step_time: 1473ms, lr: 6.1141263e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:24,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.42993 samples/s/p 1:39:03 } +2024-07-25 23:33:27,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 843/ 1625], loss: 0.900, per_step_time: 1471ms, lr: 6.109379e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:27,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43537 samples/s/p 1:38:54 } +2024-07-25 23:33:30,877 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 845/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 6.1046358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:30,877 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43447 samples/s/p 1:38:52 } +2024-07-25 23:33:33,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 847/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 6.099888e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:33,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43187 samples/s/p 1:38:52 } +2024-07-25 23:33:36,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 849/ 1625], loss: 1.087, per_step_time: 1473ms, lr: 6.095147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:36,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43058 samples/s/p 1:38:50 } +2024-07-25 23:33:39,733 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 851/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 6.090408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:39,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.43529 samples/s/p 1:38:42 } +2024-07-25 23:33:42,680 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 853/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 6.085667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:42,680 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.2% |█████████████████████████████████████ | 5.44151 samples/s/p 1:38:33 } +2024-07-25 23:33:45,628 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 8/ 10], step:[ 855/ 1625], loss: 1.099, per_step_time: 1470ms, lr: 6.0809325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:45,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43944 samples/s/p 1:38:32 } +2024-07-25 23:33:48,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 857/ 1625], loss: 1.190, per_step_time: 1471ms, lr: 6.076197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:48,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43519 samples/s/p 1:38:34 } +2024-07-25 23:33:51,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 859/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 6.071461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:51,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43845 samples/s/p 1:38:27 } +2024-07-25 23:33:54,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 861/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 6.0667317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:54,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43396 samples/s/p 1:38:29 } +2024-07-25 23:33:57,431 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 863/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 6.0620005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:33:57,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43384 samples/s/p 1:38:26 } +2024-07-25 23:34:00,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 865/ 1625], loss: 1.108, 
per_step_time: 1471ms, lr: 6.0572706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:00,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43744 samples/s/p 1:38:19 } +2024-07-25 23:34:03,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 867/ 1625], loss: 1.016, per_step_time: 1469ms, lr: 6.0525454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:03,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.44220 samples/s/p 1:38:11 } +2024-07-25 23:34:06,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 869/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 6.0478205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:06,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.3% |█████████████████████████████████████ | 5.43672 samples/s/p 1:38:14 } +2024-07-25 23:34:09,226 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 871/ 1625], loss: 1.103, per_step_time: 1470ms, lr: 6.0430975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:09,226 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43934 samples/s/p 1:38:08 } +2024-07-25 23:34:12,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 873/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 6.038376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:12,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43523 samples/s/p 1:38:10 } +2024-07-25 23:34:15,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 875/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 6.033657e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-25 23:34:15,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43539 samples/s/p 1:38:07 } +2024-07-25 23:34:18,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 877/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 6.028938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:18,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43399 samples/s/p 1:38:05 } +2024-07-25 23:34:21,030 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 879/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 6.024223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:21,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43373 samples/s/p 1:38:03 } +2024-07-25 23:34:23,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 881/ 1625], loss: 0.951, per_step_time: 1471ms, lr: 6.019508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:23,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.43520 samples/s/p 1:37:58 } +2024-07-25 23:34:26,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 883/ 1625], loss: 0.990, per_step_time: 1469ms, lr: 6.0147977e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:26,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.44414 samples/s/p 1:37:46 } +2024-07-25 23:34:29,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 885/ 1625], loss: 1.224, per_step_time: 1474ms, lr: 6.0100842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:29,883 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.4% |█████████████████████████████████████ | 5.42725 samples/s/p 1:38:01 } +2024-07-25 23:34:32,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 887/ 1625], loss: 1.263, per_step_time: 1473ms, lr: 6.005375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:32,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.42865 samples/s/p 1:37:56 } +2024-07-25 23:34:35,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 889/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 6.0006705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:35,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43678 samples/s/p 1:37:45 } +2024-07-25 23:34:38,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 891/ 1625], loss: 1.047, per_step_time: 1473ms, lr: 5.995962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:38,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43040 samples/s/p 1:37:49 } +2024-07-25 23:34:41,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 893/ 1625], loss: 1.084, per_step_time: 1473ms, lr: 5.9912577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:41,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.42954 samples/s/p 1:37:47 } +2024-07-25 23:34:44,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 895/ 1625], loss: 1.151, per_step_time: 1473ms, lr: 5.986558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:44,647 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 75.5% |█████████████████████████████████████ | 5.43025 samples/s/p 1:37:43 } +2024-07-25 23:34:47,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 897/ 1625], loss: 1.213, per_step_time: 1471ms, lr: 5.9818544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:47,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43545 samples/s/p 1:37:34 } +2024-07-25 23:34:50,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 899/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 5.9771587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:50,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43311 samples/s/p 1:37:34 } +2024-07-25 23:34:53,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 901/ 1625], loss: 1.077, per_step_time: 1473ms, lr: 5.9724625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:53,503 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.5% |█████████████████████████████████████ | 5.43096 samples/s/p 1:37:33 } +2024-07-25 23:34:56,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 903/ 1625], loss: 1.016, per_step_time: 1471ms, lr: 5.9677636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:56,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43697 samples/s/p 1:37:24 } +2024-07-25 23:34:59,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 905/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 5.963073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:34:59,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 
5.43429 samples/s/p 1:37:24 } +2024-07-25 23:35:02,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 907/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 5.958381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:02,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43144 samples/s/p 1:37:24 } +2024-07-25 23:35:05,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 909/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 5.9536887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:05,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43534 samples/s/p 1:37:17 } +2024-07-25 23:35:08,260 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 911/ 1625], loss: 0.999, per_step_time: 1473ms, lr: 5.9490035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:08,261 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43053 samples/s/p 1:37:19 } +2024-07-25 23:35:11,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 913/ 1625], loss: 1.011, per_step_time: 1474ms, lr: 5.944317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:11,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.42607 samples/s/p 1:37:21 } +2024-07-25 23:35:14,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 915/ 1625], loss: 1.147, per_step_time: 1472ms, lr: 5.9396325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:14,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.43460 samples/s/p 1:37:09 } +2024-07-25 23:35:17,113 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 917/ 1625], loss: 1.195, per_step_time: 1469ms, lr: 5.93495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:17,113 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.6% |█████████████████████████████████████ | 5.44396 samples/s/p 1:36:56 } +2024-07-25 23:35:20,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 919/ 1625], loss: 1.008, per_step_time: 1470ms, lr: 5.930269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:20,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.44012 samples/s/p 1:36:57 } +2024-07-25 23:35:23,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 921/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 5.92559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:23,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43344 samples/s/p 1:37:01 } +2024-07-25 23:35:25,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 923/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 5.9209115e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:25,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43209 samples/s/p 1:37:00 } +2024-07-25 23:35:28,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 925/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 5.9162358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:28,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43402 samples/s/p 1:36:55 } +2024-07-25 23:35:31,866 - mindformers[mindformers/core/callback/callback.py:316] - 
INFO - { Epoch:[ 8/ 10], step:[ 927/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 5.911562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:31,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43734 samples/s/p 1:36:48 } +2024-07-25 23:35:34,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 929/ 1625], loss: 1.176, per_step_time: 1472ms, lr: 5.90689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:34,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43279 samples/s/p 1:36:50 } +2024-07-25 23:35:37,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 931/ 1625], loss: 0.982, per_step_time: 1472ms, lr: 5.902219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:37,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.43184 samples/s/p 1:36:48 } +2024-07-25 23:35:40,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 933/ 1625], loss: 1.223, per_step_time: 1474ms, lr: 5.897553e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:40,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.7% |█████████████████████████████████████ | 5.42663 samples/s/p 1:36:51 } +2024-07-25 23:35:43,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 935/ 1625], loss: 1.269, per_step_time: 1470ms, lr: 5.8928836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:43,674 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.44107 samples/s/p 1:36:32 } +2024-07-25 23:35:46,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 937/ 1625], loss: 1.066, 
per_step_time: 1471ms, lr: 5.8882206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:46,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43605 samples/s/p 1:36:35 } +2024-07-25 23:35:49,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 939/ 1625], loss: 1.164, per_step_time: 1473ms, lr: 5.883558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:49,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43056 samples/s/p 1:36:38 } +2024-07-25 23:35:52,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 941/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 5.8788933e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:52,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43128 samples/s/p 1:36:34 } +2024-07-25 23:35:55,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 943/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 5.8742357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:55,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43755 samples/s/p 1:36:24 } +2024-07-25 23:35:58,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 945/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 5.8695773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:35:58,434 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43075 samples/s/p 1:36:29 } +2024-07-25 23:36:01,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 947/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 5.8649184e-06, overflow 
cond: False, loss_scale: 1.0 +2024-07-25 23:36:01,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43794 samples/s/p 1:36:18 } +2024-07-25 23:36:04,335 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 949/ 1625], loss: 1.222, per_step_time: 1472ms, lr: 5.8602677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:04,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.8% |█████████████████████████████████████ | 5.43312 samples/s/p 1:36:20 } +2024-07-25 23:36:07,285 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 951/ 1625], loss: 1.111, per_step_time: 1471ms, lr: 5.8556143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:07,286 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43527 samples/s/p 1:36:15 } +2024-07-25 23:36:10,235 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 953/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 5.8509636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:10,236 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43650 samples/s/p 1:36:11 } +2024-07-25 23:36:13,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 955/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 5.8463143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:13,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43831 samples/s/p 1:36:06 } +2024-07-25 23:36:16,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 957/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 5.8416667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:16,137 
- mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43163 samples/s/p 1:36:10 } +2024-07-25 23:36:19,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 959/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 5.8370215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:19,089 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43227 samples/s/p 1:36:07 } +2024-07-25 23:36:22,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 961/ 1625], loss: 1.304, per_step_time: 1472ms, lr: 5.8323767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:22,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.43254 samples/s/p 1:36:03 } +2024-07-25 23:36:24,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 963/ 1625], loss: 1.170, per_step_time: 1474ms, lr: 5.8277355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:24,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.42658 samples/s/p 1:36:07 } +2024-07-25 23:36:27,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 965/ 1625], loss: 1.222, per_step_time: 1473ms, lr: 5.8230953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:27,951 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 75.9% |█████████████████████████████████████ | 5.42934 samples/s/p 1:36:01 } +2024-07-25 23:36:30,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 967/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 5.818457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:30,903 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.43279 samples/s/p 1:35:54 } +2024-07-25 23:36:33,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 969/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 5.8138203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:33,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.43858 samples/s/p 1:35:45 } +2024-07-25 23:36:36,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 971/ 1625], loss: 1.117, per_step_time: 1470ms, lr: 5.809185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:36,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.44068 samples/s/p 1:35:40 } +2024-07-25 23:36:39,749 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 973/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 5.8045516e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:39,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |█████████████████████████████████████ | 5.43712 samples/s/p 1:35:41 } +2024-07-25 23:36:42,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 975/ 1625], loss: 1.077, per_step_time: 1472ms, lr: 5.799921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:42,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.43307 samples/s/p 1:35:42 } +2024-07-25 23:36:45,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 977/ 1625], loss: 1.011, per_step_time: 1472ms, lr: 5.795291e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:45,653 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 76.0% |██████████████████████████████████████ | 5.43325 samples/s/p 1:35:39 } +2024-07-25 23:36:48,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 979/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 5.790663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:48,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.43599 samples/s/p 1:35:33 } +2024-07-25 23:36:51,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 981/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 5.78604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:51,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.43337 samples/s/p 1:35:33 } +2024-07-25 23:36:54,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 983/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 5.7814163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:54,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.0% |██████████████████████████████████████ | 5.43641 samples/s/p 1:35:27 } +2024-07-25 23:36:57,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 985/ 1625], loss: 1.071, per_step_time: 1470ms, lr: 5.7767907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:36:57,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.44132 samples/s/p 1:35:19 } +2024-07-25 23:37:00,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 987/ 1625], loss: 1.099, per_step_time: 1471ms, lr: 5.7721727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:00,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ 
| 5.43696 samples/s/p 1:35:20 } +2024-07-25 23:37:03,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 989/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 5.7675543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:03,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.43558 samples/s/p 1:35:19 } +2024-07-25 23:37:06,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 991/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 5.7629345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:06,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.43716 samples/s/p 1:35:14 } +2024-07-25 23:37:09,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 993/ 1625], loss: 1.059, per_step_time: 1472ms, lr: 5.758322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:09,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.43255 samples/s/p 1:35:16 } +2024-07-25 23:37:12,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 995/ 1625], loss: 1.058, per_step_time: 1469ms, lr: 5.7537086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:12,200 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.44374 samples/s/p 1:35:01 } +2024-07-25 23:37:15,155 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 997/ 1625], loss: 1.046, per_step_time: 1474ms, lr: 5.749097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:15,155 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.42702 samples/s/p 1:35:16 } +2024-07-25 
23:37:18,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 999/ 1625], loss: 1.326, per_step_time: 1472ms, lr: 5.7444868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:18,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.1% |██████████████████████████████████████ | 5.43432 samples/s/p 1:35:05 } +2024-07-25 23:37:21,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1001/ 1625], loss: 1.147, per_step_time: 1470ms, lr: 5.7398797e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:21,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.43987 samples/s/p 1:34:57 } +2024-07-25 23:37:24,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1003/ 1625], loss: 0.999, per_step_time: 1469ms, lr: 5.735274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:24,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.44227 samples/s/p 1:34:51 } +2024-07-25 23:37:26,951 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1005/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 5.730669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:26,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.43738 samples/s/p 1:34:53 } +2024-07-25 23:37:29,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1007/ 1625], loss: 1.062, per_step_time: 1472ms, lr: 5.726067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:29,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.43362 samples/s/p 1:34:54 } +2024-07-25 23:37:32,857 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1009/ 1625], loss: 1.149, per_step_time: 1473ms, lr: 5.7214656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:32,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.42897 samples/s/p 1:34:56 } +2024-07-25 23:37:35,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1011/ 1625], loss: 1.017, per_step_time: 1469ms, lr: 5.716867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:35,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.44236 samples/s/p 1:34:39 } +2024-07-25 23:37:38,754 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1013/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 5.7122697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:38,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.43631 samples/s/p 1:34:43 } +2024-07-25 23:37:41,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1015/ 1625], loss: 1.275, per_step_time: 1471ms, lr: 5.7076745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:41,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.2% |██████████████████████████████████████ | 5.43498 samples/s/p 1:34:41 } +2024-07-25 23:37:44,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1017/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 5.7030807e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:44,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43495 samples/s/p 1:34:38 } +2024-07-25 23:37:47,609 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1019/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 5.698489e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:47,609 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43058 samples/s/p 1:34:40 } +2024-07-25 23:37:50,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1021/ 1625], loss: 1.097, per_step_time: 1471ms, lr: 5.693899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:50,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43637 samples/s/p 1:34:31 } +2024-07-25 23:37:53,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1023/ 1625], loss: 1.191, per_step_time: 1471ms, lr: 5.6893105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:53,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43649 samples/s/p 1:34:28 } +2024-07-25 23:37:56,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1025/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 5.684727e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:56,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.43393 samples/s/p 1:34:28 } +2024-07-25 23:37:59,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1027/ 1625], loss: 0.913, per_step_time: 1474ms, lr: 5.6801396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:37:59,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.42401 samples/s/p 1:34:35 } +2024-07-25 23:38:02,372 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1029/ 1625], loss: 1.008, per_step_time: 1473ms, lr: 5.675557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:02,372 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.42767 samples/s/p 1:34:28 } +2024-07-25 23:38:05,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1031/ 1625], loss: 1.226, per_step_time: 1474ms, lr: 5.670979e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:05,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.3% |██████████████████████████████████████ | 5.42655 samples/s/p 1:34:26 } +2024-07-25 23:38:08,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1033/ 1625], loss: 1.104, per_step_time: 1470ms, lr: 5.6663994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:08,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43908 samples/s/p 1:34:10 } +2024-07-25 23:38:11,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1035/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 5.6618196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:11,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43601 samples/s/p 1:34:11 } +2024-07-25 23:38:14,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1037/ 1625], loss: 1.022, per_step_time: 1470ms, lr: 5.6572476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:14,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.44016 samples/s/p 1:34:03 } +2024-07-25 23:38:17,128 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1039/ 1625], loss: 1.094, per_step_time: 1473ms, lr: 5.652674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:17,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43044 samples/s/p 1:34:11 } +2024-07-25 23:38:20,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1041/ 1625], loss: 1.030, per_step_time: 1471ms, lr: 5.648102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:20,078 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43713 samples/s/p 1:34:01 } +2024-07-25 23:38:23,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1043/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 5.643532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:23,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43727 samples/s/p 1:33:58 } +2024-07-25 23:38:25,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1045/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 5.6389636e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:25,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43549 samples/s/p 1:33:57 } +2024-07-25 23:38:28,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1047/ 1625], loss: 0.976, per_step_time: 1471ms, lr: 5.6343974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:28,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.4% |██████████████████████████████████████ | 5.43620 samples/s/p 1:33:53 } +2024-07-25 23:38:31,879 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1049/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 5.629833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:31,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43515 samples/s/p 1:33:51 } +2024-07-25 23:38:34,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1051/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 5.6252698e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:34,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43373 samples/s/p 1:33:50 } +2024-07-25 23:38:37,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1053/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 5.620709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:37,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43510 samples/s/p 1:33:45 } +2024-07-25 23:38:40,730 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1055/ 1625], loss: 1.000, per_step_time: 1471ms, lr: 5.616151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:40,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43784 samples/s/p 1:33:39 } +2024-07-25 23:38:43,684 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1057/ 1625], loss: 0.878, per_step_time: 1473ms, lr: 5.6115937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:43,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43019 samples/s/p 1:33:44 } +2024-07-25 23:38:46,635 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1059/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 5.607038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:46,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43592 samples/s/p 1:33:35 } +2024-07-25 23:38:49,585 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1061/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 5.602484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:49,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43581 samples/s/p 1:33:33 } +2024-07-25 23:38:52,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1063/ 1625], loss: 1.260, per_step_time: 1470ms, lr: 5.597932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:52,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.5% |██████████████████████████████████████ | 5.43981 samples/s/p 1:33:26 } +2024-07-25 23:38:55,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1065/ 1625], loss: 1.174, per_step_time: 1470ms, lr: 5.593383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:55,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.43990 samples/s/p 1:33:23 } +2024-07-25 23:38:58,437 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1067/ 1625], loss: 1.397, per_step_time: 1473ms, lr: 5.588834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:38:58,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.42870 samples/s/p 1:33:31 } +2024-07-25 23:39:01,395 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1069/ 1625], loss: 1.022, per_step_time: 1471ms, lr: 5.5842916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:01,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.43529 samples/s/p 1:33:21 } +2024-07-25 23:39:04,344 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1071/ 1625], loss: 1.253, per_step_time: 1470ms, lr: 5.5797436e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:04,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.43851 samples/s/p 1:33:15 } +2024-07-25 23:39:07,298 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1073/ 1625], loss: 1.202, per_step_time: 1473ms, lr: 5.575201e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:07,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.42978 samples/s/p 1:33:21 } +2024-07-25 23:39:10,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1075/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 5.570663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:10,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.43573 samples/s/p 1:33:12 } +2024-07-25 23:39:13,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1077/ 1625], loss: 1.080, per_step_time: 1470ms, lr: 5.566121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:13,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.43945 samples/s/p 1:33:05 } +2024-07-25 23:39:16,150 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1079/ 1625], loss: 1.103, per_step_time: 1473ms, lr: 5.5615847e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:16,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.6% |██████████████████████████████████████ | 5.42990 samples/s/p 1:33:12 } +2024-07-25 23:39:19,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1081/ 1625], loss: 1.262, per_step_time: 1470ms, lr: 5.5570517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:19,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43967 samples/s/p 1:32:59 } +2024-07-25 23:39:22,049 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1083/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 5.5525184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:22,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43479 samples/s/p 1:33:01 } +2024-07-25 23:39:24,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1085/ 1625], loss: 0.930, per_step_time: 1470ms, lr: 5.5479873e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:24,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.44184 samples/s/p 1:32:51 } +2024-07-25 23:39:27,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1087/ 1625], loss: 0.904, per_step_time: 1471ms, lr: 5.5434575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:27,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43686 samples/s/p 1:32:53 } +2024-07-25 23:39:30,896 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1089/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 5.5389296e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:30,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43765 samples/s/p 1:32:50 } +2024-07-25 23:39:33,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1091/ 1625], loss: 1.421, per_step_time: 1471ms, lr: 5.5344026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:33,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43658 samples/s/p 1:32:48 } +2024-07-25 23:39:36,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1093/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 5.5298788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:36,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43110 samples/s/p 1:32:50 } +2024-07-25 23:39:39,748 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1095/ 1625], loss: 1.285, per_step_time: 1471ms, lr: 5.5253563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:39,749 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.7% |██████████████████████████████████████ | 5.43666 samples/s/p 1:32:42 } +2024-07-25 23:39:42,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1097/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 5.520836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:42,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43681 samples/s/p 1:32:39 } +2024-07-25 23:39:45,649 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1099/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 5.516317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:45,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43389 samples/s/p 1:32:39 } +2024-07-25 23:39:48,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1101/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 5.5118003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:48,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43054 samples/s/p 1:32:39 } +2024-07-25 23:39:51,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1103/ 1625], loss: 1.177, per_step_time: 1474ms, lr: 5.507285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:51,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.42630 samples/s/p 1:32:41 } +2024-07-25 23:39:54,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1105/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 5.502772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:54,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43447 samples/s/p 1:32:29 } +2024-07-25 23:39:57,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1107/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 5.4982634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:39:57,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43255 samples/s/p 1:32:28 } +2024-07-25 23:40:00,413 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1109/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 5.493752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:00,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43296 samples/s/p 1:32:25 } +2024-07-25 23:40:03,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1111/ 1625], loss: 1.093, per_step_time: 1470ms, lr: 5.489244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:03,362 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43881 samples/s/p 1:32:16 } +2024-07-25 23:40:06,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1113/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 5.484741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:06,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.8% |██████████████████████████████████████ | 5.43305 samples/s/p 1:32:19 } +2024-07-25 23:40:09,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1115/ 1625], loss: 1.126, per_step_time: 1469ms, lr: 5.4802344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:09,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.44286 samples/s/p 1:32:06 } +2024-07-25 23:40:12,211 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1117/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 5.475732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:12,211 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43763 samples/s/p 1:32:08 } +2024-07-25 23:40:15,161 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1119/ 1625], loss: 1.333, per_step_time: 1471ms, lr: 5.471234e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:15,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43539 samples/s/p 1:32:08 } +2024-07-25 23:40:18,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1121/ 1625], loss: 0.987, per_step_time: 1472ms, lr: 5.466733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:18,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43237 samples/s/p 1:32:08 } +2024-07-25 23:40:21,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1123/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 5.4622396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:21,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43686 samples/s/p 1:32:00 } +2024-07-25 23:40:24,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1125/ 1625], loss: 1.212, per_step_time: 1470ms, lr: 5.4577445e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:24,013 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43991 samples/s/p 1:31:54 } +2024-07-25 23:40:26,961 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1127/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 5.4532497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:26,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43794 samples/s/p 1:31:53 } +2024-07-25 23:40:29,913 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1129/ 1625], loss: 1.071, per_step_time: 1472ms, lr: 5.4487605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:29,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 76.9% |██████████████████████████████████████ | 5.43274 samples/s/p 1:31:56 } +2024-07-25 23:40:32,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1131/ 1625], loss: 1.124, per_step_time: 1473ms, lr: 5.4442717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:32,867 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43088 samples/s/p 1:31:55 } +2024-07-25 23:40:35,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1133/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 5.439784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:35,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43266 samples/s/p 1:31:50 } +2024-07-25 23:40:38,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1135/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 5.4352986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:38,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43390 samples/s/p 1:31:46 } +2024-07-25 23:40:41,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1137/ 1625], loss: 1.360, per_step_time: 1470ms, lr: 5.430815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:41,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.44016 samples/s/p 1:31:36 } +2024-07-25 23:40:44,671 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1139/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 5.4263337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:44,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43097 samples/s/p 1:31:43 } +2024-07-25 23:40:47,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1141/ 1625], loss: 1.304, per_step_time: 1470ms, lr: 5.4218544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:47,620 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.44106 samples/s/p 1:31:30 } +2024-07-25 23:40:50,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1143/ 1625], loss: 1.033, per_step_time: 1471ms, lr: 5.4173765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:50,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43835 samples/s/p 1:31:29 } +2024-07-25 23:40:53,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1145/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 5.4129005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:53,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.0% |██████████████████████████████████████ | 5.43625 samples/s/p 1:31:29 } +2024-07-25 23:40:56,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1147/ 1625], loss: 1.098, per_step_time: 1476ms, lr: 5.4084253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:56,478 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.41894 samples/s/p 1:31:43 } +2024-07-25 23:40:59,429 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1149/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 5.4039533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:40:59,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43425 samples/s/p 1:31:25 } +2024-07-25 23:41:02,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1151/ 1625], loss: 1.111, per_step_time: 1473ms, lr: 5.3994845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:02,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43047 samples/s/p 1:31:26 } +2024-07-25 23:41:05,333 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1153/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 5.3950143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:05,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43581 samples/s/p 1:31:17 } +2024-07-25 23:41:08,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1155/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 5.390547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:08,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.42918 samples/s/p 1:31:21 } +2024-07-25 23:41:11,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1157/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 5.386085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:11,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43393 samples/s/p 1:31:13 } +2024-07-25 23:41:14,186 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1159/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 5.3816193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:14,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43956 samples/s/p 1:31:05 } +2024-07-25 23:41:17,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1161/ 1625], loss: 1.161, per_step_time: 1471ms, lr: 5.377158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:17,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.1% |██████████████████████████████████████ | 5.43840 samples/s/p 1:31:03 } +2024-07-25 23:41:20,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1163/ 1625], loss: 1.136, per_step_time: 1470ms, lr: 5.372701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:20,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43969 samples/s/p 1:30:59 } +2024-07-25 23:41:23,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1165/ 1625], loss: 1.183, per_step_time: 1472ms, lr: 5.368241e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:23,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43319 samples/s/p 1:31:02 } +2024-07-25 23:41:25,986 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1167/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 5.363788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:25,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43500 samples/s/p 1:30:57 } +2024-07-25 23:41:28,936 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1169/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 5.359334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:28,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43753 samples/s/p 1:30:52 } +2024-07-25 23:41:31,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1171/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 5.3548797e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:31,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43802 samples/s/p 1:30:49 } +2024-07-25 23:41:34,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1173/ 1625], loss: 1.267, per_step_time: 1472ms, lr: 5.350432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:34,838 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43159 samples/s/p 1:30:52 } +2024-07-25 23:41:37,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1175/ 1625], loss: 1.012, per_step_time: 1471ms, lr: 5.3459844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:37,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43639 samples/s/p 1:30:44 } +2024-07-25 23:41:40,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1177/ 1625], loss: 1.123, per_step_time: 1473ms, lr: 5.341535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:40,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.2% |██████████████████████████████████████ | 5.43064 samples/s/p 1:30:47 } +2024-07-25 23:41:43,691 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1179/ 1625], loss: 1.292, per_step_time: 1471ms, lr: 5.3370936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:43,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43663 samples/s/p 1:30:38 } +2024-07-25 23:41:46,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1181/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 5.3326517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:46,645 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43037 samples/s/p 1:30:41 } +2024-07-25 23:41:49,601 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1183/ 1625], loss: 1.112, per_step_time: 1474ms, lr: 5.328211e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:49,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.42457 samples/s/p 1:30:44 } +2024-07-25 23:41:52,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1185/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 5.323772e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:52,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43730 samples/s/p 1:30:29 } +2024-07-25 23:41:55,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1187/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 5.319335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:55,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43706 samples/s/p 1:30:26 } +2024-07-25 23:41:58,452 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1189/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 5.3149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:41:58,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43434 samples/s/p 1:30:26 } +2024-07-25 23:42:01,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1191/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 5.3104673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:01,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43164 samples/s/p 1:30:25 } +2024-07-25 23:42:04,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1193/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 5.306036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:04,357 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.3% |██████████████████████████████████████ | 5.43186 samples/s/p 1:30:22 } +2024-07-25 23:42:07,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1195/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 5.301609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:07,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43474 samples/s/p 1:30:17 } +2024-07-25 23:42:10,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1197/ 1625], loss: 1.234, per_step_time: 1470ms, lr: 5.2971795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:10,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43858 samples/s/p 1:30:10 } +2024-07-25 23:42:13,207 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1199/ 1625], loss: 1.058, per_step_time: 1471ms, lr: 5.2927535e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:13,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43769 samples/s/p 1:30:08 } +2024-07-25 23:42:16,156 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1201/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 5.288333e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:16,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43896 samples/s/p 1:30:03 } +2024-07-25 23:42:19,109 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1203/ 1625], loss: 1.358, per_step_time: 1473ms, lr: 5.2839086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:19,110 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43031 samples/s/p 1:30:09 } +2024-07-25 23:42:22,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1205/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 5.2794885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:22,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43553 samples/s/p 1:30:01 } +2024-07-25 23:42:25,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1207/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 5.275073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:25,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43488 samples/s/p 1:29:59 } +2024-07-25 23:42:27,961 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1209/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 5.270654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:27,962 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.4% |██████████████████████████████████████ | 5.43496 samples/s/p 1:29:56 } +2024-07-25 23:42:30,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1211/ 1625], loss: 0.974, per_step_time: 1474ms, lr: 5.266243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:30,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.42427 samples/s/p 1:30:03 } +2024-07-25 23:42:33,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1213/ 1625], loss: 1.045, per_step_time: 1471ms, lr: 5.2618298e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:33,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43654 samples/s/p 1:29:48 } +2024-07-25 23:42:36,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1215/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 5.257417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43547 samples/s/p 1:29:46 } +2024-07-25 23:42:39,769 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1217/ 1625], loss: 0.947, per_step_time: 1471ms, lr: 5.253011e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:39,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43505 samples/s/p 1:29:44 } +2024-07-25 23:42:42,721 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1219/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 5.248604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:42,722 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43226 samples/s/p 1:29:44 } +2024-07-25 23:42:45,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1221/ 1625], loss: 1.082, per_step_time: 1473ms, lr: 5.244197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:45,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.42751 samples/s/p 1:29:45 } +2024-07-25 23:42:48,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1223/ 1625], loss: 1.192, per_step_time: 1473ms, lr: 5.2397972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:48,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.43055 samples/s/p 1:29:39 } +2024-07-25 23:42:51,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1225/ 1625], loss: 1.260, per_step_time: 1473ms, lr: 5.2353953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:42:51,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.5% |██████████████████████████████████████ | 5.42919 samples/s/p 1:29:38 } +2024-07-25 23:42:51,585 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... 
+2024-07-25 23:43:27,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1227/ 1625], loss: 0.972, per_step_time: 1729ms, lr: 5.230997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:27,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 4.62628 samples/s/p 1:45:08 } +2024-07-25 23:43:30,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1229/ 1625], loss: 1.169, per_step_time: 1474ms, lr: 5.226599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:30,188 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.42726 samples/s/p 1:29:34 } +2024-07-25 23:43:33,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1231/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 5.222204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:33,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43645 samples/s/p 1:29:22 } +2024-07-25 23:43:36,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1233/ 1625], loss: 1.239, per_step_time: 1473ms, lr: 5.21781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:36,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.42840 samples/s/p 1:29:27 } +2024-07-25 23:43:39,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1235/ 1625], loss: 0.976, per_step_time: 1472ms, lr: 5.2134196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:39,044 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43346 samples/s/p 1:29:19 } +2024-07-25 23:43:41,997 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1237/ 1625], loss: 1.167, per_step_time: 1473ms, lr: 5.20903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:41,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43079 samples/s/p 1:29:19 } +2024-07-25 23:43:44,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1239/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 5.204644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:44,947 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43711 samples/s/p 1:29:09 } +2024-07-25 23:43:47,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1241/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 5.200256e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:47,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.43580 samples/s/p 1:29:08 } +2024-07-25 23:43:50,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1243/ 1625], loss: 1.210, per_step_time: 1473ms, lr: 5.1958723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:50,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.6% |██████████████████████████████████████ | 5.42945 samples/s/p 1:29:11 } +2024-07-25 23:43:53,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1245/ 1625], loss: 0.898, per_step_time: 1471ms, lr: 5.1914926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:53,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43682 samples/s/p 1:29:01 } +2024-07-25 23:43:56,751 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1247/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 5.1871107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:56,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43635 samples/s/p 1:28:58 } +2024-07-25 23:43:59,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1249/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 5.1827324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:43:59,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43548 samples/s/p 1:28:56 } +2024-07-25 23:44:02,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1251/ 1625], loss: 1.108, per_step_time: 1476ms, lr: 5.178358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:02,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.41904 samples/s/p 1:29:10 } +2024-07-25 23:44:05,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1253/ 1625], loss: 1.395, per_step_time: 1473ms, lr: 5.1739808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:05,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43030 samples/s/p 1:28:55 } +2024-07-25 23:44:08,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1255/ 1625], loss: 1.357, per_step_time: 1470ms, lr: 5.169611e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:08,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43868 samples/s/p 1:28:44 } +2024-07-25 23:44:11,515 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1257/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 5.1652405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:11,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43480 samples/s/p 1:28:45 } +2024-07-25 23:44:14,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1259/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 5.1608695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:14,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.7% |██████████████████████████████████████ | 5.43972 samples/s/p 1:28:37 } +2024-07-25 23:44:17,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1261/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 5.1565053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:17,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43498 samples/s/p 1:28:39 } +2024-07-25 23:44:20,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1263/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 5.1521397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:20,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43562 samples/s/p 1:28:36 } +2024-07-25 23:44:23,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1265/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 5.147777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:23,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.44059 samples/s/p 1:28:28 } +2024-07-25 23:44:26,266 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1267/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 5.143416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:26,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.42864 samples/s/p 1:28:36 } +2024-07-25 23:44:29,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1269/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 5.1390575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:29,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.44071 samples/s/p 1:28:22 } +2024-07-25 23:44:32,164 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1271/ 1625], loss: 1.202, per_step_time: 1471ms, lr: 5.1346997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:32,164 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43716 samples/s/p 1:28:22 } +2024-07-25 23:44:35,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1273/ 1625], loss: 1.114, per_step_time: 1471ms, lr: 5.1303446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:35,115 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43537 samples/s/p 1:28:21 } +2024-07-25 23:44:38,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1275/ 1625], loss: 1.031, per_step_time: 1471ms, lr: 5.1259904e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:38,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.8% |██████████████████████████████████████ | 5.43689 samples/s/p 1:28:17 } +2024-07-25 23:44:41,019 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1277/ 1625], loss: 1.221, per_step_time: 1473ms, lr: 5.12164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:41,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.42805 samples/s/p 1:28:22 } +2024-07-25 23:44:43,970 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1279/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 5.1172897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:43,970 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.43389 samples/s/p 1:28:14 } +2024-07-25 23:44:46,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1281/ 1625], loss: 1.144, per_step_time: 1472ms, lr: 5.1129427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:46,924 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.43129 samples/s/p 1:28:13 } +2024-07-25 23:44:49,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1283/ 1625], loss: 0.895, per_step_time: 1470ms, lr: 5.108599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:49,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.43858 samples/s/p 1:28:03 } +2024-07-25 23:44:52,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1285/ 1625], loss: 1.070, per_step_time: 1470ms, lr: 5.1042534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:53,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.43922 samples/s/p 1:28:00 } +2024-07-25 23:44:56,468 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1287/ 1625], loss: 1.298, per_step_time: 1475ms, lr: 5.099911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:56,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.42368 samples/s/p 1:28:12 } +2024-07-25 23:44:59,420 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1289/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 5.095573e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:44:59,420 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.43288 samples/s/p 1:28:00 } +2024-07-25 23:45:02,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1291/ 1625], loss: 1.193, per_step_time: 1475ms, lr: 5.091233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:02,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 77.9% |██████████████████████████████████████ | 5.42094 samples/s/p 1:28:09 } +2024-07-25 23:45:05,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1293/ 1625], loss: 1.193, per_step_time: 1473ms, lr: 5.086899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:05,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.43100 samples/s/p 1:27:56 } +2024-07-25 23:45:08,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1295/ 1625], loss: 1.069, per_step_time: 1470ms, lr: 5.082565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:08,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.44056 samples/s/p 1:27:44 } +2024-07-25 23:45:11,232 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1297/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 5.07823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:11,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.43268 samples/s/p 1:27:48 } +2024-07-25 23:45:14,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1299/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 5.073902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:14,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |██████████████████████████████████████ | 5.43204 samples/s/p 1:27:46 } +2024-07-25 23:45:17,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1301/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 5.0695744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:17,141 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.43381 samples/s/p 1:27:41 } +2024-07-25 23:45:20,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1303/ 1625], loss: 1.122, per_step_time: 1475ms, lr: 5.0652447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:20,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.42208 samples/s/p 1:27:50 } +2024-07-25 23:45:23,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1305/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 5.0609233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:23,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.43769 samples/s/p 1:27:32 } +2024-07-25 23:45:26,000 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1307/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 5.0566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:26,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.0% |███████████████████████████████████████ | 5.43646 samples/s/p 1:27:30 } +2024-07-25 23:45:28,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1309/ 1625], loss: 1.139, per_step_time: 1473ms, lr: 5.05228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:28,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.42787 samples/s/p 1:27:35 } +2024-07-25 23:45:31,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1311/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 5.0479603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:31,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43438 samples/s/p 1:27:26 } +2024-07-25 23:45:34,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1313/ 1625], loss: 1.139, per_step_time: 1473ms, lr: 5.043644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:34,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43071 samples/s/p 1:27:27 } +2024-07-25 23:45:37,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1315/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 5.0393287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:37,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43270 samples/s/p 1:27:22 } +2024-07-25 23:45:40,770 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1317/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 5.035016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:40,770 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43146 samples/s/p 1:27:20 } +2024-07-25 23:45:43,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1319/ 1625], loss: 1.213, per_step_time: 1473ms, lr: 5.030705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:43,725 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.42854 samples/s/p 1:27:20 } +2024-07-25 23:45:46,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1321/ 1625], loss: 1.253, per_step_time: 1473ms, lr: 5.0263957e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:46,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.42985 samples/s/p 1:27:16 } +2024-07-25 23:45:49,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1323/ 1625], loss: 1.191, per_step_time: 1470ms, lr: 5.0220883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:49,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.1% |███████████████████████████████████████ | 5.43973 samples/s/p 1:27:03 } +2024-07-25 23:45:52,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1325/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 5.017783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:52,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.43177 samples/s/p 1:27:08 } +2024-07-25 23:45:55,534 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1327/ 1625], loss: 1.387, per_step_time: 1473ms, lr: 5.01348e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:55,534 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.42827 samples/s/p 1:27:08 } +2024-07-25 23:45:58,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1329/ 1625], loss: 1.257, per_step_time: 1474ms, lr: 5.0091776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:45:58,490 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.42652 samples/s/p 1:27:07 } +2024-07-25 23:46:01,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1331/ 1625], loss: 1.132, per_step_time: 1474ms, lr: 5.004879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:01,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.42683 samples/s/p 1:27:04 } +2024-07-25 23:46:04,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1333/ 1625], loss: 1.069, per_step_time: 1473ms, lr: 5.000584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:04,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.42852 samples/s/p 1:26:59 } +2024-07-25 23:46:07,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1335/ 1625], loss: 1.113, per_step_time: 1473ms, lr: 4.9962855e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:07,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.42963 samples/s/p 1:26:55 } +2024-07-25 23:46:10,304 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1337/ 1625], loss: 1.065, per_step_time: 1472ms, lr: 4.9919945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:10,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.43444 samples/s/p 1:26:48 } +2024-07-25 23:46:13,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1339/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 4.9877026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:13,256 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.2% |███████████████████████████████████████ | 5.43401 samples/s/p 1:26:45 } +2024-07-25 23:46:16,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1341/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 4.9834107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:16,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43603 samples/s/p 1:26:40 } +2024-07-25 23:46:19,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1343/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 4.9791247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:19,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.42964 samples/s/p 1:26:44 } +2024-07-25 23:46:22,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1345/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 4.9748396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:22,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43506 samples/s/p 1:26:35 } +2024-07-25 23:46:25,061 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1347/ 1625], loss: 1.192, per_step_time: 1471ms, lr: 4.9705527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:25,061 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43536 samples/s/p 1:26:32 } +2024-07-25 23:46:28,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1349/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 4.966273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:28,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43222 samples/s/p 1:26:32 } +2024-07-25 23:46:30,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1351/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 4.961993e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:30,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43296 samples/s/p 1:26:29 } +2024-07-25 23:46:33,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1353/ 1625], loss: 1.288, per_step_time: 1470ms, lr: 4.957715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:33,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43902 samples/s/p 1:26:20 } +2024-07-25 23:46:36,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1355/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 4.9534397e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:36,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.3% |███████████████████████████████████████ | 5.43722 samples/s/p 1:26:19 } +2024-07-25 23:46:39,818 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1357/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 4.949165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:39,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43027 samples/s/p 1:26:22 } +2024-07-25 23:46:42,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1359/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 4.9448927e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:42,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.44049 samples/s/p 1:26:10 } +2024-07-25 23:46:45,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1361/ 1625], loss: 1.297, per_step_time: 1471ms, lr: 4.9406226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:45,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43684 samples/s/p 1:26:10 } +2024-07-25 23:46:48,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1363/ 1625], loss: 1.276, per_step_time: 1471ms, lr: 4.936354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:48,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43525 samples/s/p 1:26:09 } +2024-07-25 23:46:51,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1365/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 4.932088e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:51,617 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43783 samples/s/p 1:26:03 } +2024-07-25 23:46:54,569 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1367/ 1625], loss: 1.256, per_step_time: 1472ms, lr: 4.9278233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:54,569 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43312 samples/s/p 1:26:05 } +2024-07-25 23:46:57,519 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1369/ 1625], loss: 1.018, per_step_time: 1471ms, lr: 4.92356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:46:57,520 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43499 samples/s/p 1:26:00 } +2024-07-25 23:47:00,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1371/ 1625], loss: 1.051, per_step_time: 1473ms, lr: 4.919299e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:00,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.43088 samples/s/p 1:26:01 } +2024-07-25 23:47:03,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1373/ 1625], loss: 1.125, per_step_time: 1483ms, lr: 4.915041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:03,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.4% |███████████████████████████████████████ | 5.39200 samples/s/p 1:26:35 } +2024-07-25 23:47:06,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1375/ 1625], loss: 1.255, per_step_time: 1470ms, lr: 4.9107844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:06,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43930 samples/s/p 1:25:47 } +2024-07-25 23:47:09,348 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1377/ 1625], loss: 1.025, per_step_time: 1473ms, lr: 4.9065297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:09,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43075 samples/s/p 1:25:52 } +2024-07-25 23:47:12,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1379/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 4.9022765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:12,300 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43259 samples/s/p 1:25:48 } +2024-07-25 23:47:15,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1381/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 4.8980287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:15,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43720 samples/s/p 1:25:40 } +2024-07-25 23:47:18,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1383/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 4.8937773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:18,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43513 samples/s/p 1:25:39 } +2024-07-25 23:47:21,153 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1385/ 1625], loss: 1.080, per_step_time: 1472ms, lr: 4.8895304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:21,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43309 samples/s/p 1:25:38 } +2024-07-25 23:47:24,106 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1387/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 4.8852876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:24,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43268 samples/s/p 1:25:36 } +2024-07-25 23:47:27,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1389/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 4.881045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:27,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.5% |███████████████████████████████████████ | 5.43561 samples/s/p 1:25:30 } +2024-07-25 23:47:30,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1391/ 1625], loss: 1.335, per_step_time: 1473ms, lr: 4.8768015e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:30,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43086 samples/s/p 1:25:32 } +2024-07-25 23:47:32,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1393/ 1625], loss: 1.173, per_step_time: 1473ms, lr: 4.8725647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:32,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.42964 samples/s/p 1:25:30 } +2024-07-25 23:47:35,911 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1395/ 1625], loss: 1.056, per_step_time: 1469ms, lr: 4.8683273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:35,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.44268 samples/s/p 1:25:15 } +2024-07-25 23:47:38,859 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1397/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 4.8640923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:38,860 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43919 samples/s/p 1:25:15 } +2024-07-25 23:47:41,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1399/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 4.85986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:41,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43128 samples/s/p 1:25:19 } +2024-07-25 23:47:44,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1401/ 1625], loss: 1.302, per_step_time: 1473ms, lr: 4.8556276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:44,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43038 samples/s/p 1:25:17 } +2024-07-25 23:47:47,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1403/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 4.851399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:47,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43289 samples/s/p 1:25:12 } +2024-07-25 23:47:50,669 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1405/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 4.8471716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:50,669 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.6% |███████████████████████████████████████ | 5.43364 samples/s/p 1:25:08 } +2024-07-25 23:47:53,621 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1407/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 4.8429465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:53,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43270 samples/s/p 1:25:06 } +2024-07-25 23:47:56,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1409/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 4.8387237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:56,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43722 samples/s/p 1:24:59 } +2024-07-25 23:47:59,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1411/ 1625], loss: 1.067, per_step_time: 1471ms, lr: 4.8345014e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:47:59,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43665 samples/s/p 1:24:57 } +2024-07-25 23:48:02,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1413/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 4.8302823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:02,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43446 samples/s/p 1:24:56 } +2024-07-25 23:48:05,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1415/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 4.8260645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:05,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43740 samples/s/p 1:24:50 } +2024-07-25 23:48:08,373 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1417/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 4.8218494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:08,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43332 samples/s/p 1:24:51 } +2024-07-25 23:48:11,323 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1419/ 1625], loss: 1.362, per_step_time: 1471ms, lr: 4.817638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:11,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43592 samples/s/p 1:24:46 } +2024-07-25 23:48:14,273 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1421/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 4.8134248e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:14,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.7% |███████████████████████████████████████ | 5.43699 samples/s/p 1:24:42 } +2024-07-25 23:48:17,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1423/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 4.809215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:17,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43589 samples/s/p 1:24:40 } +2024-07-25 23:48:20,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1425/ 1625], loss: 0.984, per_step_time: 1472ms, lr: 4.8050097e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:20,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43365 samples/s/p 1:24:39 } +2024-07-25 23:48:23,124 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1427/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 4.8008023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:23,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43674 samples/s/p 1:24:33 } +2024-07-25 23:48:26,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1429/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 4.796598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:26,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43298 samples/s/p 1:24:34 } +2024-07-25 23:48:29,024 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1431/ 1625], loss: 0.991, per_step_time: 1470ms, lr: 4.792399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:29,024 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.44072 samples/s/p 1:24:24 } +2024-07-25 23:48:31,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1433/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 4.7881967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:31,976 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43525 samples/s/p 1:24:26 } +2024-07-25 23:48:34,926 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1435/ 1625], loss: 1.359, per_step_time: 1471ms, lr: 4.7840017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:34,926 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43536 samples/s/p 1:24:23 } +2024-07-25 23:48:37,876 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1437/ 1625], loss: 1.185, per_step_time: 1471ms, lr: 4.7798057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:37,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.8% |███████████████████████████████████████ | 5.43682 samples/s/p 1:24:18 } +2024-07-25 23:48:40,829 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1439/ 1625], loss: 0.954, per_step_time: 1473ms, lr: 4.775612e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:40,830 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43072 samples/s/p 1:24:21 } +2024-07-25 23:48:43,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1441/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 4.7714207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:43,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43122 samples/s/p 1:24:18 } +2024-07-25 23:48:46,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1443/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 4.7672306e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:46,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43116 samples/s/p 1:24:15 } +2024-07-25 23:48:49,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1445/ 1625], loss: 1.288, per_step_time: 1474ms, lr: 4.7630424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:49,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.42679 samples/s/p 1:24:16 } +2024-07-25 23:48:52,640 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1447/ 1625], loss: 1.345, per_step_time: 1471ms, lr: 4.758857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:52,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43779 samples/s/p 1:24:03 } +2024-07-25 23:48:55,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1449/ 1625], loss: 1.120, per_step_time: 1473ms, lr: 4.7546737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:55,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43020 samples/s/p 1:24:07 } +2024-07-25 23:48:58,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1451/ 1625], loss: 1.057, per_step_time: 1473ms, lr: 4.7504914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:48:58,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.43093 samples/s/p 1:24:03 } +2024-07-25 23:49:01,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1453/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 4.746311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:01,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 78.9% |███████████████████████████████████████ | 5.42909 samples/s/p 1:24:02 } +2024-07-25 23:49:04,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1455/ 1625], loss: 0.988, per_step_time: 1470ms, lr: 4.742134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:04,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.43908 samples/s/p 1:23:50 } +2024-07-25 23:49:07,402 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1457/ 1625], loss: 1.376, per_step_time: 1472ms, lr: 4.737958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:07,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.43455 samples/s/p 1:23:51 } +2024-07-25 23:49:10,357 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1459/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 4.7337835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:10,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.43754 samples/s/p 1:23:45 } +2024-07-25 23:49:13,309 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1461/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 4.7296116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:13,309 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.43441 samples/s/p 1:23:45 } +2024-07-25 23:49:16,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1463/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 4.7254443e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:16,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.43958 samples/s/p 1:23:38 } +2024-07-25 23:49:19,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1465/ 1625], loss: 1.030, per_step_time: 1470ms, lr: 4.721274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:19,205 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.44032 samples/s/p 1:23:34 } +2024-07-25 23:49:22,151 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1467/ 1625], loss: 1.141, per_step_time: 1469ms, lr: 4.7171084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:22,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.44364 samples/s/p 1:23:28 } +2024-07-25 23:49:25,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1469/ 1625], loss: 1.019, per_step_time: 1469ms, lr: 4.712947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:25,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.0% |███████████████████████████████████████ | 5.44304 samples/s/p 1:23:26 } +2024-07-25 23:49:28,047 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1471/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 4.708782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:28,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43694 samples/s/p 1:23:28 } +2024-07-25 23:49:31,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1473/ 1625], loss: 1.039, per_step_time: 1475ms, lr: 4.7046224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:31,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.42328 samples/s/p 1:23:38 } +2024-07-25 23:49:33,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1475/ 1625], loss: 1.179, per_step_time: 1474ms, lr: 4.700467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:33,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.42722 samples/s/p 1:23:31 } +2024-07-25 23:49:36,912 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1477/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 4.6963078e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:36,912 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43395 samples/s/p 1:23:22 } +2024-07-25 23:49:39,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1479/ 1625], loss: 1.274, per_step_time: 1471ms, lr: 4.692157e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:39,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43743 samples/s/p 1:23:16 } +2024-07-25 23:49:42,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1481/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 4.688005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:42,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43179 samples/s/p 1:23:18 } +2024-07-25 23:49:45,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1483/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 4.6838522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:45,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43666 samples/s/p 1:23:11 } +2024-07-25 23:49:48,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1485/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 4.6797063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:48,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.1% |███████████████████████████████████████ | 5.43198 samples/s/p 1:23:12 } +2024-07-25 23:49:51,670 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1487/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 4.6755604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:51,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.42872 samples/s/p 1:23:12 } +2024-07-25 23:49:54,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1489/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 4.6714163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:54,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43384 samples/s/p 1:23:05 } +2024-07-25 23:49:57,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1491/ 1625], loss: 1.251, per_step_time: 1473ms, lr: 4.667274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:49:57,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43100 samples/s/p 1:23:04 } +2024-07-25 23:50:00,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1493/ 1625], loss: 1.224, per_step_time: 1471ms, lr: 4.663134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:00,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43844 samples/s/p 1:22:54 } +2024-07-25 23:50:03,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1495/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 4.6589967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:03,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43573 samples/s/p 1:22:54 } +2024-07-25 23:50:06,426 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1497/ 1625], loss: 1.164, per_step_time: 1471ms, lr: 4.6548603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:06,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43543 samples/s/p 1:22:51 } +2024-07-25 23:50:09,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1499/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 4.6507257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:09,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43721 samples/s/p 1:22:47 } +2024-07-25 23:50:12,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1501/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 4.6465934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:12,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43166 samples/s/p 1:22:49 } +2024-07-25 23:50:15,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1503/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 4.6424643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:15,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.2% |███████████████████████████████████████ | 5.43460 samples/s/p 1:22:43 } +2024-07-25 23:50:18,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1505/ 1625], loss: 1.027, per_step_time: 1472ms, lr: 4.6383366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:18,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43216 samples/s/p 1:22:43 } +2024-07-25 23:50:21,185 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1507/ 1625], loss: 1.265, per_step_time: 1473ms, lr: 4.634212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:21,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43079 samples/s/p 1:22:41 } +2024-07-25 23:50:24,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1509/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 4.630086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:24,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43597 samples/s/p 1:22:33 } +2024-07-25 23:50:27,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1511/ 1625], loss: 1.060, per_step_time: 1471ms, lr: 4.6259643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:27,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43555 samples/s/p 1:22:31 } +2024-07-25 23:50:30,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1513/ 1625], loss: 1.123, per_step_time: 1482ms, lr: 4.621846e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:30,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.39636 samples/s/p 1:23:04 } +2024-07-25 23:50:33,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1515/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 4.617726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:33,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43986 samples/s/p 1:22:21 } +2024-07-25 23:50:35,959 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1517/ 1625], loss: 1.159, per_step_time: 1473ms, lr: 4.6136106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:35,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.42961 samples/s/p 1:22:27 } +2024-07-25 23:50:38,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1519/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 4.6094983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:38,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.3% |███████████████████████████████████████ | 5.43812 samples/s/p 1:22:17 } +2024-07-25 23:50:41,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1521/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 4.6053838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:41,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.44041 samples/s/p 1:22:11 } +2024-07-25 23:50:44,809 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1523/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 4.6012765e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:44,809 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43088 samples/s/p 1:22:17 } +2024-07-25 23:50:47,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1525/ 1625], loss: 1.379, per_step_time: 1472ms, lr: 4.5971688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:47,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43147 samples/s/p 1:22:14 } +2024-07-25 23:50:50,713 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1527/ 1625], loss: 1.326, per_step_time: 1472ms, lr: 4.593061e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:50,713 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43338 samples/s/p 1:22:09 } +2024-07-25 23:50:53,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1529/ 1625], loss: 1.167, per_step_time: 1471ms, lr: 4.588959e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:53,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43845 samples/s/p 1:22:01 } +2024-07-25 23:50:56,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1531/ 1625], loss: 1.281, per_step_time: 1474ms, lr: 4.5848574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:56,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.42430 samples/s/p 1:22:11 } +2024-07-25 23:50:59,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1533/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 4.5807546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:50:59,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43841 samples/s/p 1:21:56 } +2024-07-25 23:51:02,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1535/ 1625], loss: 1.014, per_step_time: 1471ms, lr: 4.5766587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:02,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.4% |███████████████████████████████████████ | 5.43663 samples/s/p 1:21:54 } +2024-07-25 23:51:05,469 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1537/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 4.5725637e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:05,469 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43371 samples/s/p 1:21:54 } +2024-07-25 23:51:08,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1539/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 4.568469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:08,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43717 samples/s/p 1:21:48 } +2024-07-25 23:51:11,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1541/ 1625], loss: 1.297, per_step_time: 1470ms, lr: 4.5643774e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:11,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43927 samples/s/p 1:21:43 } +2024-07-25 23:51:14,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1543/ 1625], loss: 0.955, per_step_time: 1471ms, lr: 4.560288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:14,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43686 samples/s/p 1:21:42 } +2024-07-25 23:51:17,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1545/ 1625], loss: 1.237, per_step_time: 1473ms, lr: 4.5561997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:17,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.42768 samples/s/p 1:21:48 } +2024-07-25 23:51:20,222 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1547/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 4.5521147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:20,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43402 samples/s/p 1:21:39 } +2024-07-25 23:51:23,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1549/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 4.548031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:23,172 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43830 samples/s/p 1:21:32 } +2024-07-25 23:51:26,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1551/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 4.5439515e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:26,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.5% |███████████████████████████████████████ | 5.43609 samples/s/p 1:21:31 } +2024-07-25 23:51:29,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1553/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 4.5398697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:29,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43381 samples/s/p 1:21:30 } +2024-07-25 23:51:32,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1555/ 1625], loss: 0.990, per_step_time: 1471ms, lr: 4.535792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:32,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43540 samples/s/p 1:21:26 } +2024-07-25 23:51:34,976 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1557/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 4.531719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:34,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43344 samples/s/p 1:21:25 } +2024-07-25 23:51:37,923 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1559/ 1625], loss: 1.250, per_step_time: 1469ms, lr: 4.527643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:37,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.44383 samples/s/p 1:21:13 } +2024-07-25 23:51:40,872 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1561/ 1625], loss: 1.327, per_step_time: 1471ms, lr: 4.523571e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:40,872 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43836 samples/s/p 1:21:14 } +2024-07-25 23:51:43,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1563/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 4.519503e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:43,824 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43210 samples/s/p 1:21:17 } +2024-07-25 23:51:46,778 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1565/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 4.5154343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:46,778 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.42902 samples/s/p 1:21:17 } +2024-07-25 23:51:49,728 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1567/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 4.51137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:49,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.6% |███████████████████████████████████████ | 5.43716 samples/s/p 1:21:07 } +2024-07-25 23:51:52,674 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1569/ 1625], loss: 1.290, per_step_time: 1469ms, lr: 4.5073075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:52,675 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.44257 samples/s/p 1:20:59 } +2024-07-25 23:51:55,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1571/ 1625], loss: 0.994, per_step_time: 1470ms, lr: 4.503243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:55,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.43890 samples/s/p 1:20:59 } +2024-07-25 23:51:58,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1573/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 4.4991866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:51:58,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.43257 samples/s/p 1:21:02 } +2024-07-25 23:52:01,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1575/ 1625], loss: 1.148, per_step_time: 1470ms, lr: 4.495129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:01,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.44109 samples/s/p 1:20:51 } +2024-07-25 23:52:04,474 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1577/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 4.491073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:04,474 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.43482 samples/s/p 1:20:54 } +2024-07-25 23:52:07,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1579/ 1625], loss: 1.230, per_step_time: 1470ms, lr: 4.4870203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:07,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.43993 samples/s/p 1:20:47 } +2024-07-25 23:52:10,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1581/ 1625], loss: 1.312, per_step_time: 1471ms, lr: 4.482969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:10,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.43561 samples/s/p 1:20:48 } +2024-07-25 23:52:13,327 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1583/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 4.47892e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:13,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.7% |███████████████████████████████████████ | 5.42945 samples/s/p 1:20:50 } +2024-07-25 23:52:16,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1585/ 1625], loss: 1.316, per_step_time: 1471ms, lr: 4.474872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:16,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43575 samples/s/p 1:20:42 } +2024-07-25 23:52:19,229 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1587/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 4.4708277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:19,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43318 samples/s/p 1:20:41 } +2024-07-25 23:52:22,185 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1589/ 1625], loss: 1.270, per_step_time: 1474ms, lr: 4.4667863e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:22,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.42504 samples/s/p 1:20:45 } +2024-07-25 23:52:25,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1591/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 4.4627423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:25,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43326 samples/s/p 1:20:35 } +2024-07-25 23:52:28,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1593/ 1625], loss: 1.184, per_step_time: 1473ms, lr: 4.4587036e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:28,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.42953 samples/s/p 1:20:35 } +2024-07-25 23:52:31,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1595/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 4.454668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:31,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43273 samples/s/p 1:20:29 } +2024-07-25 23:52:33,992 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1597/ 1625], loss: 1.201, per_step_time: 1471ms, lr: 4.4506323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:33,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43752 samples/s/p 1:20:22 } +2024-07-25 23:52:36,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1599/ 1625], loss: 1.094, per_step_time: 1472ms, lr: 4.4465987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:36,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.8% |███████████████████████████████████████ | 5.43289 samples/s/p 1:20:23 } +2024-07-25 23:52:39,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1601/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 4.4425697e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:39,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43062 samples/s/p 1:20:23 } +2024-07-25 23:52:42,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1603/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 4.4385383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:42,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.42850 samples/s/p 1:20:21 } +2024-07-25 23:52:45,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1605/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 4.4345143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:45,803 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43356 samples/s/p 1:20:14 } +2024-07-25 23:52:48,751 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1607/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 4.4304898e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:48,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43969 samples/s/p 1:20:06 } +2024-07-25 23:52:51,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1609/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 4.426465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:51,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43473 samples/s/p 1:20:07 } +2024-07-25 23:52:54,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1611/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 4.4224466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:54,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43317 samples/s/p 1:20:06 } +2024-07-25 23:52:57,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1613/ 1625], loss: 1.323, per_step_time: 1471ms, lr: 4.418427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:52:57,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43681 samples/s/p 1:19:59 } +2024-07-25 23:53:00,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1615/ 1625], loss: 1.067, per_step_time: 1470ms, lr: 4.414409e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:00,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 79.9% |███████████████████████████████████████ | 5.43895 samples/s/p 1:19:55 } +2024-07-25 23:53:03,504 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1617/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 4.4103963e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:03,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.43194 samples/s/p 1:19:58 } +2024-07-25 23:53:06,453 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1619/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 4.4063836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:06,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.43807 samples/s/p 1:19:49 } +2024-07-25 23:53:09,404 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1621/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 4.402373e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:09,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.43515 samples/s/p 1:19:49 } +2024-07-25 23:53:12,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1623/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 4.3983646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:12,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |███████████████████████████████████████ | 5.43282 samples/s/p 1:19:48 } +2024-07-25 23:53:15,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 8/ 10], step:[ 1625/ 1625], loss: 1.001, per_step_time: 1472ms, lr: 4.394358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:15,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.43348 samples/s/p 1:19:45 } +2024-07-25 23:53:18,262 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 2/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 4.3903538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:18,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.42925 samples/s/p 1:19:45 } +2024-07-25 23:53:21,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 4/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 4.3863524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:21,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.43232 samples/s/p 1:19:40 } +2024-07-25 23:53:24,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 6/ 1625], loss: 1.149, per_step_time: 1474ms, lr: 4.3823516e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:24,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.42513 samples/s/p 1:19:43 } +2024-07-25 23:53:27,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 8/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 4.3783525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:27,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.0% |████████████████████████████████████████ | 5.43486 samples/s/p 1:19:32 } +2024-07-25 23:53:30,070 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 10/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 4.374357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:30,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43837 samples/s/p 1:19:26 } +2024-07-25 23:53:33,021 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 12/ 1625], loss: 1.269, per_step_time: 1471ms, lr: 4.3703635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:33,022 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43494 samples/s/p 1:19:26 } +2024-07-25 23:53:35,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 14/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 4.366374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:35,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43604 samples/s/p 1:19:22 } +2024-07-25 23:53:38,924 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 16/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 4.362382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:38,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43137 samples/s/p 1:19:23 } +2024-07-25 23:53:41,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 18/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 4.358393e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:41,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43747 samples/s/p 1:19:15 } +2024-07-25 23:53:44,825 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 20/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 4.35441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:44,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.43423 samples/s/p 1:19:15 } +2024-07-25 23:53:47,782 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 22/ 1625], loss: 1.292, per_step_time: 1475ms, lr: 4.350423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:47,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.42303 samples/s/p 1:19:21 } +2024-07-25 23:53:50,737 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 24/ 1625], loss: 1.074, per_step_time: 1473ms, lr: 4.3464447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:50,738 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.1% |████████████████████████████████████████ | 5.42880 samples/s/p 1:19:13 } +2024-07-25 23:53:53,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 26/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 4.342464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:53,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43535 samples/s/p 1:19:05 } +2024-07-25 23:53:56,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 28/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 4.338484e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:56,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43836 samples/s/p 1:18:59 } +2024-07-25 23:53:59,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 30/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 4.334511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:53:59,587 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43691 samples/s/p 1:18:57 } +2024-07-25 23:54:02,533 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 32/ 1625], loss: 1.037, per_step_time: 1469ms, lr: 4.330538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:02,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.44286 samples/s/p 1:18:49 } +2024-07-25 23:54:05,483 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 34/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 4.326564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:05,484 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43540 samples/s/p 1:18:53 } +2024-07-25 23:54:08,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 36/ 1625], loss: 1.078, per_step_time: 1474ms, lr: 4.3225964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:08,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.42613 samples/s/p 1:18:58 } +2024-07-25 23:54:11,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 38/ 1625], loss: 1.167, per_step_time: 1474ms, lr: 4.318629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:11,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.42656 samples/s/p 1:18:55 } +2024-07-25 23:54:14,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 40/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 4.3146647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:14,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.2% |████████████████████████████████████████ | 5.43562 samples/s/p 1:18:44 } +2024-07-25 23:54:17,294 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 42/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 4.310701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:17,294 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43842 samples/s/p 1:18:39 } +2024-07-25 23:54:20,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 44/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 4.3067403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:20,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43498 samples/s/p 1:18:39 } +2024-07-25 23:54:23,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 46/ 1625], loss: 1.282, per_step_time: 1474ms, lr: 4.3027812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:23,200 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.42730 samples/s/p 1:18:42 } +2024-07-25 23:54:26,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 48/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 4.2988236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:26,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43480 samples/s/p 1:18:33 } +2024-07-25 23:54:29,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 50/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 4.2948686e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:29,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43244 samples/s/p 1:18:32 } +2024-07-25 23:54:32,051 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 52/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 4.2909155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:32,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43887 samples/s/p 1:18:23 } +2024-07-25 23:54:34,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 54/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 4.286965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:34,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.44118 samples/s/p 1:18:18 } +2024-07-25 23:54:37,950 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 56/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 4.283017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:37,950 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.3% |████████████████████████████████████████ | 5.43395 samples/s/p 1:18:22 } +2024-07-25 23:54:40,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 58/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 4.2790707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:40,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43352 samples/s/p 1:18:19 } +2024-07-25 23:54:43,853 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 60/ 1625], loss: 1.024, per_step_time: 1472ms, lr: 4.2751253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:43,854 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43301 samples/s/p 1:18:17 } +2024-07-25 23:54:46,802 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 62/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 4.2711836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:46,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43928 samples/s/p 1:18:08 } +2024-07-25 23:54:49,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 64/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 4.267245e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:49,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43966 samples/s/p 1:18:05 } +2024-07-25 23:54:52,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 66/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 4.263304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:52,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43274 samples/s/p 1:18:08 } +2024-07-25 23:54:55,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 68/ 1625], loss: 1.264, per_step_time: 1472ms, lr: 4.2593706e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:55,655 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43166 samples/s/p 1:18:06 } +2024-07-25 23:54:58,608 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 70/ 1625], loss: 1.109, per_step_time: 1473ms, lr: 4.2554357e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:54:58,608 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43051 samples/s/p 1:18:04 } +2024-07-25 23:55:01,559 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 72/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 4.2515017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:01,560 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.4% |████████████████████████████████████████ | 5.43320 samples/s/p 1:17:59 } +2024-07-25 23:55:04,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 74/ 1625], loss: 1.050, per_step_time: 1470ms, lr: 4.2475735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:04,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43856 samples/s/p 1:17:51 } +2024-07-25 23:55:07,458 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 76/ 1625], loss: 1.153, per_step_time: 1470ms, lr: 4.2436454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:07,458 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43994 samples/s/p 1:17:47 } +2024-07-25 23:55:10,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 78/ 1625], loss: 1.068, per_step_time: 1471ms, lr: 4.2397182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:10,407 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43844 samples/s/p 1:17:46 } +2024-07-25 23:55:13,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 80/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 4.235796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:13,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43456 samples/s/p 1:17:46 } +2024-07-25 23:55:16,307 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 82/ 1625], loss: 1.076, per_step_time: 1471ms, lr: 4.231874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:16,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.43796 samples/s/p 1:17:40 } +2024-07-25 23:55:19,261 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 84/ 1625], loss: 1.051, per_step_time: 1473ms, lr: 4.2279544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:19,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.42752 samples/s/p 1:17:46 } +2024-07-25 23:55:22,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 86/ 1625], loss: 1.093, per_step_time: 1478ms, lr: 4.2240367e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:22,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.41248 samples/s/p 1:17:56 } +2024-07-25 23:55:25,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 88/ 1625], loss: 1.113, per_step_time: 1473ms, lr: 4.220122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:25,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.5% |████████████████████████████████████████ | 5.42953 samples/s/p 1:17:38 } +2024-07-25 23:55:28,131 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 90/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 4.2162083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:28,131 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43199 samples/s/p 1:17:33 } +2024-07-25 23:55:31,084 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 92/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 4.2122965e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:31,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43122 samples/s/p 1:17:31 } +2024-07-25 23:55:34,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 94/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 4.2083875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:34,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43530 samples/s/p 1:17:25 } +2024-07-25 23:55:36,985 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 96/ 1625], loss: 1.158, per_step_time: 1471ms, lr: 4.2044812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:36,986 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43542 samples/s/p 1:17:22 } +2024-07-25 23:55:39,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 98/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 4.2005754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:39,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43591 samples/s/p 1:17:18 } +2024-07-25 23:55:42,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 100/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 4.1966723e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:42,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43648 samples/s/p 1:17:15 } +2024-07-25 23:55:45,836 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 102/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 4.192771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:45,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43547 samples/s/p 1:17:13 } +2024-07-25 23:55:48,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 104/ 1625], loss: 1.248, per_step_time: 1472ms, lr: 4.1888734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:48,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.6% |████████████████████████████████████████ | 5.43172 samples/s/p 1:17:13 } +2024-07-25 23:55:51,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 106/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 4.1849753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:51,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43577 samples/s/p 1:17:07 } +2024-07-25 23:55:54,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 108/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 4.181081e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:54,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43267 samples/s/p 1:17:06 } +2024-07-25 23:55:57,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 110/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 4.177189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:55:57,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43284 samples/s/p 1:17:03 } +2024-07-25 23:56:00,596 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 112/ 1625], loss: 1.520, per_step_time: 1473ms, lr: 4.1733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:00,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43011 samples/s/p 1:17:03 } +2024-07-25 23:56:03,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 114/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 4.1694116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:03,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43534 samples/s/p 1:16:55 } +2024-07-25 23:56:06,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 116/ 1625], loss: 1.222, per_step_time: 1470ms, lr: 4.1655235e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:06,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.44018 samples/s/p 1:16:48 } +2024-07-25 23:56:09,444 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 118/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 4.1616418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:09,444 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.43793 samples/s/p 1:16:47 } +2024-07-25 23:56:12,397 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 120/ 1625], loss: 1.174, per_step_time: 1473ms, lr: 4.1577587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:12,398 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.7% |████████████████████████████████████████ | 5.42972 samples/s/p 1:16:51 } +2024-07-25 23:56:15,343 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 122/ 1625], loss: 1.139, per_step_time: 1468ms, lr: 4.15388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:15,343 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.44603 samples/s/p 1:16:34 } +2024-07-25 23:56:18,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 124/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 4.150001e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:18,298 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.42745 samples/s/p 1:16:47 } +2024-07-25 23:56:21,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 126/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 4.146126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:21,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.43517 samples/s/p 1:16:38 } +2024-07-25 23:56:24,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 128/ 1625], loss: 0.937, per_step_time: 1474ms, lr: 4.1422522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:24,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.42679 samples/s/p 1:16:42 } +2024-07-25 23:56:27,151 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 130/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 4.13838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:27,151 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.44072 samples/s/p 1:16:27 } +2024-07-25 23:56:30,101 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 132/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 4.134511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:30,101 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.43684 samples/s/p 1:16:27 } +2024-07-25 23:56:33,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 134/ 1625], loss: 1.021, per_step_time: 1470ms, lr: 4.1306434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:33,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.44088 samples/s/p 1:16:21 } +2024-07-25 23:56:35,999 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 136/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 4.126778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:35,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.43554 samples/s/p 1:16:23 } +2024-07-25 23:56:38,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 138/ 1625], loss: 1.129, per_step_time: 1473ms, lr: 4.122915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:38,953 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.8% |████████████████████████████████████████ | 5.42980 samples/s/p 1:16:25 } +2024-07-25 23:56:41,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 140/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 4.1190533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:41,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43803 samples/s/p 1:16:15 } +2024-07-25 23:56:44,864 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 142/ 1625], loss: 1.094, per_step_time: 1475ms, lr: 4.1151943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:44,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.42019 samples/s/p 1:16:27 } +2024-07-25 23:56:47,814 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 144/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 4.111337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:47,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43685 samples/s/p 1:16:10 } +2024-07-25 23:56:50,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 146/ 1625], loss: 1.277, per_step_time: 1474ms, lr: 4.1074827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:50,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.42699 samples/s/p 1:16:15 } +2024-07-25 23:56:53,727 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 148/ 1625], loss: 1.280, per_step_time: 1472ms, lr: 4.1036305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:53,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43296 samples/s/p 1:16:07 } +2024-07-25 23:56:56,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 150/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 4.099782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:56,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43581 samples/s/p 1:16:02 } +2024-07-25 23:56:59,627 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 152/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 4.0959317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:56:59,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43814 samples/s/p 1:15:57 } +2024-07-25 23:57:02,580 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 154/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 4.092085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:02,580 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 80.9% |████████████████████████████████████████ | 5.43054 samples/s/p 1:16:00 } +2024-07-25 23:57:05,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 156/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 4.0882423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:05,532 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43503 samples/s/p 1:15:54 } +2024-07-25 23:57:08,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 158/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 4.084398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:08,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43956 samples/s/p 1:15:47 } +2024-07-25 23:57:11,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 160/ 1625], loss: 1.077, per_step_time: 1473ms, lr: 4.080558e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:11,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43030 samples/s/p 1:15:52 } +2024-07-25 23:57:14,382 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 162/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 4.076722e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:14,383 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43674 samples/s/p 1:15:43 } +2024-07-25 23:57:17,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 164/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 4.072886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:17,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43325 samples/s/p 1:15:43 } +2024-07-25 23:57:20,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 166/ 1625], loss: 0.903, per_step_time: 1471ms, lr: 4.069052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:20,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43763 samples/s/p 1:15:37 } +2024-07-25 23:57:23,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 168/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 4.0652208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:23,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43666 samples/s/p 1:15:35 } +2024-07-25 23:57:26,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 170/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 4.0613913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:26,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.0% |████████████████████████████████████████ | 5.43607 samples/s/p 1:15:32 } +2024-07-25 23:57:29,134 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 172/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 4.0575633e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:29,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43534 samples/s/p 1:15:30 } +2024-07-25 23:57:32,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 174/ 1625], loss: 1.329, per_step_time: 1482ms, lr: 4.0537384e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:32,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.39593 samples/s/p 1:16:00 } +2024-07-25 23:57:35,054 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 176/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 4.0499153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:35,054 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.44090 samples/s/p 1:15:19 } +2024-07-25 23:57:38,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 178/ 1625], loss: 1.092, per_step_time: 1470ms, lr: 4.0460936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:38,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43900 samples/s/p 1:15:18 } +2024-07-25 23:57:40,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 180/ 1625], loss: 0.991, per_step_time: 1472ms, lr: 4.0422756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:40,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43290 samples/s/p 1:15:20 } +2024-07-25 23:57:43,905 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 182/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 4.038459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:43,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43642 samples/s/p 1:15:14 } +2024-07-25 23:57:46,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 184/ 1625], loss: 1.053, per_step_time: 1472ms, lr: 4.034644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:46,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43357 samples/s/p 1:15:14 } +2024-07-25 23:57:49,808 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 186/ 1625], loss: 1.000, per_step_time: 1472ms, lr: 4.030831e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:49,808 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.1% |████████████████████████████████████████ | 5.43415 samples/s/p 1:15:10 } +2024-07-25 23:57:52,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 188/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 4.027021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:52,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43893 samples/s/p 1:15:03 } +2024-07-25 23:57:55,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 190/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 4.023212e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:55,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43517 samples/s/p 1:15:03 } +2024-07-25 23:57:58,665 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 192/ 1625], loss: 1.094, per_step_time: 1475ms, lr: 4.019406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:57:58,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.42105 samples/s/p 1:15:12 } +2024-07-25 23:58:01,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 194/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 4.015604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:01,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43296 samples/s/p 1:14:59 } +2024-07-25 23:58:04,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 196/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 4.0118007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:04,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43730 samples/s/p 1:14:53 } +2024-07-25 23:58:07,517 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 198/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 4.0080004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:07,518 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43546 samples/s/p 1:14:51 } +2024-07-25 23:58:10,467 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 200/ 1625], loss: 1.201, per_step_time: 1471ms, lr: 4.0042046e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:10,468 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43591 samples/s/p 1:14:48 } +2024-07-25 23:58:13,417 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 202/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 4.000406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:13,418 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.2% |████████████████████████████████████████ | 5.43639 samples/s/p 1:14:45 } +2024-07-25 23:58:16,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 204/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 3.9966126e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:16,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43395 samples/s/p 1:14:44 } +2024-07-25 23:58:19,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 206/ 1625], loss: 1.207, per_step_time: 1470ms, lr: 3.9928236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:19,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.44048 samples/s/p 1:14:36 } +2024-07-25 23:58:22,268 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 208/ 1625], loss: 1.078, per_step_time: 1472ms, lr: 3.9890315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:22,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43294 samples/s/p 1:14:39 } +2024-07-25 23:58:25,219 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 210/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 3.9852466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:25,220 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43489 samples/s/p 1:14:34 } +2024-07-25 23:58:28,171 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 212/ 1625], loss: 1.047, per_step_time: 1472ms, lr: 3.9814613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:28,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43297 samples/s/p 1:14:33 } +2024-07-25 23:58:31,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 214/ 1625], loss: 1.071, per_step_time: 1470ms, lr: 3.977679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:31,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43913 samples/s/p 1:14:25 } +2024-07-25 23:58:34,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 216/ 1625], loss: 1.060, per_step_time: 1471ms, lr: 3.973899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:34,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43824 samples/s/p 1:14:23 } +2024-07-25 23:58:37,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 218/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 3.9701185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:37,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.3% |████████████████████████████████████████ | 5.43281 samples/s/p 1:14:24 } +2024-07-25 23:58:39,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 220/ 1625], loss: 1.015, per_step_time: 1472ms, lr: 3.9663437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:39,973 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.43289 samples/s/p 1:14:21 } +2024-07-25 23:58:42,923 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 222/ 1625], loss: 1.308, per_step_time: 1471ms, lr: 3.9625684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:42,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.43577 samples/s/p 1:14:16 } +2024-07-25 23:58:45,873 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 224/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 3.958796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:45,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.43524 samples/s/p 1:14:13 } +2024-07-25 23:58:48,821 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 226/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 3.955026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:48,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.44031 samples/s/p 1:14:06 } +2024-07-25 23:58:51,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 228/ 1625], loss: 1.006, per_step_time: 1471ms, lr: 3.951258e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:51,773 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.43632 samples/s/p 1:14:07 } +2024-07-25 23:58:54,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 230/ 1625], loss: 1.118, per_step_time: 1469ms, lr: 3.947492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:54,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.44359 samples/s/p 1:13:58 } +2024-07-25 23:58:57,666 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 232/ 1625], loss: 1.048, per_step_time: 1470ms, lr: 3.943728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:58:57,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.44094 samples/s/p 1:13:57 } +2024-07-25 23:59:00,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 234/ 1625], loss: 1.132, per_step_time: 1469ms, lr: 3.939966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:00,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.4% |████████████████████████████████████████ | 5.44422 samples/s/p 1:13:51 } +2024-07-25 23:59:03,560 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 236/ 1625], loss: 1.156, per_step_time: 1470ms, lr: 3.936207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:03,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.44038 samples/s/p 1:13:52 } +2024-07-25 23:59:06,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 238/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 3.9324523e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:06,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43433 samples/s/p 1:13:54 } +2024-07-25 23:59:09,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 240/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 3.928695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:09,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43357 samples/s/p 1:13:51 } +2024-07-25 23:59:12,414 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 242/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 3.9249417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:12,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43361 samples/s/p 1:13:48 } +2024-07-25 23:59:15,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 244/ 1625], loss: 0.906, per_step_time: 1470ms, lr: 3.9211923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:15,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43903 samples/s/p 1:13:41 } +2024-07-25 23:59:18,317 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 246/ 1625], loss: 1.091, per_step_time: 1473ms, lr: 3.9174415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:18,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.43064 samples/s/p 1:13:45 } +2024-07-25 23:59:21,288 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 248/ 1625], loss: 1.137, per_step_time: 1482ms, lr: 3.913695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:21,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.39736 samples/s/p 1:14:09 } +2024-07-25 23:59:24,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 250/ 1625], loss: 1.101, per_step_time: 1473ms, lr: 3.9099527e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:24,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.5% |████████████████████████████████████████ | 5.42838 samples/s/p 1:13:41 } +2024-07-25 23:59:27,185 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 252/ 1625], loss: 1.115, per_step_time: 1468ms, lr: 3.906208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:27,186 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.44918 samples/s/p 1:13:21 } +2024-07-25 23:59:30,135 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 254/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 3.90247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:30,136 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43655 samples/s/p 1:13:28 } +2024-07-25 23:59:33,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 256/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 3.898732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:33,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43744 samples/s/p 1:13:25 } +2024-07-25 23:59:36,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 258/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 3.894994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:36,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43493 samples/s/p 1:13:24 } +2024-07-25 23:59:38,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 260/ 1625], loss: 1.210, per_step_time: 1470ms, lr: 3.891262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:38,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43860 samples/s/p 1:13:18 } +2024-07-25 23:59:41,934 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 262/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 3.88753e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:41,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43746 samples/s/p 1:13:16 } +2024-07-25 23:59:44,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 264/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 3.8838007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:44,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43440 samples/s/p 1:13:15 } +2024-07-25 23:59:47,834 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 266/ 1625], loss: 0.961, per_step_time: 1471ms, lr: 3.880073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:47,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43784 samples/s/p 1:13:09 } +2024-07-25 23:59:50,787 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 268/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 3.8763483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:50,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.6% |████████████████████████████████████████ | 5.43130 samples/s/p 1:13:12 } +2024-07-25 23:59:53,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 270/ 1625], loss: 0.994, per_step_time: 1471ms, lr: 3.872625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:53,737 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43797 samples/s/p 1:13:03 } +2024-07-25 23:59:56,690 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 272/ 1625], loss: 1.267, per_step_time: 1473ms, lr: 3.868904e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:56,690 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43004 samples/s/p 1:13:07 } +2024-07-25 23:59:59,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 274/ 1625], loss: 1.012, per_step_time: 1471ms, lr: 3.865185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-25 23:59:59,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43504 samples/s/p 1:13:00 } +2024-07-26 00:00:02,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 276/ 1625], loss: 1.265, per_step_time: 1473ms, lr: 3.861469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:02,595 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.42951 samples/s/p 1:13:01 } +2024-07-26 00:00:05,542 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 278/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 3.8577537e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:05,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.44117 samples/s/p 1:12:49 } +2024-07-26 00:00:08,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 280/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 3.8540416e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:08,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43579 samples/s/p 1:12:51 } +2024-07-26 00:00:11,441 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 282/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 3.8503335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:11,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.43915 samples/s/p 1:12:45 } +2024-07-26 00:00:14,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 284/ 1625], loss: 1.117, per_step_time: 1473ms, lr: 3.8466233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:14,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.7% |████████████████████████████████████████ | 5.42919 samples/s/p 1:12:50 } +2024-07-26 00:00:17,347 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 286/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 3.8429175e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:17,348 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43239 samples/s/p 1:12:44 } +2024-07-26 00:00:20,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 288/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 3.839216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:20,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43177 samples/s/p 1:12:42 } +2024-07-26 00:00:23,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 290/ 1625], loss: 0.970, per_step_time: 1473ms, lr: 3.8355124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:23,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43081 samples/s/p 1:12:40 } +2024-07-26 00:00:26,201 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 292/ 1625], loss: 1.233, per_step_time: 1469ms, lr: 3.8318144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:26,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.44232 samples/s/p 1:12:28 } +2024-07-26 00:00:29,154 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 294/ 1625], loss: 1.117, per_step_time: 1473ms, lr: 3.828117e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:29,154 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43082 samples/s/p 1:12:34 } +2024-07-26 00:00:32,106 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 296/ 1625], loss: 1.280, per_step_time: 1472ms, lr: 3.8244198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:32,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43238 samples/s/p 1:12:30 } +2024-07-26 00:00:35,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 298/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 3.820728e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:35,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43712 samples/s/p 1:12:23 } +2024-07-26 00:00:38,007 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 300/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 3.817038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:38,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.8% |████████████████████████████████████████ | 5.43428 samples/s/p 1:12:22 } +2024-07-26 00:00:40,957 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 302/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 3.8133467e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:40,958 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43656 samples/s/p 1:12:18 } +2024-07-26 00:00:43,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 304/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 3.8096632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:43,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43140 samples/s/p 1:12:19 } +2024-07-26 00:00:46,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 306/ 1625], loss: 1.247, per_step_time: 1473ms, lr: 3.8059788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:46,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.42776 samples/s/p 1:12:19 } +2024-07-26 00:00:49,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 308/ 1625], loss: 1.176, per_step_time: 1472ms, lr: 3.802295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:49,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43324 samples/s/p 1:12:11 } +2024-07-26 00:00:52,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 310/ 1625], loss: 1.249, per_step_time: 1473ms, lr: 3.798616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:52,775 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43066 samples/s/p 1:12:10 } +2024-07-26 00:00:55,728 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 312/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 3.7949385e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:55,729 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43391 samples/s/p 1:12:05 } +2024-07-26 00:00:58,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 314/ 1625], loss: 1.327, per_step_time: 1473ms, lr: 3.7912619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:00:58,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.42951 samples/s/p 1:12:05 } +2024-07-26 00:01:01,633 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 316/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 3.7875889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:01,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 81.9% |████████████████████████████████████████ | 5.43433 samples/s/p 1:11:59 } +2024-07-26 00:01:04,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 318/ 1625], loss: 1.219, per_step_time: 1472ms, lr: 3.7839172e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:04,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.43193 samples/s/p 1:11:58 } +2024-07-26 00:01:07,534 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 320/ 1625], loss: 1.129, per_step_time: 1470ms, lr: 3.7802492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:07,535 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.43946 samples/s/p 1:11:49 } +2024-07-26 00:01:10,482 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 322/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 3.7765808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:10,483 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.43974 samples/s/p 1:11:46 } +2024-07-26 00:01:13,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 324/ 1625], loss: 1.081, per_step_time: 1471ms, lr: 3.772916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:13,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |████████████████████████████████████████ | 5.43515 samples/s/p 1:11:46 } +2024-07-26 00:01:16,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 326/ 1625], loss: 1.304, per_step_time: 1470ms, lr: 3.7692557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:16,381 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.43984 samples/s/p 1:11:40 } +2024-07-26 00:01:19,332 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 328/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 3.7655932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:19,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.43444 samples/s/p 1:11:41 } +2024-07-26 00:01:22,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 330/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 3.7619338e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:22,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.43993 samples/s/p 1:11:34 } +2024-07-26 00:01:25,233 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 332/ 1625], loss: 1.214, per_step_time: 1472ms, lr: 3.75828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:25,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.0% |█████████████████████████████████████████ | 5.43162 samples/s/p 1:11:37 } +2024-07-26 00:01:28,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 334/ 1625], loss: 1.120, per_step_time: 1470ms, lr: 3.7546238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:28,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.44099 samples/s/p 1:11:27 } +2024-07-26 00:01:31,129 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 336/ 1625], loss: 1.118, per_step_time: 1470ms, lr: 3.750974e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:31,129 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43918 samples/s/p 1:11:25 } +2024-07-26 00:01:34,080 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 338/ 1625], loss: 1.289, per_step_time: 1472ms, lr: 3.7473242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:34,080 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43449 samples/s/p 1:11:26 } +2024-07-26 00:01:37,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 340/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 3.7436744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:37,031 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43424 samples/s/p 1:11:23 } +2024-07-26 00:01:39,981 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 342/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 3.740031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:39,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43499 samples/s/p 1:11:20 } +2024-07-26 00:01:42,935 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 344/ 1625], loss: 1.247, per_step_time: 1473ms, lr: 3.736388e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:42,935 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.42992 samples/s/p 1:11:21 } +2024-07-26 00:01:45,886 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 346/ 1625], loss: 0.863, per_step_time: 1471ms, lr: 3.732745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:45,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43599 samples/s/p 1:11:13 } +2024-07-26 00:01:48,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 348/ 1625], loss: 1.117, per_step_time: 1470ms, lr: 3.7291084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:48,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.1% |█████████████████████████████████████████ | 5.43864 samples/s/p 1:11:08 } +2024-07-26 00:01:51,789 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 350/ 1625], loss: 1.044, per_step_time: 1473ms, lr: 3.7254713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:51,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.42956 samples/s/p 1:11:12 } +2024-07-26 00:01:54,740 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 352/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 3.721836e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:54,740 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.43441 samples/s/p 1:11:06 } +2024-07-26 00:01:57,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 354/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 3.7182035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:01:57,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.43171 samples/s/p 1:11:05 } +2024-07-26 00:02:00,650 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 356/ 1625], loss: 1.363, per_step_time: 1475ms, lr: 3.7145737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:00,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.42173 samples/s/p 1:11:10 } +2024-07-26 00:02:03,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 358/ 1625], loss: 1.143, per_step_time: 1473ms, lr: 3.7109462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:03,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.42799 samples/s/p 1:11:02 } +2024-07-26 00:02:06,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 360/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 3.70732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:06,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.43795 samples/s/p 1:10:51 } +2024-07-26 00:02:09,505 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 362/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 3.7036962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:09,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.43620 samples/s/p 1:10:50 } +2024-07-26 00:02:12,462 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 364/ 1625], loss: 1.313, per_step_time: 1475ms, lr: 3.7000773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:12,462 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.2% |█████████████████████████████████████████ | 5.42333 samples/s/p 1:10:57 } +2024-07-26 00:02:15,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 366/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 3.6964552e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:15,412 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.43729 samples/s/p 1:10:43 } +2024-07-26 00:02:18,363 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 368/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 3.6928382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:18,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.43313 samples/s/p 1:10:43 } +2024-07-26 00:02:21,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 370/ 1625], loss: 1.399, per_step_time: 1473ms, lr: 3.6892257e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:21,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.42852 samples/s/p 1:10:44 } +2024-07-26 00:02:24,272 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 372/ 1625], loss: 1.125, per_step_time: 1473ms, lr: 3.6856104e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:24,273 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.42812 samples/s/p 1:10:41 } +2024-07-26 00:02:27,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 374/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 3.6819997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:27,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.43693 samples/s/p 1:10:31 } +2024-07-26 00:02:30,176 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 376/ 1625], loss: 1.207, per_step_time: 1473ms, lr: 3.678394e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:30,176 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.43079 samples/s/p 1:10:33 } +2024-07-26 00:02:33,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 378/ 1625], loss: 1.106, per_step_time: 1473ms, lr: 3.6747856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:33,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.42914 samples/s/p 1:10:31 } +2024-07-26 00:02:36,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 380/ 1625], loss: 1.104, per_step_time: 1474ms, lr: 3.671183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:36,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.3% |█████████████████████████████████████████ | 5.42543 samples/s/p 1:10:31 } +2024-07-26 00:02:39,037 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 382/ 1625], loss: 1.245, per_step_time: 1472ms, lr: 3.667582e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:39,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43334 samples/s/p 1:10:22 } +2024-07-26 00:02:41,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 384/ 1625], loss: 1.105, per_step_time: 1474ms, lr: 3.6639794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:41,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.42380 samples/s/p 1:10:27 } +2024-07-26 00:02:44,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 386/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 3.6603833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:44,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43354 samples/s/p 1:10:16 } +2024-07-26 00:02:47,898 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 388/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 3.656788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:47,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43281 samples/s/p 1:10:14 } +2024-07-26 00:02:50,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 390/ 1625], loss: 1.160, per_step_time: 1473ms, lr: 3.6531942e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:50,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43035 samples/s/p 1:10:13 } +2024-07-26 00:02:53,801 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 392/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 3.6496049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:53,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43572 samples/s/p 1:10:06 } +2024-07-26 00:02:56,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 394/ 1625], loss: 0.928, per_step_time: 1473ms, lr: 3.6460156e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:56,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.42776 samples/s/p 1:10:09 } +2024-07-26 00:02:59,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 396/ 1625], loss: 1.022, per_step_time: 1472ms, lr: 3.642429e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:02:59,707 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43455 samples/s/p 1:10:01 } +2024-07-26 00:03:02,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 398/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 3.638845e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:02,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.4% |█████████████████████████████████████████ | 5.43676 samples/s/p 1:09:56 } +2024-07-26 00:03:05,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 400/ 1625], loss: 1.184, per_step_time: 1471ms, lr: 3.6352626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:05,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43693 samples/s/p 1:09:53 } +2024-07-26 00:03:08,559 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 402/ 1625], loss: 1.243, per_step_time: 1472ms, lr: 3.6316828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:08,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43239 samples/s/p 1:09:54 } +2024-07-26 00:03:11,510 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 404/ 1625], loss: 1.107, per_step_time: 1472ms, lr: 3.6281049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:11,511 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43369 samples/s/p 1:09:50 } +2024-07-26 00:03:14,463 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 406/ 1625], loss: 1.180, per_step_time: 1472ms, lr: 3.6245292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:14,463 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43151 samples/s/p 1:09:48 } +2024-07-26 00:03:17,416 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 408/ 1625], loss: 1.059, per_step_time: 1473ms, lr: 3.6209553e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:17,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43029 samples/s/p 1:09:46 } +2024-07-26 00:03:20,370 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 410/ 1625], loss: 1.160, per_step_time: 1473ms, lr: 3.6173842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:20,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43021 samples/s/p 1:09:44 } +2024-07-26 00:03:23,323 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 412/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 3.613815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:23,323 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43187 samples/s/p 1:09:39 } +2024-07-26 00:03:26,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 414/ 1625], loss: 1.053, per_step_time: 1473ms, lr: 3.6102506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:26,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.5% |█████████████████████████████████████████ | 5.43108 samples/s/p 1:09:37 } +2024-07-26 00:03:29,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 416/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 3.606684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:29,228 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43196 samples/s/p 1:09:33 } +2024-07-26 00:03:32,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 418/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 3.6031215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:32,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43174 samples/s/p 1:09:31 } +2024-07-26 00:03:35,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 420/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 3.5995631e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:35,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43344 samples/s/p 1:09:26 } +2024-07-26 00:03:38,083 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 422/ 1625], loss: 1.059, per_step_time: 1471ms, lr: 3.5960024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:38,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43598 samples/s/p 1:09:21 } +2024-07-26 00:03:41,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 424/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 3.5924495e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:41,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43263 samples/s/p 1:09:21 } +2024-07-26 00:03:43,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 426/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 3.5888947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:43,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43150 samples/s/p 1:09:19 } +2024-07-26 00:03:46,938 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 428/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 3.5853418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:46,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43493 samples/s/p 1:09:13 } +2024-07-26 00:03:49,892 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 430/ 1625], loss: 1.095, per_step_time: 1473ms, lr: 3.5817948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:49,892 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.6% |█████████████████████████████████████████ | 5.43100 samples/s/p 1:09:13 } +2024-07-26 00:03:52,841 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 432/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 3.5782468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:52,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43751 samples/s/p 1:09:06 } +2024-07-26 00:03:55,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 434/ 1625], loss: 1.134, per_step_time: 1473ms, lr: 3.5747025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:55,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.42969 samples/s/p 1:09:09 } +2024-07-26 00:03:58,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 436/ 1625], loss: 1.316, per_step_time: 1471ms, lr: 3.57116e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:03:58,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43518 samples/s/p 1:09:01 } +2024-07-26 00:04:01,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 438/ 1625], loss: 1.138, per_step_time: 1474ms, lr: 3.567619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:01,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.42606 samples/s/p 1:09:05 } +2024-07-26 00:04:04,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 440/ 1625], loss: 0.942, per_step_time: 1471ms, lr: 3.5640805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:04,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43794 samples/s/p 1:08:53 } +2024-07-26 00:04:07,604 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 442/ 1625], loss: 1.173, per_step_time: 1473ms, lr: 3.5605449e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:07,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43071 samples/s/p 1:08:56 } +2024-07-26 00:04:10,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 444/ 1625], loss: 1.067, per_step_time: 1472ms, lr: 3.557011e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:10,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43376 samples/s/p 1:08:51 } +2024-07-26 00:04:13,508 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 446/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 3.5534795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:13,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.7% |█████████████████████████████████████████ | 5.43147 samples/s/p 1:08:50 } +2024-07-26 00:04:16,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 448/ 1625], loss: 1.162, per_step_time: 1486ms, lr: 3.5499497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:16,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.38310 samples/s/p 1:09:24 } +2024-07-26 00:04:19,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 450/ 1625], loss: 1.214, per_step_time: 1471ms, lr: 3.5464218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:19,438 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43591 samples/s/p 1:08:40 } +2024-07-26 00:04:22,389 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 452/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 3.5428975e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:22,389 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43412 samples/s/p 1:08:39 } +2024-07-26 00:04:25,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 454/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 3.5393746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:25,339 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43664 samples/s/p 1:08:34 } +2024-07-26 00:04:28,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 456/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 3.5358544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:28,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43577 samples/s/p 1:08:32 } +2024-07-26 00:04:31,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 458/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 3.532336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:31,241 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43481 samples/s/p 1:08:29 } +2024-07-26 00:04:34,200 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 460/ 1625], loss: 1.344, per_step_time: 1476ms, lr: 3.5288194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:34,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.41824 samples/s/p 1:08:39 } +2024-07-26 00:04:37,152 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 462/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 3.525307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:37,153 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.8% |█████████████████████████████████████████ | 5.43319 samples/s/p 1:08:25 } +2024-07-26 00:04:40,105 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 464/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 3.5217954e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:40,106 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43462 samples/s/p 1:08:21 } +2024-07-26 00:04:43,061 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 466/ 1625], loss: 1.228, per_step_time: 1472ms, lr: 3.5182838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:43,062 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43134 samples/s/p 1:08:20 } +2024-07-26 00:04:46,011 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 468/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 3.5147787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:46,011 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43760 samples/s/p 1:08:12 } +2024-07-26 00:04:48,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 470/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 3.511273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:48,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43873 samples/s/p 1:08:09 } +2024-07-26 00:04:51,906 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 472/ 1625], loss: 1.018, per_step_time: 1470ms, lr: 3.5077683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:51,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.44200 samples/s/p 1:08:03 } +2024-07-26 00:04:54,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 474/ 1625], loss: 1.285, per_step_time: 1469ms, lr: 3.50427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:54,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.44404 samples/s/p 1:07:59 } +2024-07-26 00:04:57,801 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 476/ 1625], loss: 1.278, per_step_time: 1471ms, lr: 3.5007715e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:04:57,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43811 samples/s/p 1:08:00 } +2024-07-26 00:05:00,755 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 478/ 1625], loss: 1.040, per_step_time: 1473ms, lr: 3.4972754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:00,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 82.9% |█████████████████████████████████████████ | 5.43077 samples/s/p 1:08:03 } +2024-07-26 00:05:03,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 480/ 1625], loss: 0.944, per_step_time: 1471ms, lr: 3.4937802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:03,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43500 samples/s/p 1:07:57 } +2024-07-26 00:05:06,653 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 482/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 3.4902887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:06,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.44051 samples/s/p 1:07:50 } +2024-07-26 00:05:09,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 484/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 3.4867994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:09,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43712 samples/s/p 1:07:49 } +2024-07-26 00:05:12,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 486/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 3.4833124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:12,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43565 samples/s/p 1:07:47 } +2024-07-26 00:05:15,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 488/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 3.4798268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:15,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43298 samples/s/p 1:07:47 } +2024-07-26 00:05:18,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 490/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 3.4763439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:18,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43664 samples/s/p 1:07:41 } +2024-07-26 00:05:21,410 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 492/ 1625], loss: 1.010, per_step_time: 1473ms, lr: 3.4728632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:21,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.42966 samples/s/p 1:07:43 } +2024-07-26 00:05:24,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 494/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 3.4693844e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:24,361 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.0% |█████████████████████████████████████████ | 5.43671 samples/s/p 1:07:35 } +2024-07-26 00:05:27,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 496/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 3.4659074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:27,312 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43471 samples/s/p 1:07:33 } +2024-07-26 00:05:30,264 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 498/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 3.4624331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:30,264 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43118 samples/s/p 1:07:33 } +2024-07-26 00:05:33,213 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 500/ 1625], loss: 1.072, per_step_time: 1470ms, lr: 3.4589616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:33,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43880 samples/s/p 1:07:25 } +2024-07-26 00:05:36,166 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 502/ 1625], loss: 1.184, per_step_time: 1473ms, lr: 3.4554914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:36,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43100 samples/s/p 1:07:27 } +2024-07-26 00:05:39,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 504/ 1625], loss: 1.095, per_step_time: 1474ms, lr: 3.452024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:39,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.42484 samples/s/p 1:07:29 } +2024-07-26 00:05:42,073 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 506/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 3.448562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:42,073 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43483 samples/s/p 1:07:19 } +2024-07-26 00:05:45,027 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 508/ 1625], loss: 1.050, per_step_time: 1473ms, lr: 3.4450968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:45,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.42820 samples/s/p 1:07:21 } +2024-07-26 00:05:47,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 510/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 3.4416348e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:47,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.1% |█████████████████████████████████████████ | 5.43245 samples/s/p 1:07:15 } +2024-07-26 00:05:50,933 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 512/ 1625], loss: 1.109, per_step_time: 1473ms, lr: 3.4381792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:50,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.42876 samples/s/p 1:07:14 } +2024-07-26 00:05:53,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 514/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 3.4347222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:53,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43463 samples/s/p 1:07:07 } +2024-07-26 00:05:56,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 516/ 1625], loss: 1.178, per_step_time: 1474ms, lr: 3.431267e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:56,842 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.42392 samples/s/p 1:07:12 } +2024-07-26 00:05:59,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 518/ 1625], loss: 1.259, per_step_time: 1473ms, lr: 3.4278169e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:05:59,796 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.42841 samples/s/p 1:07:06 } +2024-07-26 00:06:02,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 520/ 1625], loss: 1.023, per_step_time: 1472ms, lr: 3.4243667e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:02,748 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43330 samples/s/p 1:06:59 } +2024-07-26 00:06:05,698 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 522/ 1625], loss: 1.001, per_step_time: 1471ms, lr: 3.4209197e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:05,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43534 samples/s/p 1:06:55 } +2024-07-26 00:06:08,649 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 524/ 1625], loss: 0.867, per_step_time: 1471ms, lr: 3.417474e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:08,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43485 samples/s/p 1:06:52 } +2024-07-26 00:06:11,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 526/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 3.4140307e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:11,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43795 samples/s/p 1:06:47 } +2024-07-26 00:06:14,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 528/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 3.4105901e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:14,549 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.2% |█████████████████████████████████████████ | 5.43583 samples/s/p 1:06:46 } +2024-07-26 00:06:17,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 530/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 3.4071522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:17,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43689 samples/s/p 1:06:42 } +2024-07-26 00:06:20,449 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 532/ 1625], loss: 1.207, per_step_time: 1472ms, lr: 3.4037148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:20,449 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43438 samples/s/p 1:06:41 } +2024-07-26 00:06:23,398 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 534/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 3.400282e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:23,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43765 samples/s/p 1:06:35 } +2024-07-26 00:06:26,349 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 536/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 3.39685e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:26,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43454 samples/s/p 1:06:35 } +2024-07-26 00:06:29,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 538/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 3.3934198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:29,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43760 samples/s/p 1:06:29 } +2024-07-26 00:06:32,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 540/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 3.3899928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:32,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43631 samples/s/p 1:06:27 } +2024-07-26 00:06:35,196 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 542/ 1625], loss: 1.121, per_step_time: 1469ms, lr: 3.386568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:35,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.44291 samples/s/p 1:06:20 } +2024-07-26 00:06:38,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 544/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 3.3831452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:38,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.3% |█████████████████████████████████████████ | 5.43532 samples/s/p 1:06:22 } +2024-07-26 00:06:41,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 546/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 3.3797246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:41,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43258 samples/s/p 1:06:21 } +2024-07-26 00:06:44,044 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 548/ 1625], loss: 1.089, per_step_time: 1469ms, lr: 3.3763054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:44,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.44557 samples/s/p 1:06:09 } +2024-07-26 00:06:46,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 550/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 3.3728916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:46,997 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43287 samples/s/p 1:06:15 } +2024-07-26 00:06:49,948 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 552/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 3.369476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:49,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43331 samples/s/p 1:06:12 } +2024-07-26 00:06:52,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 554/ 1625], loss: 1.074, per_step_time: 1471ms, lr: 3.366064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:52,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43780 samples/s/p 1:06:06 } +2024-07-26 00:06:55,849 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 556/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 3.3626561e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:55,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43363 samples/s/p 1:06:06 } +2024-07-26 00:06:58,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 558/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 3.3592482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:06:58,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43191 samples/s/p 1:06:04 } +2024-07-26 00:07:01,751 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 560/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 3.3558422e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:01,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.4% |█████████████████████████████████████████ | 5.43762 samples/s/p 1:05:57 } +2024-07-26 00:07:04,702 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 562/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 3.3524425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:04,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43487 samples/s/p 1:05:56 } +2024-07-26 00:07:07,655 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 564/ 1625], loss: 1.248, per_step_time: 1473ms, lr: 3.3490414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:07,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43062 samples/s/p 1:05:56 } +2024-07-26 00:07:10,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 566/ 1625], loss: 1.083, per_step_time: 1473ms, lr: 3.345643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:10,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.42860 samples/s/p 1:05:55 } +2024-07-26 00:07:13,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 568/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 3.3422466e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:13,561 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43382 samples/s/p 1:05:48 } +2024-07-26 00:07:16,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 570/ 1625], loss: 1.073, per_step_time: 1470ms, lr: 3.3388533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:16,509 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.44077 samples/s/p 1:05:40 } +2024-07-26 00:07:19,461 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 572/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 3.3354622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:19,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43283 samples/s/p 1:05:43 } +2024-07-26 00:07:22,412 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 574/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 3.3320725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:22,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43425 samples/s/p 1:05:39 } +2024-07-26 00:07:25,365 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 576/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 3.3286851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:25,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.5% |█████████████████████████████████████████ | 5.43192 samples/s/p 1:05:38 } +2024-07-26 00:07:28,315 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 578/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 3.325301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:28,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43570 samples/s/p 1:05:32 } +2024-07-26 00:07:31,267 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 580/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 3.321918e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:31,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43268 samples/s/p 1:05:31 } +2024-07-26 00:07:34,221 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 582/ 1625], loss: 1.174, per_step_time: 1473ms, lr: 3.318538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:34,221 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.42966 samples/s/p 1:05:30 } +2024-07-26 00:07:37,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 584/ 1625], loss: 1.067, per_step_time: 1473ms, lr: 3.3151605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:37,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43093 samples/s/p 1:05:27 } +2024-07-26 00:07:40,125 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 586/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 3.3117835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:40,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43418 samples/s/p 1:05:21 } +2024-07-26 00:07:43,075 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 588/ 1625], loss: 1.052, per_step_time: 1471ms, lr: 3.3084107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:43,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43571 samples/s/p 1:05:17 } +2024-07-26 00:07:46,029 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 590/ 1625], loss: 1.147, per_step_time: 1473ms, lr: 3.3050396e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:46,029 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43018 samples/s/p 1:05:18 } +2024-07-26 00:07:48,977 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 592/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 3.3016709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:48,977 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.6% |█████████████████████████████████████████ | 5.43958 samples/s/p 1:05:09 } +2024-07-26 00:07:51,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 594/ 1625], loss: 1.179, per_step_time: 1472ms, lr: 3.2983044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:51,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43421 samples/s/p 1:05:10 } +2024-07-26 00:07:54,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 596/ 1625], loss: 1.218, per_step_time: 1473ms, lr: 3.2949383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:54,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.42947 samples/s/p 1:05:10 } +2024-07-26 00:07:57,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 598/ 1625], loss: 1.168, per_step_time: 1471ms, lr: 3.2915755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:07:57,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43594 samples/s/p 1:05:02 } +2024-07-26 00:08:00,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 600/ 1625], loss: 1.328, per_step_time: 1472ms, lr: 3.2882176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:00,785 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43165 samples/s/p 1:05:03 } +2024-07-26 00:08:03,732 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 602/ 1625], loss: 1.340, per_step_time: 1470ms, lr: 3.2848575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:03,733 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.44115 samples/s/p 1:04:53 } +2024-07-26 00:08:06,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 604/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 3.281505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:06,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43613 samples/s/p 1:04:53 } +2024-07-26 00:08:09,637 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 606/ 1625], loss: 1.069, per_step_time: 1473ms, lr: 3.2781509e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:09,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.42816 samples/s/p 1:04:56 } +2024-07-26 00:08:12,589 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 608/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 3.274798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:12,590 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.7% |█████████████████████████████████████████ | 5.43164 samples/s/p 1:04:51 } +2024-07-26 00:08:15,538 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 610/ 1625], loss: 1.189, per_step_time: 1470ms, lr: 3.271452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:15,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43886 samples/s/p 1:04:43 } +2024-07-26 00:08:18,488 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 612/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 3.2681055e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:18,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43646 samples/s/p 1:04:41 } +2024-07-26 00:08:21,438 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 614/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 3.2647613e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:21,439 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43589 samples/s/p 1:04:39 } +2024-07-26 00:08:24,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 616/ 1625], loss: 1.279, per_step_time: 1473ms, lr: 3.2614184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:24,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.42968 samples/s/p 1:04:40 } +2024-07-26 00:08:27,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 618/ 1625], loss: 1.291, per_step_time: 1470ms, lr: 3.2580788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:27,341 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43887 samples/s/p 1:04:31 } +2024-07-26 00:08:30,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 620/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 3.2547418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:30,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43711 samples/s/p 1:04:29 } +2024-07-26 00:08:33,240 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 622/ 1625], loss: 1.304, per_step_time: 1471ms, lr: 3.2514067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:33,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43771 samples/s/p 1:04:26 } +2024-07-26 00:08:36,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 624/ 1625], loss: 1.032, per_step_time: 1471ms, lr: 3.2480734e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:36,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.8% |█████████████████████████████████████████ | 5.43815 samples/s/p 1:04:23 } +2024-07-26 00:08:39,136 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 626/ 1625], loss: 1.105, per_step_time: 1469ms, lr: 3.2447433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:39,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.44262 samples/s/p 1:04:16 } +2024-07-26 00:08:42,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 628/ 1625], loss: 1.020, per_step_time: 1471ms, lr: 3.241415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:42,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.43840 samples/s/p 1:04:17 } +2024-07-26 00:08:45,036 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 630/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 3.2380885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:45,036 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.43577 samples/s/p 1:04:15 } +2024-07-26 00:08:47,990 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 632/ 1625], loss: 1.199, per_step_time: 1473ms, lr: 3.2347662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:47,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.42754 samples/s/p 1:04:18 } +2024-07-26 00:08:50,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 634/ 1625], loss: 1.274, per_step_time: 1473ms, lr: 3.2314433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:50,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.42949 samples/s/p 1:04:14 } +2024-07-26 00:08:53,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 636/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 3.2281246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:53,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.43440 samples/s/p 1:04:08 } +2024-07-26 00:08:56,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 638/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 3.224808e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:56,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.43579 samples/s/p 1:04:04 } +2024-07-26 00:08:59,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 640/ 1625], loss: 1.188, per_step_time: 1473ms, lr: 3.221492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:08:59,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 83.9% |█████████████████████████████████████████ | 5.43037 samples/s/p 1:04:05 } +2024-07-26 00:09:02,754 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 642/ 1625], loss: 1.075, per_step_time: 1473ms, lr: 3.2181792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:02,755 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.42838 samples/s/p 1:04:03 } +2024-07-26 00:09:05,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 644/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 3.214871e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:05,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.43471 samples/s/p 1:03:56 } +2024-07-26 00:09:08,657 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 646/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 3.2115609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:08,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.43358 samples/s/p 1:03:53 } +2024-07-26 00:09:11,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 648/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 3.2082567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:11,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |█████████████████████████████████████████ | 5.43712 samples/s/p 1:03:48 } +2024-07-26 00:09:14,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 650/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 3.2049534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:14,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.43617 samples/s/p 1:03:46 } +2024-07-26 00:09:17,503 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 652/ 1625], loss: 1.200, per_step_time: 1469ms, lr: 3.20165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:17,504 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.44226 samples/s/p 1:03:39 } +2024-07-26 00:09:20,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 654/ 1625], loss: 1.020, per_step_time: 1470ms, lr: 3.1983536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:20,453 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.43868 samples/s/p 1:03:38 } +2024-07-26 00:09:23,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 656/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 3.1950567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:23,405 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.43244 samples/s/p 1:03:40 } +2024-07-26 00:09:26,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 658/ 1625], loss: 1.274, per_step_time: 1471ms, lr: 3.1917602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:26,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.0% |██████████████████████████████████████████ | 5.43527 samples/s/p 1:03:35 } +2024-07-26 00:09:29,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 660/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 3.1884701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:29,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43349 samples/s/p 1:03:33 } +2024-07-26 00:09:32,257 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 662/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 3.1851805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:32,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43723 samples/s/p 1:03:27 } +2024-07-26 00:09:35,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 664/ 1625], loss: 0.933, per_step_time: 1477ms, lr: 3.1818931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:35,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.41342 samples/s/p 1:03:41 } +2024-07-26 00:09:38,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 666/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 3.1786071e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:38,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43370 samples/s/p 1:03:24 } +2024-07-26 00:09:41,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 668/ 1625], loss: 1.047, per_step_time: 1473ms, lr: 3.1753243e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:41,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.42974 samples/s/p 1:03:24 } +2024-07-26 00:09:44,079 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 670/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 3.1720447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:44,079 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43173 samples/s/p 1:03:19 } +2024-07-26 00:09:47,037 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 672/ 1625], loss: 1.009, per_step_time: 1475ms, lr: 3.1687646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:47,038 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.42050 samples/s/p 1:03:24 } +2024-07-26 00:09:49,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 674/ 1625], loss: 1.014, per_step_time: 1472ms, lr: 3.1654881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:49,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.1% |██████████████████████████████████████████ | 5.43358 samples/s/p 1:03:12 } +2024-07-26 00:09:52,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 676/ 1625], loss: 1.079, per_step_time: 1473ms, lr: 3.1622171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:52,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.42938 samples/s/p 1:03:12 } +2024-07-26 00:09:55,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 678/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 3.1589434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:55,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43986 samples/s/p 1:03:02 } +2024-07-26 00:09:58,840 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 680/ 1625], loss: 1.148, per_step_time: 1471ms, lr: 3.1556738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:09:58,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43682 samples/s/p 1:03:01 } +2024-07-26 00:10:01,792 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 682/ 1625], loss: 1.087, per_step_time: 1472ms, lr: 3.1524087e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:01,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43289 samples/s/p 1:03:01 } +2024-07-26 00:10:04,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 684/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 3.1491418e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:04,744 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43493 samples/s/p 1:02:57 } +2024-07-26 00:10:07,694 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 686/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 3.1458799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:07,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43671 samples/s/p 1:02:52 } +2024-07-26 00:10:10,645 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 688/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 3.1426216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:10,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.43352 samples/s/p 1:02:52 } +2024-07-26 00:10:13,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 690/ 1625], loss: 1.115, per_step_time: 1469ms, lr: 3.1393615e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:13,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.2% |██████████████████████████████████████████ | 5.44278 samples/s/p 1:02:42 } +2024-07-26 00:10:16,542 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 692/ 1625], loss: 1.183, per_step_time: 1471ms, lr: 3.1361074e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:16,542 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43578 samples/s/p 1:02:44 } +2024-07-26 00:10:19,490 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 694/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 3.1328536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:19,491 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43930 samples/s/p 1:02:39 } +2024-07-26 00:10:22,445 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 696/ 1625], loss: 1.155, per_step_time: 1473ms, lr: 3.1296004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:22,445 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.42865 samples/s/p 1:02:43 } +2024-07-26 00:10:25,395 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 698/ 1625], loss: 1.118, per_step_time: 1471ms, lr: 3.1263544e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:25,396 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43505 samples/s/p 1:02:36 } +2024-07-26 00:10:28,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 700/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 3.123107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:28,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43605 samples/s/p 1:02:32 } +2024-07-26 00:10:31,296 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 702/ 1625], loss: 1.047, per_step_time: 1471ms, lr: 3.119862e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:31,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43485 samples/s/p 1:02:30 } +2024-07-26 00:10:34,249 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 704/ 1625], loss: 1.301, per_step_time: 1472ms, lr: 3.116621e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:34,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43254 samples/s/p 1:02:29 } +2024-07-26 00:10:37,202 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 706/ 1625], loss: 1.163, per_step_time: 1472ms, lr: 3.1133818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:37,202 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.3% |██████████████████████████████████████████ | 5.43208 samples/s/p 1:02:26 } +2024-07-26 00:10:40,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 708/ 1625], loss: 1.261, per_step_time: 1470ms, lr: 3.110144e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:40,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43934 samples/s/p 1:02:18 } +2024-07-26 00:10:43,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 710/ 1625], loss: 1.110, per_step_time: 1470ms, lr: 3.106909e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:43,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.44087 samples/s/p 1:02:14 } +2024-07-26 00:10:46,050 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 712/ 1625], loss: 1.100, per_step_time: 1472ms, lr: 3.1036766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:46,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43191 samples/s/p 1:02:17 } +2024-07-26 00:10:49,002 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 714/ 1625], loss: 1.361, per_step_time: 1472ms, lr: 3.100446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:49,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43223 samples/s/p 1:02:14 } +2024-07-26 00:10:51,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 716/ 1625], loss: 1.187, per_step_time: 1473ms, lr: 3.0972174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:51,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43095 samples/s/p 1:02:12 } +2024-07-26 00:10:54,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 718/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 3.093991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:54,906 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43670 samples/s/p 1:02:05 } +2024-07-26 00:10:57,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 720/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 3.090769e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:10:57,857 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.43550 samples/s/p 1:02:03 } +2024-07-26 00:11:00,812 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 722/ 1625], loss: 1.131, per_step_time: 1474ms, lr: 3.0875462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:00,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.4% |██████████████████████████████████████████ | 5.42602 samples/s/p 1:02:07 } +2024-07-26 00:11:03,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 724/ 1625], loss: 1.065, per_step_time: 1472ms, lr: 3.0843275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:03,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43122 samples/s/p 1:02:00 } +2024-07-26 00:11:06,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 726/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 3.0811125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:06,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43704 samples/s/p 1:01:53 } +2024-07-26 00:11:09,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 728/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 3.0778956e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:09,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43125 samples/s/p 1:01:54 } +2024-07-26 00:11:12,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 730/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 3.0746833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:12,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43597 samples/s/p 1:01:48 } +2024-07-26 00:11:15,572 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 732/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 3.071475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:15,572 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.42774 samples/s/p 1:01:51 } +2024-07-26 00:11:18,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 734/ 1625], loss: 1.249, per_step_time: 1474ms, lr: 3.0682659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:18,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.42538 samples/s/p 1:01:49 } +2024-07-26 00:11:21,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 736/ 1625], loss: 1.108, per_step_time: 1473ms, lr: 3.0650622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:21,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43068 samples/s/p 1:01:43 } +2024-07-26 00:11:24,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 738/ 1625], loss: 1.250, per_step_time: 1471ms, lr: 3.0618598e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:24,432 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.5% |██████████████████████████████████████████ | 5.43669 samples/s/p 1:01:36 } +2024-07-26 00:11:27,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 740/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 3.058657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:27,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43652 samples/s/p 1:01:33 } +2024-07-26 00:11:30,332 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 742/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 3.0554602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:30,333 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43503 samples/s/p 1:01:31 } +2024-07-26 00:11:33,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 744/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 3.0522642e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:33,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43453 samples/s/p 1:01:29 } +2024-07-26 00:11:36,238 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 746/ 1625], loss: 1.211, per_step_time: 1473ms, lr: 3.0490683e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:36,238 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.42867 samples/s/p 1:01:30 } +2024-07-26 00:11:39,189 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 748/ 1625], loss: 1.085, per_step_time: 1472ms, lr: 3.045879e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:39,190 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43378 samples/s/p 1:01:23 } +2024-07-26 00:11:42,143 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 750/ 1625], loss: 1.126, per_step_time: 1473ms, lr: 3.042689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:42,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.42998 samples/s/p 1:01:23 } +2024-07-26 00:11:45,092 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 752/ 1625], loss: 1.215, per_step_time: 1471ms, lr: 3.0395022e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:45,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43730 samples/s/p 1:01:15 } +2024-07-26 00:11:48,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 754/ 1625], loss: 1.324, per_step_time: 1471ms, lr: 3.0363185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:48,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.6% |██████████████████████████████████████████ | 5.43519 samples/s/p 1:01:13 } +2024-07-26 00:11:50,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 756/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 3.0331362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:50,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.44087 samples/s/p 1:01:07 } +2024-07-26 00:11:53,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 758/ 1625], loss: 1.239, per_step_time: 1472ms, lr: 3.0299557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:53,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.43166 samples/s/p 1:01:10 } +2024-07-26 00:11:56,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 760/ 1625], loss: 1.233, per_step_time: 1473ms, lr: 3.026778e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:56,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.42865 samples/s/p 1:01:09 } +2024-07-26 00:11:59,849 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 762/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 3.0236024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:11:59,849 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.43300 samples/s/p 1:01:03 } +2024-07-26 00:12:02,803 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 764/ 1625], loss: 1.068, per_step_time: 1473ms, lr: 3.0204305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:02,804 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.42828 samples/s/p 1:01:03 } +2024-07-26 00:12:05,752 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 766/ 1625], loss: 1.281, per_step_time: 1470ms, lr: 3.0172578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:05,752 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.43979 samples/s/p 1:00:53 } +2024-07-26 00:12:08,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 768/ 1625], loss: 1.183, per_step_time: 1469ms, lr: 3.0140895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:08,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.44558 samples/s/p 1:00:46 } +2024-07-26 00:12:11,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 770/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 3.0109254e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:11,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.7% |██████████████████████████████████████████ | 5.43371 samples/s/p 1:00:51 } +2024-07-26 00:12:14,597 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 772/ 1625], loss: 1.137, per_step_time: 1470ms, lr: 3.0077595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:14,597 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43977 samples/s/p 1:00:44 } +2024-07-26 00:12:17,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 774/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 3.004599e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:17,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43608 samples/s/p 1:00:43 } +2024-07-26 00:12:20,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 776/ 1625], loss: 1.185, per_step_time: 1470ms, lr: 3.0014398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:20,495 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43966 samples/s/p 1:00:38 } +2024-07-26 00:12:23,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 778/ 1625], loss: 1.340, per_step_time: 1472ms, lr: 2.9982812e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:23,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43390 samples/s/p 1:00:39 } +2024-07-26 00:12:26,394 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 780/ 1625], loss: 1.123, per_step_time: 1470ms, lr: 2.9951293e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:26,395 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.44018 samples/s/p 1:00:32 } +2024-07-26 00:12:29,345 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 782/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 2.9919756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:29,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43542 samples/s/p 1:00:32 } +2024-07-26 00:12:32,297 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 784/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 2.9888242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:32,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43285 samples/s/p 1:00:31 } +2024-07-26 00:12:35,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 786/ 1625], loss: 1.187, per_step_time: 1470ms, lr: 2.9856783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:35,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43889 samples/s/p 1:00:24 } +2024-07-26 00:12:38,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 788/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 2.9825324e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:38,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.8% |██████████████████████████████████████████ | 5.43316 samples/s/p 1:00:25 } +2024-07-26 00:12:41,150 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 790/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 2.9793891e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:41,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43274 samples/s/p 1:00:22 } +2024-07-26 00:12:44,100 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 792/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 2.9762482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:44,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43770 samples/s/p 1:00:16 } +2024-07-26 00:12:47,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 794/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 2.97311e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:47,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43474 samples/s/p 1:00:15 } +2024-07-26 00:12:50,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 796/ 1625], loss: 1.261, per_step_time: 1473ms, lr: 2.9699736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:50,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.42899 samples/s/p 1:00:16 } +2024-07-26 00:12:52,952 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 798/ 1625], loss: 1.240, per_step_time: 1469ms, lr: 2.96684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:52,952 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.44281 samples/s/p 1:00:04 } +2024-07-26 00:12:55,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 800/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 2.9637085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:55,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43305 samples/s/p 1:00:07 } +2024-07-26 00:12:58,855 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 802/ 1625], loss: 1.042, per_step_time: 1472ms, lr: 2.960579e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:12:58,855 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43447 samples/s/p 1:00:03 } +2024-07-26 00:13:01,807 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 804/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.9574521e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:01,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 84.9% |██████████████████████████████████████████ | 5.43267 samples/s/p 1:00:01 } +2024-07-26 00:13:04,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 806/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 2.954328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:04,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.42951 samples/s/p 1:00:01 } +2024-07-26 00:13:07,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 808/ 1625], loss: 1.087, per_step_time: 1473ms, lr: 2.9512053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:07,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43022 samples/s/p 0:59:57 } +2024-07-26 00:13:10,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 810/ 1625], loss: 1.199, per_step_time: 1470ms, lr: 2.9480843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:10,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.44148 samples/s/p 0:59:47 } +2024-07-26 00:13:13,613 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 812/ 1625], loss: 1.103, per_step_time: 1471ms, lr: 2.944967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:13,613 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43502 samples/s/p 0:59:48 } +2024-07-26 00:13:16,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 814/ 1625], loss: 1.246, per_step_time: 1474ms, lr: 2.941853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:16,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.42730 samples/s/p 0:59:50 } +2024-07-26 00:13:19,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 816/ 1625], loss: 1.147, per_step_time: 1473ms, lr: 2.9387393e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:19,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43065 samples/s/p 0:59:45 } +2024-07-26 00:13:22,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 818/ 1625], loss: 1.135, per_step_time: 1472ms, lr: 2.9356302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:22,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43344 samples/s/p 0:59:40 } +2024-07-26 00:13:25,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 820/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.9325206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:25,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.0% |██████████████████████████████████████████ | 5.43213 samples/s/p 0:59:38 } +2024-07-26 00:13:28,376 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 822/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 2.9294138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:28,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43415 samples/s/p 0:59:34 } +2024-07-26 00:13:31,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 824/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 2.926312e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:31,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43173 samples/s/p 0:59:33 } +2024-07-26 00:13:34,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 826/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.9232092e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:34,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43370 samples/s/p 0:59:28 } +2024-07-26 00:13:37,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 828/ 1625], loss: 1.355, per_step_time: 1473ms, lr: 2.9201092e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:37,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43088 samples/s/p 0:59:27 } +2024-07-26 00:13:40,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 830/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 2.9170133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:40,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43391 samples/s/p 0:59:22 } +2024-07-26 00:13:43,137 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 832/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 2.91392e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:43,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43229 samples/s/p 0:59:20 } +2024-07-26 00:13:46,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 834/ 1625], loss: 1.292, per_step_time: 1470ms, lr: 2.9108269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:46,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43867 samples/s/p 0:59:13 } +2024-07-26 00:13:49,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 836/ 1625], loss: 1.155, per_step_time: 1470ms, lr: 2.9077378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:49,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.1% |██████████████████████████████████████████ | 5.43918 samples/s/p 0:59:10 } +2024-07-26 00:13:51,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 838/ 1625], loss: 1.157, per_step_time: 1470ms, lr: 2.9046491e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:51,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43900 samples/s/p 0:59:07 } +2024-07-26 00:13:54,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 840/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 2.9015653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:54,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43520 samples/s/p 0:59:07 } +2024-07-26 00:13:57,883 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 842/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.8984814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:13:57,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43682 samples/s/p 0:59:03 } +2024-07-26 00:14:00,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 844/ 1625], loss: 1.302, per_step_time: 1473ms, lr: 2.8954005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:00,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43038 samples/s/p 0:59:04 } +2024-07-26 00:14:03,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 846/ 1625], loss: 1.261, per_step_time: 1471ms, lr: 2.8923228e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:03,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43648 samples/s/p 0:58:57 } +2024-07-26 00:14:06,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 848/ 1625], loss: 1.067, per_step_time: 1470ms, lr: 2.8892468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:06,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43882 samples/s/p 0:58:53 } +2024-07-26 00:14:09,685 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 850/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 2.8861737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:09,685 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.43789 samples/s/p 0:58:50 } +2024-07-26 00:14:12,639 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 852/ 1625], loss: 1.092, per_step_time: 1473ms, lr: 2.8831018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:12,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.2% |██████████████████████████████████████████ | 5.42899 samples/s/p 0:58:53 } +2024-07-26 00:14:15,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 854/ 1625], loss: 1.217, per_step_time: 1472ms, lr: 2.8800328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:15,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43327 samples/s/p 0:58:47 } +2024-07-26 00:14:18,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 856/ 1625], loss: 1.174, per_step_time: 1473ms, lr: 2.8769664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:18,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43045 samples/s/p 0:58:46 } +2024-07-26 00:14:21,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 858/ 1625], loss: 1.232, per_step_time: 1471ms, lr: 2.8739028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:21,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43839 samples/s/p 0:58:38 } +2024-07-26 00:14:24,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 860/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 2.8708405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:24,443 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43780 samples/s/p 0:58:36 } +2024-07-26 00:14:27,394 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 862/ 1625], loss: 1.150, per_step_time: 1471ms, lr: 2.8677819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:27,394 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43479 samples/s/p 0:58:35 } +2024-07-26 00:14:30,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 864/ 1625], loss: 1.125, per_step_time: 1471ms, lr: 2.864725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:30,345 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43497 samples/s/p 0:58:32 } +2024-07-26 00:14:33,295 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 866/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 2.861669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:33,295 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43592 samples/s/p 0:58:28 } +2024-07-26 00:14:36,247 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 868/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.8586173e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:36,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.3% |██████████████████████████████████████████ | 5.43198 samples/s/p 0:58:28 } +2024-07-26 00:14:39,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 870/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 2.8555673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:39,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43682 samples/s/p 0:58:22 } +2024-07-26 00:14:42,148 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 872/ 1625], loss: 1.303, per_step_time: 1472ms, lr: 2.8525174e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:42,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43408 samples/s/p 0:58:20 } +2024-07-26 00:14:45,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 874/ 1625], loss: 1.195, per_step_time: 1469ms, lr: 2.8494742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:45,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.44395 samples/s/p 0:58:11 } +2024-07-26 00:14:48,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 876/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 2.846431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:48,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43434 samples/s/p 0:58:14 } +2024-07-26 00:14:50,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 878/ 1625], loss: 1.235, per_step_time: 1471ms, lr: 2.8433897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:50,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43679 samples/s/p 0:58:10 } +2024-07-26 00:14:53,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 880/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 2.840351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:53,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43160 samples/s/p 0:58:10 } +2024-07-26 00:14:56,897 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 882/ 1625], loss: 1.040, per_step_time: 1471ms, lr: 2.8373138e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:56,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43787 samples/s/p 0:58:03 } +2024-07-26 00:14:59,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 884/ 1625], loss: 1.003, per_step_time: 1471ms, lr: 2.834281e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:14:59,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.4% |██████████████████████████████████████████ | 5.43637 samples/s/p 0:58:01 } +2024-07-26 00:15:02,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 886/ 1625], loss: 1.338, per_step_time: 1471ms, lr: 2.8312493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:02,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43525 samples/s/p 0:57:59 } +2024-07-26 00:15:05,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 888/ 1625], loss: 1.086, per_step_time: 1470ms, lr: 2.8282202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:05,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43876 samples/s/p 0:57:54 } +2024-07-26 00:15:08,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 890/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 2.8251925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:08,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43246 samples/s/p 0:57:55 } +2024-07-26 00:15:11,649 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 892/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 2.8221684e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:11,650 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43563 samples/s/p 0:57:50 } +2024-07-26 00:15:14,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 894/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 2.8191462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:14,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.44059 samples/s/p 0:57:44 } +2024-07-26 00:15:17,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 896/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.8161264e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:17,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43759 samples/s/p 0:57:43 } +2024-07-26 00:15:20,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 898/ 1625], loss: 1.000, per_step_time: 1469ms, lr: 2.8131085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:20,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.44317 samples/s/p 0:57:36 } +2024-07-26 00:15:23,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 900/ 1625], loss: 1.073, per_step_time: 1473ms, lr: 2.810094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:23,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.5% |██████████████████████████████████████████ | 5.43025 samples/s/p 0:57:42 } +2024-07-26 00:15:26,400 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 902/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.8070801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:26,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43141 samples/s/p 0:57:38 } +2024-07-26 00:15:29,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 904/ 1625], loss: 0.917, per_step_time: 1471ms, lr: 2.8040708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:29,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43648 samples/s/p 0:57:32 } +2024-07-26 00:15:32,300 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 906/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 2.801064e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:32,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43564 samples/s/p 0:57:29 } +2024-07-26 00:15:35,250 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 908/ 1625], loss: 1.063, per_step_time: 1470ms, lr: 2.7980554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:35,250 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43850 samples/s/p 0:57:25 } +2024-07-26 00:15:38,201 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 910/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 2.795052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:38,201 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43426 samples/s/p 0:57:24 } +2024-07-26 00:15:41,155 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 912/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 2.7920532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:41,156 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.42821 samples/s/p 0:57:25 } +2024-07-26 00:15:44,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 914/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.7890542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:44,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43249 samples/s/p 0:57:20 } +2024-07-26 00:15:47,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 916/ 1625], loss: 0.870, per_step_time: 1472ms, lr: 2.7860576e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:47,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43228 samples/s/p 0:57:17 } +2024-07-26 00:15:50,010 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 918/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 2.7830638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:50,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.6% |██████████████████████████████████████████ | 5.43642 samples/s/p 0:57:11 } +2024-07-26 00:15:52,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 920/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.7800718e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:52,961 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43684 samples/s/p 0:57:08 } +2024-07-26 00:15:55,911 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 922/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 2.7770823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:55,911 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43545 samples/s/p 0:57:06 } +2024-07-26 00:15:58,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 924/ 1625], loss: 1.066, per_step_time: 1472ms, lr: 2.7740953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:15:58,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43194 samples/s/p 0:57:05 } +2024-07-26 00:16:01,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 926/ 1625], loss: 1.031, per_step_time: 1472ms, lr: 2.771111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:01,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43414 samples/s/p 0:57:01 } +2024-07-26 00:16:04,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 928/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.7681276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:04,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43273 samples/s/p 0:56:59 } +2024-07-26 00:16:07,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 930/ 1625], loss: 0.997, per_step_time: 1472ms, lr: 2.7651486e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:07,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43471 samples/s/p 0:56:55 } +2024-07-26 00:16:10,667 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 932/ 1625], loss: 1.170, per_step_time: 1471ms, lr: 2.7621702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:10,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43771 samples/s/p 0:56:50 } +2024-07-26 00:16:13,621 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 934/ 1625], loss: 1.073, per_step_time: 1473ms, lr: 2.7591964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:13,621 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.7% |██████████████████████████████████████████ | 5.43071 samples/s/p 0:56:51 } +2024-07-26 00:16:16,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 936/ 1625], loss: 1.287, per_step_time: 1472ms, lr: 2.7562223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:16,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43180 samples/s/p 0:56:48 } +2024-07-26 00:16:19,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 938/ 1625], loss: 1.038, per_step_time: 1470ms, lr: 2.7532528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:19,522 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43911 samples/s/p 0:56:40 } +2024-07-26 00:16:22,472 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 940/ 1625], loss: 1.053, per_step_time: 1472ms, lr: 2.750283e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:22,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43463 samples/s/p 0:56:40 } +2024-07-26 00:16:25,431 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 942/ 1625], loss: 1.108, per_step_time: 1475ms, lr: 2.747317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:25,431 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.42085 samples/s/p 0:56:46 } +2024-07-26 00:16:28,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 944/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.744356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:28,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43235 samples/s/p 0:56:35 } +2024-07-26 00:16:31,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 946/ 1625], loss: 0.959, per_step_time: 1470ms, lr: 2.7413932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:31,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.44018 samples/s/p 0:56:28 } +2024-07-26 00:16:34,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 948/ 1625], loss: 0.966, per_step_time: 1471ms, lr: 2.738434e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:34,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.43677 samples/s/p 0:56:27 } +2024-07-26 00:16:37,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 950/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 2.735479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:37,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.8% |██████████████████████████████████████████ | 5.44157 samples/s/p 0:56:21 } +2024-07-26 00:16:40,180 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 952/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 2.732524e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:40,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43310 samples/s/p 0:56:23 } +2024-07-26 00:16:43,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 954/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.7295719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:43,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43113 samples/s/p 0:56:21 } +2024-07-26 00:16:46,084 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 956/ 1625], loss: 1.193, per_step_time: 1472ms, lr: 2.7266237e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:46,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43365 samples/s/p 0:56:17 } +2024-07-26 00:16:49,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 958/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 2.7236756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:49,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43204 samples/s/p 0:56:15 } +2024-07-26 00:16:51,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 960/ 1625], loss: 1.155, per_step_time: 1473ms, lr: 2.720732e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:51,990 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43029 samples/s/p 0:56:13 } +2024-07-26 00:16:54,939 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 962/ 1625], loss: 1.231, per_step_time: 1470ms, lr: 2.7177894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:54,939 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43867 samples/s/p 0:56:05 } +2024-07-26 00:16:57,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 964/ 1625], loss: 1.026, per_step_time: 1471ms, lr: 2.714848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:16:57,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.43514 samples/s/p 0:56:04 } +2024-07-26 00:17:00,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 966/ 1625], loss: 1.189, per_step_time: 1469ms, lr: 2.7119122e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:00,837 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 85.9% |██████████████████████████████████████████ | 5.44285 samples/s/p 0:55:57 } +2024-07-26 00:17:03,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 968/ 1625], loss: 0.983, per_step_time: 1472ms, lr: 2.7089773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:03,789 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.43213 samples/s/p 0:56:00 } +2024-07-26 00:17:06,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 970/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 2.7060437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:06,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.43670 samples/s/p 0:55:54 } +2024-07-26 00:17:09,693 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 972/ 1625], loss: 1.264, per_step_time: 1473ms, lr: 2.703113e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:09,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.42925 samples/s/p 0:55:56 } +2024-07-26 00:17:12,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 974/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 2.700185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:12,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |██████████████████████████████████████████ | 5.43718 samples/s/p 0:55:48 } +2024-07-26 00:17:15,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 976/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 2.6972593e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:15,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.43437 samples/s/p 0:55:47 } +2024-07-26 00:17:18,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 978/ 1625], loss: 1.108, per_step_time: 1472ms, lr: 2.6943355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:18,547 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.43243 samples/s/p 0:55:45 } +2024-07-26 00:17:21,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 980/ 1625], loss: 1.079, per_step_time: 1473ms, lr: 2.6914145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:21,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.42866 samples/s/p 0:55:45 } +2024-07-26 00:17:24,449 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 982/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 2.6884966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:24,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.0% |███████████████████████████████████████████ | 5.43824 samples/s/p 0:55:36 } +2024-07-26 00:17:27,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 984/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 2.6855796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:27,400 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43506 samples/s/p 0:55:35 } +2024-07-26 00:17:30,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 986/ 1625], loss: 1.115, per_step_time: 1474ms, lr: 2.6826654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:30,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.42652 samples/s/p 0:55:37 } +2024-07-26 00:17:33,311 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 988/ 1625], loss: 1.194, per_step_time: 1473ms, lr: 2.679756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:33,311 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.42770 samples/s/p 0:55:34 } +2024-07-26 00:17:36,262 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 990/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 2.6768446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:36,262 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43468 samples/s/p 0:55:26 } +2024-07-26 00:17:39,212 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 992/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 2.673938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:39,213 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43563 samples/s/p 0:55:23 } +2024-07-26 00:17:42,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 994/ 1625], loss: 1.203, per_step_time: 1471ms, lr: 2.671035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:42,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43699 samples/s/p 0:55:19 } +2024-07-26 00:17:45,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 996/ 1625], loss: 1.190, per_step_time: 1474ms, lr: 2.668131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:45,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.42632 samples/s/p 0:55:23 } +2024-07-26 00:17:48,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 998/ 1625], loss: 1.212, per_step_time: 1471ms, lr: 2.6652315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:48,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.1% |███████████████████████████████████████████ | 5.43772 samples/s/p 0:55:13 } +2024-07-26 00:17:51,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1000/ 1625], loss: 1.319, per_step_time: 1469ms, lr: 2.662336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:17:51,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.44255 samples/s/p 0:55:07 } +2024-07-26 00:17:51,014 - 
mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-26 00:18:27,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1002/ 1625], loss: 1.150, per_step_time: 1476ms, lr: 2.659439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:27,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.41658 samples/s/p 0:55:20 } +2024-07-26 00:18:29,988 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1004/ 1625], loss: 1.076, per_step_time: 1474ms, lr: 2.656548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:29,988 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.42558 samples/s/p 0:55:11 } +2024-07-26 00:18:32,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1006/ 1625], loss: 1.134, per_step_time: 1469ms, lr: 2.653658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:32,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.44526 samples/s/p 0:54:56 } +2024-07-26 00:18:35,883 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1008/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.6507678e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:35,883 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.43681 samples/s/p 0:54:58 } +2024-07-26 00:18:38,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1010/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 2.6478838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:38,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% 
|███████████████████████████████████████████ | 5.43298 samples/s/p 0:54:58 } +2024-07-26 00:18:41,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1012/ 1625], loss: 0.992, per_step_time: 1471ms, lr: 2.6450007e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:41,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.43568 samples/s/p 0:54:53 } +2024-07-26 00:18:44,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1014/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 2.6421183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:44,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.2% |███████████████████████████████████████████ | 5.43775 samples/s/p 0:54:49 } +2024-07-26 00:18:47,686 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1016/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 2.639241e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:47,686 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.43328 samples/s/p 0:54:49 } +2024-07-26 00:18:50,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1018/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 2.6363648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:50,634 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.44079 samples/s/p 0:54:41 } +2024-07-26 00:18:53,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1020/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 2.633492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:53,585 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% 
|███████████████████████████████████████████ | 5.43514 samples/s/p 0:54:42 } +2024-07-26 00:18:56,532 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1022/ 1625], loss: 1.070, per_step_time: 1470ms, lr: 2.6306209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:56,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.43992 samples/s/p 0:54:36 } +2024-07-26 00:18:59,484 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1024/ 1625], loss: 1.351, per_step_time: 1472ms, lr: 2.6277507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:18:59,485 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.43255 samples/s/p 0:54:38 } +2024-07-26 00:19:02,434 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1026/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 2.6248856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:02,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.43625 samples/s/p 0:54:32 } +2024-07-26 00:19:05,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1028/ 1625], loss: 1.162, per_step_time: 1472ms, lr: 2.6220205e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:05,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% |███████████████████████████████████████████ | 5.43400 samples/s/p 0:54:31 } +2024-07-26 00:19:08,337 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1030/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.619159e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:08,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.3% 
|███████████████████████████████████████████ | 5.43369 samples/s/p 0:54:28 } +2024-07-26 00:19:11,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1032/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 2.616301e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:11,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43139 samples/s/p 0:54:26 } +2024-07-26 00:19:14,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1034/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 2.613442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:14,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43195 samples/s/p 0:54:23 } +2024-07-26 00:19:17,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1036/ 1625], loss: 1.320, per_step_time: 1472ms, lr: 2.6105872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:17,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43279 samples/s/p 0:54:20 } +2024-07-26 00:19:20,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1038/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 2.6077369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:20,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43326 samples/s/p 0:54:16 } +2024-07-26 00:19:23,099 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1040/ 1625], loss: 1.152, per_step_time: 1473ms, lr: 2.6048856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:23,099 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% 
|███████████████████████████████████████████ | 5.43098 samples/s/p 0:54:15 } +2024-07-26 00:19:26,051 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1042/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 2.6020389e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:26,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43210 samples/s/p 0:54:11 } +2024-07-26 00:19:29,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1044/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 2.5991944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:29,001 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43661 samples/s/p 0:54:06 } +2024-07-26 00:19:31,949 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1046/ 1625], loss: 1.062, per_step_time: 1470ms, lr: 2.5963493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:31,949 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.44044 samples/s/p 0:54:00 } +2024-07-26 00:19:34,902 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1048/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 2.593511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:34,902 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.4% |███████████████████████████████████████████ | 5.43067 samples/s/p 0:54:03 } +2024-07-26 00:19:37,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1050/ 1625], loss: 1.452, per_step_time: 1471ms, lr: 2.590673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:37,851 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% 
|███████████████████████████████████████████ | 5.43762 samples/s/p 0:53:56 } +2024-07-26 00:19:40,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1052/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 2.5878362e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:40,805 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.42874 samples/s/p 0:53:59 } +2024-07-26 00:19:43,758 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1054/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 2.585004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:43,758 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.43139 samples/s/p 0:53:54 } +2024-07-26 00:19:46,709 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1056/ 1625], loss: 1.037, per_step_time: 1472ms, lr: 2.5821737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:46,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.43450 samples/s/p 0:53:49 } +2024-07-26 00:19:49,673 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1058/ 1625], loss: 1.155, per_step_time: 1478ms, lr: 2.5793431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:49,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.41113 samples/s/p 0:54:00 } +2024-07-26 00:19:52,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1060/ 1625], loss: 1.268, per_step_time: 1472ms, lr: 2.5765178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:52,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% 
|███████████████████████████████████████████ | 5.43210 samples/s/p 0:53:45 } +2024-07-26 00:19:55,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1062/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 2.573695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:55,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.43992 samples/s/p 0:53:37 } +2024-07-26 00:19:58,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1064/ 1625], loss: 1.249, per_step_time: 1472ms, lr: 2.5708741e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:19:58,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.5% |███████████████████████████████████████████ | 5.43367 samples/s/p 0:53:38 } +2024-07-26 00:20:01,477 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1066/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 2.568054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:01,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.43505 samples/s/p 0:53:34 } +2024-07-26 00:20:04,432 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1068/ 1625], loss: 1.254, per_step_time: 1474ms, lr: 2.5652375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:04,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.42606 samples/s/p 0:53:37 } +2024-07-26 00:20:07,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1070/ 1625], loss: 1.088, per_step_time: 1472ms, lr: 2.5624233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:07,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% 
|███████████████████████████████████████████ | 5.43374 samples/s/p 0:53:29 } +2024-07-26 00:20:10,346 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1072/ 1625], loss: 1.112, per_step_time: 1477ms, lr: 2.5596119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:10,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.41532 samples/s/p 0:53:37 } +2024-07-26 00:20:13,296 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1074/ 1625], loss: 1.253, per_step_time: 1471ms, lr: 2.556802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:13,296 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.43653 samples/s/p 0:53:22 } +2024-07-26 00:20:16,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1076/ 1625], loss: 1.187, per_step_time: 1472ms, lr: 2.5539966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:16,248 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.43391 samples/s/p 0:53:20 } +2024-07-26 00:20:19,196 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1078/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 2.5511913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:19,197 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% |███████████████████████████████████████████ | 5.43929 samples/s/p 0:53:14 } +2024-07-26 00:20:22,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1080/ 1625], loss: 1.266, per_step_time: 1472ms, lr: 2.5483885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:22,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.6% 
|███████████████████████████████████████████ | 5.43193 samples/s/p 0:53:15 } +2024-07-26 00:20:25,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1082/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 2.54559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:25,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.43003 samples/s/p 0:53:14 } +2024-07-26 00:20:28,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1084/ 1625], loss: 1.008, per_step_time: 1469ms, lr: 2.5427914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:28,050 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.44255 samples/s/p 0:53:03 } +2024-07-26 00:20:31,003 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1086/ 1625], loss: 1.048, per_step_time: 1473ms, lr: 2.5399972e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:31,003 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.43087 samples/s/p 0:53:07 } +2024-07-26 00:20:33,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1088/ 1625], loss: 1.269, per_step_time: 1472ms, lr: 2.5372049e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:33,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.43235 samples/s/p 0:53:03 } +2024-07-26 00:20:36,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1090/ 1625], loss: 1.133, per_step_time: 1470ms, lr: 2.5344134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:36,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% 
|███████████████████████████████████████████ | 5.43964 samples/s/p 0:52:56 } +2024-07-26 00:20:39,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1092/ 1625], loss: 1.072, per_step_time: 1474ms, lr: 2.5316276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:39,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.42643 samples/s/p 0:53:01 } +2024-07-26 00:20:42,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1094/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 2.5288423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:42,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.43359 samples/s/p 0:52:54 } +2024-07-26 00:20:45,770 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1096/ 1625], loss: 1.088, per_step_time: 1476ms, lr: 2.5260574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:45,771 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.7% |███████████████████████████████████████████ | 5.41802 samples/s/p 0:53:00 } +2024-07-26 00:20:48,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1098/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 2.523278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:48,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.43221 samples/s/p 0:52:49 } +2024-07-26 00:20:51,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1100/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 2.5204995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:51,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% 
|███████████████████████████████████████████ | 5.43134 samples/s/p 0:52:46 } +2024-07-26 00:20:54,631 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1102/ 1625], loss: 1.340, per_step_time: 1473ms, lr: 2.5177233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:54,631 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.42852 samples/s/p 0:52:45 } +2024-07-26 00:20:57,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1104/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 2.514951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:20:57,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.43479 samples/s/p 0:52:38 } +2024-07-26 00:21:00,533 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1106/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 2.512179e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:00,533 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.43428 samples/s/p 0:52:36 } +2024-07-26 00:21:03,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1108/ 1625], loss: 1.153, per_step_time: 1473ms, lr: 2.50941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:03,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.42962 samples/s/p 0:52:36 } +2024-07-26 00:21:06,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1110/ 1625], loss: 1.096, per_step_time: 1473ms, lr: 2.5066433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:06,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% 
|███████████████████████████████████████████ | 5.43102 samples/s/p 0:52:32 } +2024-07-26 00:21:09,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1112/ 1625], loss: 1.253, per_step_time: 1469ms, lr: 2.5038803e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:09,386 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.8% |███████████████████████████████████████████ | 5.44448 samples/s/p 0:52:21 } +2024-07-26 00:21:12,336 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1114/ 1625], loss: 1.314, per_step_time: 1471ms, lr: 2.501119e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:12,337 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43638 samples/s/p 0:52:23 } +2024-07-26 00:21:15,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1116/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 2.4983597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:15,288 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43405 samples/s/p 0:52:21 } +2024-07-26 00:21:18,241 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1118/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 2.4956034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:18,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.42922 samples/s/p 0:52:21 } +2024-07-26 00:21:21,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1120/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 2.49285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:21,195 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% 
|███████████████████████████████████████████ | 5.43118 samples/s/p 0:52:17 } +2024-07-26 00:21:24,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1122/ 1625], loss: 1.030, per_step_time: 1474ms, lr: 2.4900962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:24,150 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.42737 samples/s/p 0:52:16 } +2024-07-26 00:21:27,102 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1124/ 1625], loss: 1.075, per_step_time: 1473ms, lr: 2.487347e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:27,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43098 samples/s/p 0:52:11 } +2024-07-26 00:21:30,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1126/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.4846013e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:30,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43203 samples/s/p 0:52:08 } +2024-07-26 00:21:33,004 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1128/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 2.4818555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:33,004 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 86.9% |███████████████████████████████████████████ | 5.43823 samples/s/p 0:52:01 } +2024-07-26 00:21:35,958 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1130/ 1625], loss: 1.253, per_step_time: 1474ms, lr: 2.4791148e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:35,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% 
|███████████████████████████████████████████ | 5.42738 samples/s/p 0:52:04 } +2024-07-26 00:21:38,909 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1132/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 2.4763742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:38,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43569 samples/s/p 0:51:57 } +2024-07-26 00:21:41,862 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1134/ 1625], loss: 1.130, per_step_time: 1473ms, lr: 2.4736355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:41,862 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43041 samples/s/p 0:51:57 } +2024-07-26 00:21:44,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1136/ 1625], loss: 1.156, per_step_time: 1473ms, lr: 2.4709016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:44,815 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43108 samples/s/p 0:51:53 } +2024-07-26 00:21:47,767 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1138/ 1625], loss: 1.050, per_step_time: 1472ms, lr: 2.468169e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:47,767 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43330 samples/s/p 0:51:49 } +2024-07-26 00:21:50,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1140/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 2.4654378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:50,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% 
|███████████████████████████████████████████ | 5.43231 samples/s/p 0:51:47 } +2024-07-26 00:21:53,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1142/ 1625], loss: 1.329, per_step_time: 1473ms, lr: 2.462711e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:53,673 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43073 samples/s/p 0:51:45 } +2024-07-26 00:21:56,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1144/ 1625], loss: 0.891, per_step_time: 1471ms, lr: 2.4599851e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:56,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.0% |███████████████████████████████████████████ | 5.43774 samples/s/p 0:51:38 } +2024-07-26 00:21:59,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1146/ 1625], loss: 1.090, per_step_time: 1472ms, lr: 2.4572619e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:21:59,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.43394 samples/s/p 0:51:37 } +2024-07-26 00:22:02,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1148/ 1625], loss: 1.045, per_step_time: 1473ms, lr: 2.454542e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:02,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.42955 samples/s/p 0:51:37 } +2024-07-26 00:22:05,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1150/ 1625], loss: 1.039, per_step_time: 1470ms, lr: 2.451823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:05,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% 
|███████████████████████████████████████████ | 5.44063 samples/s/p 0:51:27 } +2024-07-26 00:22:08,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1152/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.4491073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:08,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.43640 samples/s/p 0:51:27 } +2024-07-26 00:22:11,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1154/ 1625], loss: 1.103, per_step_time: 1474ms, lr: 2.4463939e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:11,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.42531 samples/s/p 0:51:30 } +2024-07-26 00:22:14,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1156/ 1625], loss: 0.980, per_step_time: 1470ms, lr: 2.4436843e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:14,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.44034 samples/s/p 0:51:19 } +2024-07-26 00:22:17,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1158/ 1625], loss: 1.250, per_step_time: 1471ms, lr: 2.4409746e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:17,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% |███████████████████████████████████████████ | 5.43572 samples/s/p 0:51:18 } +2024-07-26 00:22:20,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1160/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 2.438269e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:20,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.1% 
|███████████████████████████████████████████ | 5.43349 samples/s/p 0:51:17 } +2024-07-26 00:22:23,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1162/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 2.4355654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:23,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43622 samples/s/p 0:51:12 } +2024-07-26 00:22:26,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1164/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 2.4328629e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:26,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43381 samples/s/p 0:51:11 } +2024-07-26 00:22:29,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1166/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.4301635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:29,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43430 samples/s/p 0:51:07 } +2024-07-26 00:22:32,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1168/ 1625], loss: 1.249, per_step_time: 1474ms, lr: 2.427468e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:32,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.42490 samples/s/p 0:51:10 } +2024-07-26 00:22:34,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1170/ 1625], loss: 1.032, per_step_time: 1470ms, lr: 2.424775e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:34,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% 
|███████████████████████████████████████████ | 5.43929 samples/s/p 0:50:59 } +2024-07-26 00:22:37,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1172/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.4220817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:37,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43290 samples/s/p 0:50:59 } +2024-07-26 00:22:40,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1174/ 1625], loss: 1.028, per_step_time: 1470ms, lr: 2.4193941e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:40,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43949 samples/s/p 0:50:53 } +2024-07-26 00:22:43,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1176/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 2.416707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:43,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.44016 samples/s/p 0:50:49 } +2024-07-26 00:22:46,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1178/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 2.4140209e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:46,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.2% |███████████████████████████████████████████ | 5.43308 samples/s/p 0:50:50 } +2024-07-26 00:22:49,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1180/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 2.41134e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:49,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% 
|███████████████████████████████████████████ | 5.43633 samples/s/p 0:50:46 } +2024-07-26 00:22:52,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1182/ 1625], loss: 1.213, per_step_time: 1469ms, lr: 2.4086607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:52,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.44300 samples/s/p 0:50:39 } +2024-07-26 00:22:55,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1184/ 1625], loss: 1.029, per_step_time: 1472ms, lr: 2.4059823e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:55,639 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.43454 samples/s/p 0:50:41 } +2024-07-26 00:22:58,596 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1186/ 1625], loss: 1.133, per_step_time: 1475ms, lr: 2.4033093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:22:58,596 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.42296 samples/s/p 0:50:44 } +2024-07-26 00:23:01,547 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1188/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 2.4006358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:01,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.43406 samples/s/p 0:50:35 } +2024-07-26 00:23:04,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1190/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.3979662e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:04,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% 
|███████████████████████████████████████████ | 5.43270 samples/s/p 0:50:33 } +2024-07-26 00:23:07,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1192/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 2.3952991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:07,451 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.43559 samples/s/p 0:50:28 } +2024-07-26 00:23:10,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1194/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 2.3926336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:10,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.3% |███████████████████████████████████████████ | 5.43620 samples/s/p 0:50:25 } +2024-07-26 00:23:13,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1196/ 1625], loss: 1.041, per_step_time: 1472ms, lr: 2.3899709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:13,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43453 samples/s/p 0:50:23 } +2024-07-26 00:23:16,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1198/ 1625], loss: 0.980, per_step_time: 1472ms, lr: 2.38731e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:16,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43441 samples/s/p 0:50:20 } +2024-07-26 00:23:19,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1200/ 1625], loss: 1.066, per_step_time: 1484ms, lr: 2.3846521e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:19,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% 
|███████████████████████████████████████████ | 5.38774 samples/s/p 0:50:43 } +2024-07-26 00:23:22,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1202/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 2.3819962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:22,232 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43317 samples/s/p 0:50:15 } +2024-07-26 00:23:25,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1204/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 2.3793439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:25,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43918 samples/s/p 0:50:09 } +2024-07-26 00:23:28,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1206/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 2.3766931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:28,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43672 samples/s/p 0:50:07 } +2024-07-26 00:23:31,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1208/ 1625], loss: 1.045, per_step_time: 1472ms, lr: 2.374045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:31,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% |███████████████████████████████████████████ | 5.43421 samples/s/p 0:50:06 } +2024-07-26 00:23:34,034 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1210/ 1625], loss: 1.250, per_step_time: 1472ms, lr: 2.3713997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:34,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.4% 
|███████████████████████████████████████████ | 5.43156 samples/s/p 0:50:04 } +2024-07-26 00:23:36,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1212/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 2.3687567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:36,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43770 samples/s/p 0:49:58 } +2024-07-26 00:23:39,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1214/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 2.3661146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:39,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43123 samples/s/p 0:49:58 } +2024-07-26 00:23:42,887 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1216/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 2.363476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:42,888 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43333 samples/s/p 0:49:54 } +2024-07-26 00:23:45,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1218/ 1625], loss: 1.226, per_step_time: 1472ms, lr: 2.3608425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:45,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43320 samples/s/p 0:49:51 } +2024-07-26 00:23:48,793 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1220/ 1625], loss: 1.270, per_step_time: 1473ms, lr: 2.3582083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:48,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% 
|███████████████████████████████████████████ | 5.42925 samples/s/p 0:49:51 } +2024-07-26 00:23:51,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1222/ 1625], loss: 1.251, per_step_time: 1470ms, lr: 2.3555756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:51,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43918 samples/s/p 0:49:42 } +2024-07-26 00:23:54,693 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1224/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 2.3529483e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:54,694 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.43370 samples/s/p 0:49:42 } +2024-07-26 00:23:57,648 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1226/ 1625], loss: 1.151, per_step_time: 1474ms, lr: 2.3503226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:23:57,649 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.5% |███████████████████████████████████████████ | 5.42685 samples/s/p 0:49:43 } +2024-07-26 00:24:00,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1228/ 1625], loss: 1.219, per_step_time: 1473ms, lr: 2.3476969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:00,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.42890 samples/s/p 0:49:39 } +2024-07-26 00:24:03,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1230/ 1625], loss: 1.210, per_step_time: 1472ms, lr: 2.3450757e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:03,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% 
|███████████████████████████████████████████ | 5.43144 samples/s/p 0:49:35 } +2024-07-26 00:24:06,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1232/ 1625], loss: 1.229, per_step_time: 1472ms, lr: 2.3424568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:06,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.43385 samples/s/p 0:49:31 } +2024-07-26 00:24:09,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1234/ 1625], loss: 1.236, per_step_time: 1470ms, lr: 2.3398406e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:09,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.44150 samples/s/p 0:49:23 } +2024-07-26 00:24:12,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1236/ 1625], loss: 0.972, per_step_time: 1470ms, lr: 2.3372272e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:12,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.43918 samples/s/p 0:49:22 } +2024-07-26 00:24:15,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1238/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 2.3346147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:15,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.43849 samples/s/p 0:49:19 } +2024-07-26 00:24:18,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1240/ 1625], loss: 1.348, per_step_time: 1472ms, lr: 2.3320054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:18,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% 
|███████████████████████████████████████████ | 5.43278 samples/s/p 0:49:19 } +2024-07-26 00:24:21,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1242/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 2.3293978e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:21,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.6% |███████████████████████████████████████████ | 5.43119 samples/s/p 0:49:17 } +2024-07-26 00:24:24,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1244/ 1625], loss: 1.309, per_step_time: 1472ms, lr: 2.326794e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:24,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43230 samples/s/p 0:49:14 } +2024-07-26 00:24:27,160 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1246/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 2.3241914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:27,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43595 samples/s/p 0:49:09 } +2024-07-26 00:24:30,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1248/ 1625], loss: 1.277, per_step_time: 1474ms, lr: 2.3215916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:30,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.42583 samples/s/p 0:49:11 } +2024-07-26 00:24:33,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1250/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 2.3189946e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:33,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% 
|███████████████████████████████████████████ | 5.43225 samples/s/p 0:49:05 } +2024-07-26 00:24:36,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1252/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 2.3164002e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:36,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43288 samples/s/p 0:49:02 } +2024-07-26 00:24:38,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1254/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 2.3138073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:38,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43507 samples/s/p 0:48:57 } +2024-07-26 00:24:41,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1256/ 1625], loss: 1.316, per_step_time: 1474ms, lr: 2.3112189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:41,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.42563 samples/s/p 0:49:00 } +2024-07-26 00:24:44,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1258/ 1625], loss: 0.945, per_step_time: 1472ms, lr: 2.3086304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:44,880 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.7% |███████████████████████████████████████████ | 5.43239 samples/s/p 0:48:53 } +2024-07-26 00:24:47,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1260/ 1625], loss: 1.120, per_step_time: 1470ms, lr: 2.3060452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:47,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% 
|███████████████████████████████████████████ | 5.44042 samples/s/p 0:48:46 } +2024-07-26 00:24:50,782 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1262/ 1625], loss: 1.269, per_step_time: 1474ms, lr: 2.3034638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:50,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.42694 samples/s/p 0:48:50 } +2024-07-26 00:24:53,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1264/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 2.3008822e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:53,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.43325 samples/s/p 0:48:44 } +2024-07-26 00:24:56,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1266/ 1625], loss: 1.252, per_step_time: 1471ms, lr: 2.298304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:56,684 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.43744 samples/s/p 0:48:39 } +2024-07-26 00:24:59,634 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1268/ 1625], loss: 1.152, per_step_time: 1472ms, lr: 2.295731e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:24:59,635 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.43439 samples/s/p 0:48:37 } +2024-07-26 00:25:02,583 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1270/ 1625], loss: 0.994, per_step_time: 1470ms, lr: 2.2931574e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:02,583 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% 
|███████████████████████████████████████████ | 5.43901 samples/s/p 0:48:32 } +2024-07-26 00:25:05,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1272/ 1625], loss: 1.139, per_step_time: 1469ms, lr: 2.290587e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:05,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.44428 samples/s/p 0:48:26 } +2024-07-26 00:25:08,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1274/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 2.2880185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:08,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.8% |███████████████████████████████████████████ | 5.43796 samples/s/p 0:48:26 } +2024-07-26 00:25:11,433 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1276/ 1625], loss: 1.382, per_step_time: 1473ms, lr: 2.2854533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:11,433 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.42869 samples/s/p 0:48:28 } +2024-07-26 00:25:14,384 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1278/ 1625], loss: 1.060, per_step_time: 1472ms, lr: 2.2828908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:14,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.43470 samples/s/p 0:48:22 } +2024-07-26 00:25:17,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1280/ 1625], loss: 1.104, per_step_time: 1469ms, lr: 2.28033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:17,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% 
|███████████████████████████████████████████ | 5.44292 samples/s/p 0:48:15 } +2024-07-26 00:25:20,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1282/ 1625], loss: 1.224, per_step_time: 1470ms, lr: 2.2777717e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:20,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.43917 samples/s/p 0:48:14 } +2024-07-26 00:25:23,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1284/ 1625], loss: 1.165, per_step_time: 1471ms, lr: 2.275216e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:23,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.43693 samples/s/p 0:48:12 } +2024-07-26 00:25:26,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1286/ 1625], loss: 1.319, per_step_time: 1473ms, lr: 2.2726622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:26,184 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.42797 samples/s/p 0:48:14 } +2024-07-26 00:25:29,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1288/ 1625], loss: 1.039, per_step_time: 1471ms, lr: 2.2701108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:29,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% |███████████████████████████████████████████ | 5.43596 samples/s/p 0:48:07 } +2024-07-26 00:25:32,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1290/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 2.267563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:32,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 87.9% 
|███████████████████████████████████████████ | 5.43833 samples/s/p 0:48:03 } +2024-07-26 00:25:35,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1292/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 2.265017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:35,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.43674 samples/s/p 0:48:01 } +2024-07-26 00:25:37,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1294/ 1625], loss: 1.176, per_step_time: 1472ms, lr: 2.2624724e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:37,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.43475 samples/s/p 0:47:59 } +2024-07-26 00:25:40,940 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1296/ 1625], loss: 1.243, per_step_time: 1474ms, lr: 2.2599315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:40,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.42506 samples/s/p 0:48:01 } +2024-07-26 00:25:43,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1298/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 2.2573931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:43,890 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |███████████████████████████████████████████ | 5.43678 samples/s/p 0:47:52 } +2024-07-26 00:25:46,841 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1300/ 1625], loss: 1.195, per_step_time: 1472ms, lr: 2.254859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:46,841 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% 
|████████████████████████████████████████████ | 5.43436 samples/s/p 0:47:50 } +2024-07-26 00:25:49,795 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1302/ 1625], loss: 1.332, per_step_time: 1473ms, lr: 2.2523225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:49,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.42913 samples/s/p 0:47:50 } +2024-07-26 00:25:52,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1304/ 1625], loss: 0.976, per_step_time: 1471ms, lr: 2.2497911e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:52,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.43525 samples/s/p 0:47:44 } +2024-07-26 00:25:55,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1306/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 2.2472648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:55,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.43227 samples/s/p 0:47:42 } +2024-07-26 00:25:58,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1308/ 1625], loss: 1.186, per_step_time: 1470ms, lr: 2.244736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:25:58,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.0% |████████████████████████████████████████████ | 5.44131 samples/s/p 0:47:35 } +2024-07-26 00:26:01,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1310/ 1625], loss: 1.267, per_step_time: 1475ms, lr: 2.2422114e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:01,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% 
|████████████████████████████████████████████ | 5.42091 samples/s/p 0:47:42 } +2024-07-26 00:26:04,558 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1312/ 1625], loss: 1.190, per_step_time: 1473ms, lr: 2.239692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:04,558 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.43039 samples/s/p 0:47:35 } +2024-07-26 00:26:07,509 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1314/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 2.237171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:07,510 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.43353 samples/s/p 0:47:30 } +2024-07-26 00:26:10,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1316/ 1625], loss: 1.257, per_step_time: 1474ms, lr: 2.234656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:10,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.42406 samples/s/p 0:47:32 } +2024-07-26 00:26:13,418 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1318/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 2.2321428e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:13,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.43221 samples/s/p 0:47:25 } +2024-07-26 00:26:16,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1320/ 1625], loss: 1.291, per_step_time: 1472ms, lr: 2.2296304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:16,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% 
|████████████████████████████████████████████ | 5.43186 samples/s/p 0:47:22 } +2024-07-26 00:26:19,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1322/ 1625], loss: 1.075, per_step_time: 1474ms, lr: 2.2271213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:19,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.42530 samples/s/p 0:47:22 } +2024-07-26 00:26:22,281 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1324/ 1625], loss: 1.172, per_step_time: 1473ms, lr: 2.224614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:22,281 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.1% |████████████████████████████████████████████ | 5.43069 samples/s/p 0:47:17 } +2024-07-26 00:26:25,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1326/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 2.2221093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:25,235 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.42985 samples/s/p 0:47:14 } +2024-07-26 00:26:28,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1328/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 2.2196073e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:28,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43124 samples/s/p 0:47:11 } +2024-07-26 00:26:31,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1330/ 1625], loss: 1.076, per_step_time: 1474ms, lr: 2.217108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:31,143 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% 
|████████████████████████████████████████████ | 5.42648 samples/s/p 0:47:10 } +2024-07-26 00:26:34,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1332/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 2.21461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:34,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43485 samples/s/p 0:47:03 } +2024-07-26 00:26:37,043 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1334/ 1625], loss: 1.391, per_step_time: 1471ms, lr: 2.2121158e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:37,043 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43708 samples/s/p 0:46:59 } +2024-07-26 00:26:39,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1336/ 1625], loss: 1.094, per_step_time: 1471ms, lr: 2.2096242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:39,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43518 samples/s/p 0:46:57 } +2024-07-26 00:26:42,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1338/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 2.2071342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:42,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% |████████████████████████████████████████████ | 5.43478 samples/s/p 0:46:54 } +2024-07-26 00:26:45,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1340/ 1625], loss: 1.295, per_step_time: 1472ms, lr: 2.204648e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:45,897 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.2% 
|████████████████████████████████████████████ | 5.43332 samples/s/p 0:46:52 } +2024-07-26 00:26:48,845 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1342/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 2.2021622e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:48,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43879 samples/s/p 0:46:46 } +2024-07-26 00:26:51,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1344/ 1625], loss: 1.084, per_step_time: 1473ms, lr: 2.1996816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:51,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.42963 samples/s/p 0:46:48 } +2024-07-26 00:26:54,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1346/ 1625], loss: 1.029, per_step_time: 1472ms, lr: 2.1971996e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:54,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43443 samples/s/p 0:46:42 } +2024-07-26 00:26:57,702 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1348/ 1625], loss: 1.028, per_step_time: 1472ms, lr: 2.1947226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:26:57,703 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43295 samples/s/p 0:46:40 } +2024-07-26 00:27:00,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1350/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 2.192249e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:00,653 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% 
|████████████████████████████████████████████ | 5.43493 samples/s/p 0:46:36 } +2024-07-26 00:27:03,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1352/ 1625], loss: 1.070, per_step_time: 1472ms, lr: 2.1897754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:03,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43475 samples/s/p 0:46:33 } +2024-07-26 00:27:06,554 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1354/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.1873045e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:06,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43588 samples/s/p 0:46:30 } +2024-07-26 00:27:09,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1356/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 2.1848386e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:09,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.3% |████████████████████████████████████████████ | 5.43579 samples/s/p 0:46:27 } +2024-07-26 00:27:12,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1358/ 1625], loss: 1.043, per_step_time: 1470ms, lr: 2.182372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:12,454 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43956 samples/s/p 0:46:22 } +2024-07-26 00:27:15,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1360/ 1625], loss: 1.318, per_step_time: 1470ms, lr: 2.1799106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:15,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% 
|████████████████████████████████████████████ | 5.44202 samples/s/p 0:46:18 } +2024-07-26 00:27:18,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1362/ 1625], loss: 1.298, per_step_time: 1472ms, lr: 2.1774501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:18,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43376 samples/s/p 0:46:19 } +2024-07-26 00:27:21,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1364/ 1625], loss: 1.409, per_step_time: 1472ms, lr: 2.1749913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:21,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43396 samples/s/p 0:46:16 } +2024-07-26 00:27:24,255 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1366/ 1625], loss: 1.025, per_step_time: 1472ms, lr: 2.1725377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:24,255 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43441 samples/s/p 0:46:13 } +2024-07-26 00:27:27,208 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1368/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 2.1700848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:27,208 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43059 samples/s/p 0:46:12 } +2024-07-26 00:27:30,161 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1370/ 1625], loss: 1.246, per_step_time: 1473ms, lr: 2.1676337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:30,162 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% 
|████████████████████████████████████████████ | 5.42938 samples/s/p 0:46:10 } +2024-07-26 00:27:33,110 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1372/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 2.1651854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:33,111 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.4% |████████████████████████████████████████████ | 5.43837 samples/s/p 0:46:02 } +2024-07-26 00:27:36,060 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1374/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 2.1627402e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:36,060 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43762 samples/s/p 0:46:00 } +2024-07-26 00:27:39,012 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1376/ 1625], loss: 1.118, per_step_time: 1472ms, lr: 2.160297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:39,012 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43358 samples/s/p 0:45:59 } +2024-07-26 00:27:41,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1378/ 1625], loss: 1.070, per_step_time: 1471ms, lr: 2.1578562e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:41,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43508 samples/s/p 0:45:55 } +2024-07-26 00:27:44,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1380/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 2.1554192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:44,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% 
|████████████████████████████████████████████ | 5.43176 samples/s/p 0:45:54 } +2024-07-26 00:27:47,866 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1382/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 2.1529827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:47,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43525 samples/s/p 0:45:49 } +2024-07-26 00:27:50,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1384/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 2.1505498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:50,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43195 samples/s/p 0:45:48 } +2024-07-26 00:27:53,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1386/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 2.1481196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:53,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.42936 samples/s/p 0:45:46 } +2024-07-26 00:27:56,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1388/ 1625], loss: 1.000, per_step_time: 1471ms, lr: 2.1456926e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:56,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.5% |████████████████████████████████████████████ | 5.43481 samples/s/p 0:45:40 } +2024-07-26 00:27:59,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1390/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 2.1432647e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:27:59,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% 
|████████████████████████████████████████████ | 5.44080 samples/s/p 0:45:34 } +2024-07-26 00:28:02,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1392/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 2.1408423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:02,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.43398 samples/s/p 0:45:35 } +2024-07-26 00:28:05,573 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1394/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 2.1384217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:05,573 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.43655 samples/s/p 0:45:31 } +2024-07-26 00:28:08,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1396/ 1625], loss: 1.053, per_step_time: 1473ms, lr: 2.1360033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:08,527 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.42959 samples/s/p 0:45:31 } +2024-07-26 00:28:11,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1398/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 2.1335868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:11,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.43769 samples/s/p 0:45:24 } +2024-07-26 00:28:14,426 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1400/ 1625], loss: 1.095, per_step_time: 1471ms, lr: 2.1311748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:14,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% 
|████████████████████████████████████████████ | 5.43558 samples/s/p 0:45:22 } +2024-07-26 00:28:17,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1402/ 1625], loss: 0.976, per_step_time: 1471ms, lr: 2.1287624e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:17,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.43685 samples/s/p 0:45:19 } +2024-07-26 00:28:20,330 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1404/ 1625], loss: 1.053, per_step_time: 1473ms, lr: 2.1263554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:20,330 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.6% |████████████████████████████████████████████ | 5.42907 samples/s/p 0:45:20 } +2024-07-26 00:28:23,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1406/ 1625], loss: 1.271, per_step_time: 1471ms, lr: 2.1239493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:23,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43631 samples/s/p 0:45:13 } +2024-07-26 00:28:26,231 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1408/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 2.1215442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:26,231 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43448 samples/s/p 0:45:11 } +2024-07-26 00:28:29,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1410/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 2.119145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:29,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% 
|████████████████████████████████████████████ | 5.43789 samples/s/p 0:45:06 } +2024-07-26 00:28:32,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1412/ 1625], loss: 0.981, per_step_time: 1472ms, lr: 2.1167457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:32,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43365 samples/s/p 0:45:06 } +2024-07-26 00:28:35,082 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1414/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 2.1143492e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:35,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43480 samples/s/p 0:45:02 } +2024-07-26 00:28:38,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1416/ 1625], loss: 1.008, per_step_time: 1471ms, lr: 2.111955e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:38,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43575 samples/s/p 0:44:59 } +2024-07-26 00:28:40,982 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1418/ 1625], loss: 0.921, per_step_time: 1471ms, lr: 2.1095645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:40,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% |████████████████████████████████████████████ | 5.43719 samples/s/p 0:44:55 } +2024-07-26 00:28:43,931 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1420/ 1625], loss: 1.351, per_step_time: 1470ms, lr: 2.1071755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:43,932 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.7% 
|████████████████████████████████████████████ | 5.43932 samples/s/p 0:44:51 } +2024-07-26 00:28:46,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1422/ 1625], loss: 1.128, per_step_time: 1471ms, lr: 2.1047895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:46,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43614 samples/s/p 0:44:50 } +2024-07-26 00:28:49,830 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1424/ 1625], loss: 0.926, per_step_time: 1471ms, lr: 2.1024048e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:49,831 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43806 samples/s/p 0:44:46 } +2024-07-26 00:28:52,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1426/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 2.1000246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:52,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43706 samples/s/p 0:44:43 } +2024-07-26 00:28:55,735 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1428/ 1625], loss: 1.217, per_step_time: 1473ms, lr: 2.0976454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:55,735 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.42766 samples/s/p 0:44:45 } +2024-07-26 00:28:58,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1430/ 1625], loss: 1.302, per_step_time: 1470ms, lr: 2.0952687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:28:58,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% 
|████████████████████████████████████████████ | 5.44018 samples/s/p 0:44:36 } +2024-07-26 00:29:01,635 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1432/ 1625], loss: 0.986, per_step_time: 1472ms, lr: 2.0928962e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:01,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43253 samples/s/p 0:44:37 } +2024-07-26 00:29:04,586 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1434/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 2.0905238e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:04,586 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43512 samples/s/p 0:44:32 } +2024-07-26 00:29:07,537 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1436/ 1625], loss: 1.103, per_step_time: 1472ms, lr: 2.088154e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:07,538 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43350 samples/s/p 0:44:30 } +2024-07-26 00:29:10,488 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1438/ 1625], loss: 1.223, per_step_time: 1471ms, lr: 2.0857894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:10,489 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.8% |████████████████████████████████████████████ | 5.43506 samples/s/p 0:44:27 } +2024-07-26 00:29:13,440 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1440/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 2.0834239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:13,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% 
|████████████████████████████████████████████ | 5.43347 samples/s/p 0:44:24 } +2024-07-26 00:29:16,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1442/ 1625], loss: 0.973, per_step_time: 1471ms, lr: 2.0810635e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:16,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43746 samples/s/p 0:44:20 } +2024-07-26 00:29:19,341 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1444/ 1625], loss: 1.023, per_step_time: 1472ms, lr: 2.0787043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:19,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43272 samples/s/p 0:44:19 } +2024-07-26 00:29:22,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1446/ 1625], loss: 1.073, per_step_time: 1471ms, lr: 2.0763464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:22,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43525 samples/s/p 0:44:15 } +2024-07-26 00:29:25,245 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1448/ 1625], loss: 0.923, per_step_time: 1472ms, lr: 2.073995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:25,245 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43119 samples/s/p 0:44:14 } +2024-07-26 00:29:28,197 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1450/ 1625], loss: 1.188, per_step_time: 1472ms, lr: 2.0716423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:28,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% 
|████████████████████████████████████████████ | 5.43230 samples/s/p 0:44:10 } +2024-07-26 00:29:31,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1452/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 2.0692923e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:31,148 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43647 samples/s/p 0:44:05 } +2024-07-26 00:29:34,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1454/ 1625], loss: 1.408, per_step_time: 1472ms, lr: 2.0669459e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:34,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 88.9% |████████████████████████████████████████████ | 5.43281 samples/s/p 0:44:04 } +2024-07-26 00:29:37,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1456/ 1625], loss: 1.039, per_step_time: 1472ms, lr: 2.0646019e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:37,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43308 samples/s/p 0:44:01 } +2024-07-26 00:29:40,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1458/ 1625], loss: 1.205, per_step_time: 1473ms, lr: 2.0622606e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:40,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43046 samples/s/p 0:43:59 } +2024-07-26 00:29:42,956 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1460/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 2.059921e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:42,956 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% 
|████████████████████████████████████████████ | 5.43553 samples/s/p 0:43:54 } +2024-07-26 00:29:45,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1462/ 1625], loss: 1.218, per_step_time: 1470ms, lr: 2.0575849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:45,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43880 samples/s/p 0:43:49 } +2024-07-26 00:29:48,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1464/ 1625], loss: 1.284, per_step_time: 1472ms, lr: 2.0552507e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:48,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43438 samples/s/p 0:43:49 } +2024-07-26 00:29:51,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1466/ 1625], loss: 1.090, per_step_time: 1473ms, lr: 2.0529178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:51,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.42755 samples/s/p 0:43:49 } +2024-07-26 00:29:54,764 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1468/ 1625], loss: 1.038, per_step_time: 1472ms, lr: 2.0505895e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:54,764 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% |████████████████████████████████████████████ | 5.43200 samples/s/p 0:43:44 } +2024-07-26 00:29:57,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1470/ 1625], loss: 1.185, per_step_time: 1473ms, lr: 2.048264e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:29:57,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.0% 
|████████████████████████████████████████████ | 5.43052 samples/s/p 0:43:42 } +2024-07-26 00:30:00,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1472/ 1625], loss: 1.140, per_step_time: 1473ms, lr: 2.045938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:00,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.43012 samples/s/p 0:43:39 } +2024-07-26 00:30:03,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1474/ 1625], loss: 1.049, per_step_time: 1473ms, lr: 2.0436166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:03,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.42965 samples/s/p 0:43:36 } +2024-07-26 00:30:06,578 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1476/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 2.0412986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:06,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.43082 samples/s/p 0:43:33 } +2024-07-26 00:30:09,525 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1478/ 1625], loss: 1.079, per_step_time: 1470ms, lr: 2.0389798e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:09,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.44111 samples/s/p 0:43:25 } +2024-07-26 00:30:12,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1480/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 2.0366654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:12,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% 
|████████████████████████████████████████████ | 5.43740 samples/s/p 0:43:24 } +2024-07-26 00:30:15,422 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1482/ 1625], loss: 1.258, per_step_time: 1470ms, lr: 2.034355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:15,422 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.44140 samples/s/p 0:43:19 } +2024-07-26 00:30:18,371 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1484/ 1625], loss: 1.056, per_step_time: 1470ms, lr: 2.032044e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:18,371 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.43861 samples/s/p 0:43:17 } +2024-07-26 00:30:21,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1486/ 1625], loss: 1.227, per_step_time: 1470ms, lr: 2.0297382e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:21,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.1% |████████████████████████████████████████████ | 5.44150 samples/s/p 0:43:13 } +2024-07-26 00:30:24,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1488/ 1625], loss: 1.273, per_step_time: 1472ms, lr: 2.0274342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:24,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43425 samples/s/p 0:43:13 } +2024-07-26 00:30:27,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1490/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 2.025131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:27,218 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% 
|████████████████████████████████████████████ | 5.43981 samples/s/p 0:43:08 } +2024-07-26 00:30:30,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1492/ 1625], loss: 1.218, per_step_time: 1471ms, lr: 2.0228326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:30,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43561 samples/s/p 0:43:07 } +2024-07-26 00:30:33,118 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1494/ 1625], loss: 1.180, per_step_time: 1471ms, lr: 2.0205355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:33,118 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43659 samples/s/p 0:43:03 } +2024-07-26 00:30:36,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1496/ 1625], loss: 1.193, per_step_time: 1470ms, lr: 2.0182401e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:36,065 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.44158 samples/s/p 0:42:58 } +2024-07-26 00:30:39,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1498/ 1625], loss: 1.111, per_step_time: 1471ms, lr: 2.0159487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:39,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43704 samples/s/p 0:42:57 } +2024-07-26 00:30:41,964 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1500/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 2.0136595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:41,965 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% 
|████████████████████████████████████████████ | 5.43684 samples/s/p 0:42:55 } +2024-07-26 00:30:44,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1502/ 1625], loss: 1.233, per_step_time: 1472ms, lr: 2.0113716e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:44,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.2% |████████████████████████████████████████████ | 5.43468 samples/s/p 0:42:53 } +2024-07-26 00:30:47,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1504/ 1625], loss: 1.056, per_step_time: 1470ms, lr: 2.0090874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:47,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43966 samples/s/p 0:42:47 } +2024-07-26 00:30:50,812 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1506/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 2.0068057e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:50,813 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43940 samples/s/p 0:42:44 } +2024-07-26 00:30:53,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1508/ 1625], loss: 1.013, per_step_time: 1471ms, lr: 2.0045259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:53,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43700 samples/s/p 0:42:43 } +2024-07-26 00:30:56,710 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1510/ 1625], loss: 1.035, per_step_time: 1470ms, lr: 2.0022485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:56,710 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% 
|████████████████████████████████████████████ | 5.44011 samples/s/p 0:42:38 } +2024-07-26 00:30:59,660 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1512/ 1625], loss: 1.242, per_step_time: 1471ms, lr: 1.9999738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:30:59,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43716 samples/s/p 0:42:37 } +2024-07-26 00:31:02,610 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1514/ 1625], loss: 1.071, per_step_time: 1471ms, lr: 1.9977024e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:02,610 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43751 samples/s/p 0:42:34 } +2024-07-26 00:31:05,559 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1516/ 1625], loss: 1.226, per_step_time: 1471ms, lr: 1.9954318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:05,559 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43834 samples/s/p 0:42:30 } +2024-07-26 00:31:08,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1518/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 1.9931658e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:08,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.3% |████████████████████████████████████████████ | 5.43043 samples/s/p 0:42:31 } +2024-07-26 00:31:11,461 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1520/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.9909023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:11,461 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% 
|████████████████████████████████████████████ | 5.43905 samples/s/p 0:42:24 } +2024-07-26 00:31:14,411 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1522/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 1.988638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:14,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.43717 samples/s/p 0:42:22 } +2024-07-26 00:31:17,358 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1524/ 1625], loss: 1.122, per_step_time: 1470ms, lr: 1.9863796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:17,358 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.44091 samples/s/p 0:42:17 } +2024-07-26 00:31:20,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1526/ 1625], loss: 1.031, per_step_time: 1470ms, lr: 1.9841232e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:20,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.44124 samples/s/p 0:42:14 } +2024-07-26 00:31:23,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1528/ 1625], loss: 1.175, per_step_time: 1471ms, lr: 1.9818672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:23,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.43507 samples/s/p 0:42:14 } +2024-07-26 00:31:26,205 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1530/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.9796166e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:26,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% 
|████████████████████████████████████████████ | 5.43820 samples/s/p 0:42:10 } +2024-07-26 00:31:29,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1532/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.977366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:29,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.43411 samples/s/p 0:42:09 } +2024-07-26 00:31:32,111 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1534/ 1625], loss: 1.170, per_step_time: 1473ms, lr: 1.9751183e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:32,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.4% |████████████████████████████████████████████ | 5.42963 samples/s/p 0:42:08 } +2024-07-26 00:31:35,062 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1536/ 1625], loss: 1.049, per_step_time: 1472ms, lr: 1.9728745e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:35,063 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.43467 samples/s/p 0:42:03 } +2024-07-26 00:31:38,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1538/ 1625], loss: 1.069, per_step_time: 1472ms, lr: 1.9706317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:38,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.43303 samples/s/p 0:42:00 } +2024-07-26 00:31:40,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1540/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 1.9683916e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:40,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% 
|████████████████████████████████████████████ | 5.43279 samples/s/p 0:41:58 } +2024-07-26 00:31:43,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1542/ 1625], loss: 1.079, per_step_time: 1473ms, lr: 1.9661557e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:43,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.43109 samples/s/p 0:41:55 } +2024-07-26 00:31:46,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1544/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 1.9639208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:46,874 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.42856 samples/s/p 0:41:54 } +2024-07-26 00:31:49,826 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1546/ 1625], loss: 1.124, per_step_time: 1472ms, lr: 1.9616884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:49,826 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.43244 samples/s/p 0:41:49 } +2024-07-26 00:31:52,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1548/ 1625], loss: 1.151, per_step_time: 1470ms, lr: 1.9594595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:52,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% |████████████████████████████████████████████ | 5.44093 samples/s/p 0:41:42 } +2024-07-26 00:31:55,723 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1550/ 1625], loss: 1.286, per_step_time: 1471ms, lr: 1.9572321e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:55,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.5% 
|████████████████████████████████████████████ | 5.43688 samples/s/p 0:41:41 } +2024-07-26 00:31:58,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1552/ 1625], loss: 1.164, per_step_time: 1473ms, lr: 1.9550075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:31:58,677 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43021 samples/s/p 0:41:41 } +2024-07-26 00:32:01,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1554/ 1625], loss: 0.970, per_step_time: 1471ms, lr: 1.9527856e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:01,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43813 samples/s/p 0:41:34 } +2024-07-26 00:32:04,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1556/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.9505653e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:04,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43499 samples/s/p 0:41:33 } +2024-07-26 00:32:07,526 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1558/ 1625], loss: 1.141, per_step_time: 1471ms, lr: 1.9483475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:07,526 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43712 samples/s/p 0:41:29 } +2024-07-26 00:32:10,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1560/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 1.9461334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:10,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% 
|████████████████████████████████████████████ | 5.43115 samples/s/p 0:41:29 } +2024-07-26 00:32:13,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1562/ 1625], loss: 1.074, per_step_time: 1470ms, lr: 1.9439217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:13,427 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.44055 samples/s/p 0:41:22 } +2024-07-26 00:32:16,383 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1564/ 1625], loss: 1.135, per_step_time: 1473ms, lr: 1.941711e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:16,384 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.42775 samples/s/p 0:41:25 } +2024-07-26 00:32:19,339 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1566/ 1625], loss: 1.263, per_step_time: 1471ms, lr: 1.9395043e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:19,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43573 samples/s/p 0:41:18 } +2024-07-26 00:32:22,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1568/ 1625], loss: 1.125, per_step_time: 1472ms, lr: 1.9372997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:22,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.6% |████████████████████████████████████████████ | 5.43412 samples/s/p 0:41:16 } +2024-07-26 00:32:25,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1570/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 1.9350991e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:25,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% 
|████████████████████████████████████████████ | 5.43817 samples/s/p 0:41:11 } +2024-07-26 00:32:28,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1572/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 1.932897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:28,191 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43351 samples/s/p 0:41:10 } +2024-07-26 00:32:31,142 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1574/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.9307017e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:31,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43595 samples/s/p 0:41:06 } +2024-07-26 00:32:34,092 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1576/ 1625], loss: 1.062, per_step_time: 1471ms, lr: 1.9285076e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:34,092 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43669 samples/s/p 0:41:03 } +2024-07-26 00:32:37,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1578/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 1.926313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:37,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43821 samples/s/p 0:40:59 } +2024-07-26 00:32:39,992 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1580/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 1.9241247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:39,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% 
|████████████████████████████████████████████ | 5.43418 samples/s/p 0:40:58 } +2024-07-26 00:32:42,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1582/ 1625], loss: 1.082, per_step_time: 1472ms, lr: 1.921938e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:42,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43257 samples/s/p 0:40:56 } +2024-07-26 00:32:45,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1584/ 1625], loss: 1.121, per_step_time: 1471ms, lr: 1.9197541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:45,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.7% |████████████████████████████████████████████ | 5.43525 samples/s/p 0:40:52 } +2024-07-26 00:32:48,843 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1586/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 1.917571e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:48,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.44009 samples/s/p 0:40:47 } +2024-07-26 00:32:51,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1588/ 1625], loss: 1.420, per_step_time: 1471ms, lr: 1.9153913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:51,793 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.43760 samples/s/p 0:40:45 } +2024-07-26 00:32:54,743 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1590/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 1.913215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:54,743 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% 
|████████████████████████████████████████████ | 5.43596 samples/s/p 0:40:42 } +2024-07-26 00:32:57,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1592/ 1625], loss: 1.220, per_step_time: 1470ms, lr: 1.9110398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:32:57,692 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.43896 samples/s/p 0:40:38 } +2024-07-26 00:33:00,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1594/ 1625], loss: 1.066, per_step_time: 1470ms, lr: 1.908868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:00,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.43992 samples/s/p 0:40:35 } +2024-07-26 00:33:03,591 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1596/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.9066994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:03,591 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.43413 samples/s/p 0:40:34 } +2024-07-26 00:33:06,546 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1598/ 1625], loss: 1.161, per_step_time: 1473ms, lr: 1.904531e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:06,546 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% |████████████████████████████████████████████ | 5.42780 samples/s/p 0:40:34 } +2024-07-26 00:33:09,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1600/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.9023669e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:09,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.8% 
|████████████████████████████████████████████ | 5.43181 samples/s/p 0:40:30 } +2024-07-26 00:33:12,449 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1602/ 1625], loss: 1.007, per_step_time: 1472ms, lr: 1.9002052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:12,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43416 samples/s/p 0:40:26 } +2024-07-26 00:33:15,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1604/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 1.8980454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:15,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43476 samples/s/p 0:40:22 } +2024-07-26 00:33:18,351 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1606/ 1625], loss: 1.272, per_step_time: 1471ms, lr: 1.8958883e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:18,352 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43527 samples/s/p 0:40:19 } +2024-07-26 00:33:21,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1608/ 1625], loss: 1.072, per_step_time: 1471ms, lr: 1.8937328e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:21,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43498 samples/s/p 0:40:16 } +2024-07-26 00:33:24,254 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1610/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 1.8915816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:24,254 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% 
|████████████████████████████████████████████ | 5.43302 samples/s/p 0:40:14 } +2024-07-26 00:33:27,206 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1612/ 1625], loss: 1.299, per_step_time: 1472ms, lr: 1.8894331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:27,206 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43288 samples/s/p 0:40:11 } +2024-07-26 00:33:30,157 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1614/ 1625], loss: 1.069, per_step_time: 1471ms, lr: 1.8872854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:30,157 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.43490 samples/s/p 0:40:08 } +2024-07-26 00:33:33,112 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1616/ 1625], loss: 1.144, per_step_time: 1473ms, lr: 1.8851403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:33,112 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 89.9% |████████████████████████████████████████████ | 5.42759 samples/s/p 0:40:08 } +2024-07-26 00:33:36,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1618/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 1.8829994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:36,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.42994 samples/s/p 0:40:04 } +2024-07-26 00:33:39,014 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1620/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.8808604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:39,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% 
|████████████████████████████████████████████ | 5.43778 samples/s/p 0:39:58 } +2024-07-26 00:33:41,965 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1622/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 1.8787222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:41,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.43469 samples/s/p 0:39:56 } +2024-07-26 00:33:44,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 9/ 10], step:[ 1624/ 1625], loss: 1.007, per_step_time: 1471ms, lr: 1.8765884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:44,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |████████████████████████████████████████████ | 5.43747 samples/s/p 0:39:52 } +2024-07-26 00:33:47,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 1.874457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:47,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.43567 samples/s/p 0:39:50 } +2024-07-26 00:33:50,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 3/ 1625], loss: 1.203, per_step_time: 1472ms, lr: 1.8723283e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:50,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.43312 samples/s/p 0:39:48 } +2024-07-26 00:33:53,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 5/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 1.8702005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:53,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% 
|█████████████████████████████████████████████ | 5.43265 samples/s/p 0:39:45 } +2024-07-26 00:33:56,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 7/ 1625], loss: 1.157, per_step_time: 1475ms, lr: 1.8680762e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:56,726 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.0% |█████████████████████████████████████████████ | 5.42331 samples/s/p 0:39:46 } +2024-07-26 00:33:59,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 9/ 1625], loss: 1.079, per_step_time: 1472ms, lr: 1.8659543e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:33:59,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.43332 samples/s/p 0:39:39 } +2024-07-26 00:34:02,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 11/ 1625], loss: 1.025, per_step_time: 1470ms, lr: 1.8638343e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:02,626 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.43956 samples/s/p 0:39:33 } +2024-07-26 00:34:05,582 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 13/ 1625], loss: 1.202, per_step_time: 1474ms, lr: 1.8617186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:05,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.42481 samples/s/p 0:39:37 } +2024-07-26 00:34:08,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 15/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.8596038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:08,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% 
|█████████████████████████████████████████████ | 5.44013 samples/s/p 0:39:27 } +2024-07-26 00:34:11,478 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 17/ 1625], loss: 0.964, per_step_time: 1470ms, lr: 1.8574915e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:11,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.43923 samples/s/p 0:39:25 } +2024-07-26 00:34:14,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 19/ 1625], loss: 1.044, per_step_time: 1472ms, lr: 1.8553835e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:14,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.43394 samples/s/p 0:39:24 } +2024-07-26 00:34:17,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 21/ 1625], loss: 1.285, per_step_time: 1469ms, lr: 1.8532755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:17,377 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.44297 samples/s/p 0:39:17 } +2024-07-26 00:34:20,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 23/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 1.8511719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:20,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.1% |█████████████████████████████████████████████ | 5.43343 samples/s/p 0:39:18 } +2024-07-26 00:34:23,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 25/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.84907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:23,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% 
|█████████████████████████████████████████████ | 5.43351 samples/s/p 0:39:15 } +2024-07-26 00:34:26,230 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 27/ 1625], loss: 1.088, per_step_time: 1471ms, lr: 1.8469707e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:26,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43632 samples/s/p 0:39:11 } +2024-07-26 00:34:29,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 29/ 1625], loss: 1.190, per_step_time: 1472ms, lr: 1.8448749e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:29,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43140 samples/s/p 0:39:10 } +2024-07-26 00:34:32,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 31/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 1.8427816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:32,134 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43497 samples/s/p 0:39:06 } +2024-07-26 00:34:35,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 33/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 1.8406874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:35,084 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43633 samples/s/p 0:39:02 } +2024-07-26 00:34:38,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 35/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 1.8385986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:38,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% 
|█████████████████████████████████████████████ | 5.43610 samples/s/p 0:38:59 } +2024-07-26 00:34:40,984 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 37/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 1.836514e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:40,985 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43476 samples/s/p 0:38:57 } +2024-07-26 00:34:43,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 39/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.8344285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:43,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.2% |█████████████████████████████████████████████ | 5.43699 samples/s/p 0:38:53 } +2024-07-26 00:34:46,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 41/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 1.8323465e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:46,885 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43636 samples/s/p 0:38:50 } +2024-07-26 00:34:49,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 43/ 1625], loss: 1.283, per_step_time: 1471ms, lr: 1.8302687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:49,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43489 samples/s/p 0:38:48 } +2024-07-26 00:34:52,785 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 45/ 1625], loss: 1.299, per_step_time: 1471ms, lr: 1.8281928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:52,786 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% 
|█████████████████████████████████████████████ | 5.43687 samples/s/p 0:38:44 } +2024-07-26 00:34:55,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 47/ 1625], loss: 1.103, per_step_time: 1473ms, lr: 1.8261185e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:55,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43058 samples/s/p 0:38:44 } +2024-07-26 00:34:58,691 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 49/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 1.8240469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:34:58,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43321 samples/s/p 0:38:40 } +2024-07-26 00:35:01,642 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 51/ 1625], loss: 1.251, per_step_time: 1472ms, lr: 1.8219787e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:01,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.43345 samples/s/p 0:38:37 } +2024-07-26 00:35:04,597 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 53/ 1625], loss: 1.175, per_step_time: 1474ms, lr: 1.8199123e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:04,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% |█████████████████████████████████████████████ | 5.42655 samples/s/p 0:38:37 } +2024-07-26 00:35:07,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 55/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 1.8178475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:07,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.3% 
|█████████████████████████████████████████████ | 5.43703 samples/s/p 0:38:30 } +2024-07-26 00:35:10,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 57/ 1625], loss: 1.223, per_step_time: 1470ms, lr: 1.8157862e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:10,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.44163 samples/s/p 0:38:25 } +2024-07-26 00:35:13,446 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 59/ 1625], loss: 0.952, per_step_time: 1471ms, lr: 1.8137284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:13,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.43538 samples/s/p 0:38:24 } +2024-07-26 00:35:16,399 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 61/ 1625], loss: 1.110, per_step_time: 1472ms, lr: 1.8116714e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:16,399 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.43248 samples/s/p 0:38:23 } +2024-07-26 00:35:19,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 63/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 1.8096171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:19,351 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.43362 samples/s/p 0:38:19 } +2024-07-26 00:35:22,303 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 65/ 1625], loss: 0.928, per_step_time: 1472ms, lr: 1.8075671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:22,303 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% 
|█████████████████████████████████████████████ | 5.43134 samples/s/p 0:38:17 } +2024-07-26 00:35:25,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 67/ 1625], loss: 1.096, per_step_time: 1474ms, lr: 1.8055188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:25,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.42716 samples/s/p 0:38:16 } +2024-07-26 00:35:28,214 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 69/ 1625], loss: 1.183, per_step_time: 1474ms, lr: 1.8034722e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:28,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.42472 samples/s/p 0:38:14 } +2024-07-26 00:35:31,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 71/ 1625], loss: 1.257, per_step_time: 1473ms, lr: 1.8014273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:31,169 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.42851 samples/s/p 0:38:10 } +2024-07-26 00:35:34,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 73/ 1625], loss: 1.043, per_step_time: 1471ms, lr: 1.7993868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:34,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.4% |█████████████████████████████████████████████ | 5.43537 samples/s/p 0:38:04 } +2024-07-26 00:35:37,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 75/ 1625], loss: 0.976, per_step_time: 1474ms, lr: 1.7973497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:37,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% 
|█████████████████████████████████████████████ | 5.42533 samples/s/p 0:38:05 } +2024-07-26 00:35:40,026 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 77/ 1625], loss: 1.014, per_step_time: 1471ms, lr: 1.7953125e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:40,027 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43745 samples/s/p 0:37:57 } +2024-07-26 00:35:42,978 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 79/ 1625], loss: 1.228, per_step_time: 1472ms, lr: 1.793279e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:42,978 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43344 samples/s/p 0:37:56 } +2024-07-26 00:35:45,929 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 81/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 1.7912497e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:45,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43445 samples/s/p 0:37:52 } +2024-07-26 00:35:48,882 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 83/ 1625], loss: 1.205, per_step_time: 1472ms, lr: 1.7892187e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:48,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43172 samples/s/p 0:37:51 } +2024-07-26 00:35:51,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 85/ 1625], loss: 1.025, per_step_time: 1473ms, lr: 1.7871937e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:51,835 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% 
|█████████████████████████████████████████████ | 5.43063 samples/s/p 0:37:48 } +2024-07-26 00:35:54,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 87/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 1.7851713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:54,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.43074 samples/s/p 0:37:45 } +2024-07-26 00:35:57,742 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 89/ 1625], loss: 1.154, per_step_time: 1473ms, lr: 1.783149e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:35:57,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.5% |█████████████████████████████████████████████ | 5.42863 samples/s/p 0:37:43 } +2024-07-26 00:36:00,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 91/ 1625], loss: 0.966, per_step_time: 1469ms, lr: 1.7811317e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:00,689 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.44289 samples/s/p 0:37:34 } +2024-07-26 00:36:03,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 93/ 1625], loss: 1.217, per_step_time: 1478ms, lr: 1.7791153e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:03,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.41206 samples/s/p 0:37:44 } +2024-07-26 00:36:06,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 95/ 1625], loss: 1.083, per_step_time: 1473ms, lr: 1.7771025e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:06,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% 
|█████████████████████████████████████████████ | 5.42849 samples/s/p 0:37:34 } +2024-07-26 00:36:09,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 97/ 1625], loss: 1.111, per_step_time: 1470ms, lr: 1.7750922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:09,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.43961 samples/s/p 0:37:27 } +2024-07-26 00:36:12,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 99/ 1625], loss: 1.211, per_step_time: 1471ms, lr: 1.7730837e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:12,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.43587 samples/s/p 0:37:25 } +2024-07-26 00:36:15,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 101/ 1625], loss: 0.986, per_step_time: 1471ms, lr: 1.7710777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:15,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.43740 samples/s/p 0:37:22 } +2024-07-26 00:36:18,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 103/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 1.7690743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:18,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% |█████████████████████████████████████████████ | 5.43953 samples/s/p 0:37:18 } +2024-07-26 00:36:21,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 105/ 1625], loss: 1.178, per_step_time: 1472ms, lr: 1.7670752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:21,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.6% 
|█████████████████████████████████████████████ | 5.43305 samples/s/p 0:37:18 } +2024-07-26 00:36:24,306 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 107/ 1625], loss: 1.195, per_step_time: 1471ms, lr: 1.7650761e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:24,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43482 samples/s/p 0:37:14 } +2024-07-26 00:36:27,256 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 109/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.7630806e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:27,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43570 samples/s/p 0:37:11 } +2024-07-26 00:36:30,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 111/ 1625], loss: 1.137, per_step_time: 1473ms, lr: 1.7610876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:30,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43002 samples/s/p 0:37:10 } +2024-07-26 00:36:33,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 113/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 1.759098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:33,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43098 samples/s/p 0:37:07 } +2024-07-26 00:36:36,115 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 115/ 1625], loss: 1.170, per_step_time: 1472ms, lr: 1.7571094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:36,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% 
|█████████████████████████████████████████████ | 5.43223 samples/s/p 0:37:03 } +2024-07-26 00:36:39,064 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 117/ 1625], loss: 1.163, per_step_time: 1470ms, lr: 1.7551233e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:39,064 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43857 samples/s/p 0:36:58 } +2024-07-26 00:36:42,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 119/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 1.7531424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:42,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43110 samples/s/p 0:36:58 } +2024-07-26 00:36:44,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 121/ 1625], loss: 1.143, per_step_time: 1470ms, lr: 1.7511607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:44,966 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.7% |█████████████████████████████████████████████ | 5.43895 samples/s/p 0:36:52 } +2024-07-26 00:36:47,916 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 123/ 1625], loss: 1.229, per_step_time: 1471ms, lr: 1.7491832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:47,917 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43542 samples/s/p 0:36:50 } +2024-07-26 00:36:50,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 125/ 1625], loss: 1.322, per_step_time: 1471ms, lr: 1.7472075e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:50,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% 
|█████████████████████████████████████████████ | 5.43782 samples/s/p 0:36:46 } +2024-07-26 00:36:53,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 127/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 1.7452353e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:53,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43535 samples/s/p 0:36:44 } +2024-07-26 00:36:56,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 129/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 1.7432646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:56,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43906 samples/s/p 0:36:40 } +2024-07-26 00:36:59,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 131/ 1625], loss: 1.122, per_step_time: 1471ms, lr: 1.7412976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:36:59,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43757 samples/s/p 0:36:38 } +2024-07-26 00:37:02,663 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 133/ 1625], loss: 1.078, per_step_time: 1471ms, lr: 1.7393314e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:02,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43801 samples/s/p 0:36:34 } +2024-07-26 00:37:05,617 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 135/ 1625], loss: 1.207, per_step_time: 1473ms, lr: 1.7373695e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:05,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% 
|█████████████████████████████████████████████ | 5.43087 samples/s/p 0:36:34 } +2024-07-26 00:37:08,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 137/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.7354103e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:08,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.8% |█████████████████████████████████████████████ | 5.43239 samples/s/p 0:36:31 } +2024-07-26 00:37:11,521 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 139/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.733451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:11,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43454 samples/s/p 0:36:27 } +2024-07-26 00:37:14,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 141/ 1625], loss: 1.361, per_step_time: 1471ms, lr: 1.7314977e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:14,472 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43510 samples/s/p 0:36:24 } +2024-07-26 00:37:17,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 143/ 1625], loss: 1.055, per_step_time: 1473ms, lr: 1.7295454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:17,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43102 samples/s/p 0:36:23 } +2024-07-26 00:37:20,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 145/ 1625], loss: 1.144, per_step_time: 1473ms, lr: 1.7275947e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:20,378 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% 
|█████████████████████████████████████████████ | 5.43039 samples/s/p 0:36:20 } +2024-07-26 00:37:23,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 147/ 1625], loss: 0.965, per_step_time: 1474ms, lr: 1.7256475e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:23,335 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.42419 samples/s/p 0:36:19 } +2024-07-26 00:37:26,287 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 149/ 1625], loss: 1.017, per_step_time: 1473ms, lr: 1.7237029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:26,287 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43107 samples/s/p 0:36:14 } +2024-07-26 00:37:29,242 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 151/ 1625], loss: 1.189, per_step_time: 1473ms, lr: 1.7217609e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:29,242 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.42849 samples/s/p 0:36:12 } +2024-07-26 00:37:32,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 153/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 1.7198215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:32,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 90.9% |█████████████████████████████████████████████ | 5.43404 samples/s/p 0:36:07 } +2024-07-26 00:37:35,146 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 155/ 1625], loss: 1.184, per_step_time: 1472ms, lr: 1.7178838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:35,146 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% 
|█████████████████████████████████████████████ | 5.43198 samples/s/p 0:36:04 } +2024-07-26 00:37:38,094 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 157/ 1625], loss: 1.014, per_step_time: 1470ms, lr: 1.7159505e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:38,095 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43919 samples/s/p 0:35:59 } +2024-07-26 00:37:41,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 159/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.7140179e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:41,046 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43410 samples/s/p 0:35:58 } +2024-07-26 00:37:43,995 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 161/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 1.712088e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:43,995 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43793 samples/s/p 0:35:53 } +2024-07-26 00:37:46,945 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 163/ 1625], loss: 1.064, per_step_time: 1471ms, lr: 1.7101625e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:46,945 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43590 samples/s/p 0:35:51 } +2024-07-26 00:37:49,896 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 165/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 1.7082368e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:49,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% 
|█████████████████████████████████████████████ | 5.43460 samples/s/p 0:35:49 } +2024-07-26 00:37:52,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 167/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 1.7063146e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:52,847 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43711 samples/s/p 0:35:45 } +2024-07-26 00:37:55,799 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 169/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 1.7043969e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:55,800 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.0% |█████████████████████████████████████████████ | 5.43092 samples/s/p 0:35:44 } +2024-07-26 00:37:58,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 171/ 1625], loss: 1.274, per_step_time: 1472ms, lr: 1.702479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:37:58,751 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.43422 samples/s/p 0:35:40 } +2024-07-26 00:38:01,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 173/ 1625], loss: 1.247, per_step_time: 1471ms, lr: 1.7005664e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:01,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.43755 samples/s/p 0:35:36 } +2024-07-26 00:38:04,652 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 175/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.6986538e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:04,652 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% 
|█████████████████████████████████████████████ | 5.43310 samples/s/p 0:35:35 } +2024-07-26 00:38:07,604 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 177/ 1625], loss: 1.042, per_step_time: 1472ms, lr: 1.6967438e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:07,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.43305 samples/s/p 0:35:32 } +2024-07-26 00:38:10,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 179/ 1625], loss: 1.098, per_step_time: 1470ms, lr: 1.6948381e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:10,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.44001 samples/s/p 0:35:26 } +2024-07-26 00:38:13,498 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 181/ 1625], loss: 1.048, per_step_time: 1469ms, lr: 1.6929341e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:13,498 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.44355 samples/s/p 0:35:22 } +2024-07-26 00:38:16,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 183/ 1625], loss: 1.265, per_step_time: 1470ms, lr: 1.691031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:16,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% |█████████████████████████████████████████████ | 5.43850 samples/s/p 0:35:21 } +2024-07-26 00:38:19,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 185/ 1625], loss: 1.118, per_step_time: 1473ms, lr: 1.6891331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:19,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.1% 
|█████████████████████████████████████████████ | 5.43046 samples/s/p 0:35:21 } +2024-07-26 00:38:22,356 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 187/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.6872377e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:22,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43578 samples/s/p 0:35:16 } +2024-07-26 00:38:25,307 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 189/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 1.6853432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:25,307 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43472 samples/s/p 0:35:13 } +2024-07-26 00:38:28,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 191/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.6834522e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:28,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43196 samples/s/p 0:35:11 } +2024-07-26 00:38:31,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 193/ 1625], loss: 1.224, per_step_time: 1474ms, lr: 1.6815638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:31,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.42565 samples/s/p 0:35:11 } +2024-07-26 00:38:34,165 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 195/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 1.6796771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:34,165 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% 
|█████████████████████████████████████████████ | 5.43650 samples/s/p 0:35:04 } +2024-07-26 00:38:37,117 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 197/ 1625], loss: 1.182, per_step_time: 1472ms, lr: 1.6777931e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:37,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43294 samples/s/p 0:35:02 } +2024-07-26 00:38:40,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 199/ 1625], loss: 1.009, per_step_time: 1471ms, lr: 1.6759124e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:40,068 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43488 samples/s/p 0:34:59 } +2024-07-26 00:38:43,015 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 201/ 1625], loss: 1.016, per_step_time: 1470ms, lr: 1.6740352e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:43,015 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.44149 samples/s/p 0:34:53 } +2024-07-26 00:38:45,966 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 203/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 1.6721572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:45,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.2% |█████████████████████████████████████████████ | 5.43310 samples/s/p 0:34:53 } +2024-07-26 00:38:48,919 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 205/ 1625], loss: 1.088, per_step_time: 1473ms, lr: 1.6702834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:48,920 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% 
|█████████████████████████████████████████████ | 5.43097 samples/s/p 0:34:51 } +2024-07-26 00:38:51,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 207/ 1625], loss: 1.225, per_step_time: 1472ms, lr: 1.6684139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:51,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.43469 samples/s/p 0:34:47 } +2024-07-26 00:38:54,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 209/ 1625], loss: 1.233, per_step_time: 1471ms, lr: 1.6665446e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:54,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.43676 samples/s/p 0:34:43 } +2024-07-26 00:38:57,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 211/ 1625], loss: 1.155, per_step_time: 1473ms, lr: 1.6646795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:38:57,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.42913 samples/s/p 0:34:43 } +2024-07-26 00:39:00,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 213/ 1625], loss: 1.157, per_step_time: 1473ms, lr: 1.662817e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:00,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.42976 samples/s/p 0:34:40 } +2024-07-26 00:39:03,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 215/ 1625], loss: 1.086, per_step_time: 1471ms, lr: 1.6609554e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:03,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% 
|█████████████████████████████████████████████ | 5.43604 samples/s/p 0:34:35 } +2024-07-26 00:39:06,626 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 217/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 1.659098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:06,627 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.43999 samples/s/p 0:34:30 } +2024-07-26 00:39:09,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 219/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 1.6572433e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:09,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.3% |█████████████████████████████████████████████ | 5.43584 samples/s/p 0:34:29 } +2024-07-26 00:39:12,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 221/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 1.6553886e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:12,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43252 samples/s/p 0:34:27 } +2024-07-26 00:39:15,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 223/ 1625], loss: 1.200, per_step_time: 1471ms, lr: 1.6535391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:15,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43497 samples/s/p 0:34:23 } +2024-07-26 00:39:18,427 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 225/ 1625], loss: 1.194, per_step_time: 1470ms, lr: 1.6516913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:18,428 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% 
|█████████████████████████████████████████████ | 5.44158 samples/s/p 0:34:18 } +2024-07-26 00:39:21,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 227/ 1625], loss: 1.090, per_step_time: 1473ms, lr: 1.6498452e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:21,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.42947 samples/s/p 0:34:19 } +2024-07-26 00:39:24,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 229/ 1625], loss: 1.369, per_step_time: 1471ms, lr: 1.6480035e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:24,332 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43670 samples/s/p 0:34:14 } +2024-07-26 00:39:27,283 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 231/ 1625], loss: 1.009, per_step_time: 1472ms, lr: 1.6461626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:27,283 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43364 samples/s/p 0:34:12 } +2024-07-26 00:39:30,234 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 233/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.644326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:30,234 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% |█████████████████████████████████████████████ | 5.43440 samples/s/p 0:34:09 } +2024-07-26 00:39:33,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 235/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 1.6424902e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:33,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.4% 
|█████████████████████████████████████████████ | 5.43894 samples/s/p 0:34:04 } +2024-07-26 00:39:36,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 237/ 1625], loss: 1.055, per_step_time: 1472ms, lr: 1.6406572e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:36,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43357 samples/s/p 0:34:03 } +2024-07-26 00:39:39,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 239/ 1625], loss: 1.005, per_step_time: 1470ms, lr: 1.6388275e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:39,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43866 samples/s/p 0:33:58 } +2024-07-26 00:39:42,032 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 241/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.6369995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:42,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43812 samples/s/p 0:33:55 } +2024-07-26 00:39:44,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 243/ 1625], loss: 1.248, per_step_time: 1471ms, lr: 1.6351751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:44,984 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43492 samples/s/p 0:33:54 } +2024-07-26 00:39:47,932 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 245/ 1625], loss: 1.161, per_step_time: 1470ms, lr: 1.6333532e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:47,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% 
|█████████████████████████████████████████████ | 5.43958 samples/s/p 0:33:49 } +2024-07-26 00:39:50,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 247/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 1.6315331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:50,881 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43927 samples/s/p 0:33:46 } +2024-07-26 00:39:53,833 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 249/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 1.6297164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:53,833 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43228 samples/s/p 0:33:46 } +2024-07-26 00:39:56,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 251/ 1625], loss: 1.268, per_step_time: 1473ms, lr: 1.6279023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:56,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.5% |█████████████████████████████████████████████ | 5.43016 samples/s/p 0:33:44 } +2024-07-26 00:39:59,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 253/ 1625], loss: 0.906, per_step_time: 1472ms, lr: 1.626089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:39:59,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43168 samples/s/p 0:33:40 } +2024-07-26 00:40:02,692 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 255/ 1625], loss: 1.126, per_step_time: 1473ms, lr: 1.6242784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:02,693 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% 
|█████████████████████████████████████████████ | 5.43036 samples/s/p 0:33:38 } +2024-07-26 00:40:05,643 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 257/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.6224739e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:05,643 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43563 samples/s/p 0:33:33 } +2024-07-26 00:40:08,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 259/ 1625], loss: 1.244, per_step_time: 1471ms, lr: 1.6206675e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:08,593 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43629 samples/s/p 0:33:30 } +2024-07-26 00:40:11,543 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 261/ 1625], loss: 1.264, per_step_time: 1471ms, lr: 1.618868e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:11,543 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43681 samples/s/p 0:33:27 } +2024-07-26 00:40:14,492 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 263/ 1625], loss: 1.138, per_step_time: 1471ms, lr: 1.6170687e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:14,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43709 samples/s/p 0:33:24 } +2024-07-26 00:40:17,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 265/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.6152701e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:17,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% 
|█████████████████████████████████████████████ | 5.43714 samples/s/p 0:33:21 } +2024-07-26 00:40:20,390 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 267/ 1625], loss: 1.176, per_step_time: 1470ms, lr: 1.6134777e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:20,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.6% |█████████████████████████████████████████████ | 5.43928 samples/s/p 0:33:17 } +2024-07-26 00:40:23,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 269/ 1625], loss: 1.140, per_step_time: 1471ms, lr: 1.611686e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:23,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.43687 samples/s/p 0:33:15 } +2024-07-26 00:40:26,292 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 271/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.609897e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:26,292 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.43333 samples/s/p 0:33:13 } +2024-07-26 00:40:29,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 273/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.6081106e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:29,244 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.43326 samples/s/p 0:33:10 } +2024-07-26 00:40:32,193 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 275/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.6063259e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:32,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% 
|█████████████████████████████████████████████ | 5.43681 samples/s/p 0:33:06 } +2024-07-26 00:40:35,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 277/ 1625], loss: 1.119, per_step_time: 1470ms, lr: 1.6045447e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:35,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.43990 samples/s/p 0:33:02 } +2024-07-26 00:40:38,089 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 279/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 1.6027659e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:38,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.44016 samples/s/p 0:32:59 } +2024-07-26 00:40:41,037 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 281/ 1625], loss: 1.128, per_step_time: 1470ms, lr: 1.6009908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:41,037 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.44131 samples/s/p 0:32:55 } +2024-07-26 00:40:43,987 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 283/ 1625], loss: 1.322, per_step_time: 1471ms, lr: 1.5992164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:43,987 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.7% |█████████████████████████████████████████████ | 5.43611 samples/s/p 0:32:54 } +2024-07-26 00:40:46,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 285/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.5974456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:46,937 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% 
|█████████████████████████████████████████████ | 5.43614 samples/s/p 0:32:51 } +2024-07-26 00:40:49,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 287/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 1.5956773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:49,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43964 samples/s/p 0:32:47 } +2024-07-26 00:40:52,838 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 289/ 1625], loss: 1.068, per_step_time: 1473ms, lr: 1.5939098e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:52,839 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43066 samples/s/p 0:32:48 } +2024-07-26 00:40:55,790 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 291/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.5921476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:55,791 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43294 samples/s/p 0:32:44 } +2024-07-26 00:40:58,739 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 293/ 1625], loss: 1.281, per_step_time: 1470ms, lr: 1.590387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:40:58,739 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43849 samples/s/p 0:32:39 } +2024-07-26 00:41:01,688 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 295/ 1625], loss: 1.215, per_step_time: 1470ms, lr: 1.5886292e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:01,688 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% 
|█████████████████████████████████████████████ | 5.43864 samples/s/p 0:32:36 } +2024-07-26 00:41:04,639 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 297/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.5868729e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:04,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.43370 samples/s/p 0:32:35 } +2024-07-26 00:41:07,593 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 299/ 1625], loss: 1.146, per_step_time: 1473ms, lr: 1.5851193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:07,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.8% |█████████████████████████████████████████████ | 5.42999 samples/s/p 0:32:33 } +2024-07-26 00:41:10,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 301/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 1.58337e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:10,544 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.43647 samples/s/p 0:32:28 } +2024-07-26 00:41:13,494 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 303/ 1625], loss: 1.117, per_step_time: 1471ms, lr: 1.5816208e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:13,494 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.43684 samples/s/p 0:32:25 } +2024-07-26 00:41:16,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 305/ 1625], loss: 1.159, per_step_time: 1470ms, lr: 1.5798759e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:16,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% 
|█████████████████████████████████████████████ | 5.44113 samples/s/p 0:32:20 } +2024-07-26 00:41:19,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 307/ 1625], loss: 1.111, per_step_time: 1472ms, lr: 1.5781335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:19,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.43466 samples/s/p 0:32:20 } +2024-07-26 00:41:22,345 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 309/ 1625], loss: 1.203, per_step_time: 1473ms, lr: 1.5763919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:22,346 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.43039 samples/s/p 0:32:18 } +2024-07-26 00:41:25,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 311/ 1625], loss: 0.902, per_step_time: 1470ms, lr: 1.5746565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:25,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.44100 samples/s/p 0:32:11 } +2024-07-26 00:41:28,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 313/ 1625], loss: 1.126, per_step_time: 1470ms, lr: 1.5729202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:28,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% |█████████████████████████████████████████████ | 5.44194 samples/s/p 0:32:08 } +2024-07-26 00:41:31,191 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 315/ 1625], loss: 1.332, per_step_time: 1472ms, lr: 1.5711882e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:31,192 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 91.9% 
|█████████████████████████████████████████████ | 5.43360 samples/s/p 0:32:08 } +2024-07-26 00:41:34,141 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 317/ 1625], loss: 1.299, per_step_time: 1471ms, lr: 1.5694588e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:34,142 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.43747 samples/s/p 0:32:04 } +2024-07-26 00:41:37,091 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 319/ 1625], loss: 0.963, per_step_time: 1471ms, lr: 1.5677294e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:37,091 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.43741 samples/s/p 0:32:01 } +2024-07-26 00:41:40,042 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 321/ 1625], loss: 0.991, per_step_time: 1472ms, lr: 1.5660053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:40,042 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.43458 samples/s/p 0:31:59 } +2024-07-26 00:41:42,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 323/ 1625], loss: 1.289, per_step_time: 1472ms, lr: 1.5642827e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:42,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |█████████████████████████████████████████████ | 5.43215 samples/s/p 0:31:57 } +2024-07-26 00:41:45,942 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 325/ 1625], loss: 1.059, per_step_time: 1470ms, lr: 1.5625645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:45,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% 
|██████████████████████████████████████████████ | 5.43955 samples/s/p 0:31:51 } +2024-07-26 00:41:48,895 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 327/ 1625], loss: 1.026, per_step_time: 1472ms, lr: 1.5608464e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:48,896 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.43110 samples/s/p 0:31:51 } +2024-07-26 00:41:51,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 329/ 1625], loss: 0.977, per_step_time: 1471ms, lr: 1.5591326e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:51,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.43561 samples/s/p 0:31:47 } +2024-07-26 00:41:54,796 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 331/ 1625], loss: 1.156, per_step_time: 1471ms, lr: 1.5574204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:54,797 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.43553 samples/s/p 0:31:44 } +2024-07-26 00:41:57,746 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 333/ 1625], loss: 0.999, per_step_time: 1471ms, lr: 1.55571e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:41:57,746 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.0% |██████████████████████████████████████████████ | 5.43774 samples/s/p 0:31:40 } +2024-07-26 00:42:00,697 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 335/ 1625], loss: 1.131, per_step_time: 1471ms, lr: 1.554004e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:00,697 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% 
|██████████████████████████████████████████████ | 5.43501 samples/s/p 0:31:38 } +2024-07-26 00:42:03,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 337/ 1625], loss: 1.145, per_step_time: 1471ms, lr: 1.5523005e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:03,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.43652 samples/s/p 0:31:35 } +2024-07-26 00:42:06,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 339/ 1625], loss: 0.954, per_step_time: 1474ms, lr: 1.5505988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:06,602 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.42692 samples/s/p 0:31:35 } +2024-07-26 00:42:09,551 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 341/ 1625], loss: 1.227, per_step_time: 1470ms, lr: 1.5488988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:09,551 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.43880 samples/s/p 0:31:28 } +2024-07-26 00:42:12,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 343/ 1625], loss: 1.125, per_step_time: 1470ms, lr: 1.547204e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:12,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.43864 samples/s/p 0:31:25 } +2024-07-26 00:42:15,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 345/ 1625], loss: 1.234, per_step_time: 1472ms, lr: 1.54551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:15,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% 
|██████████████████████████████████████████████ | 5.43243 samples/s/p 0:31:24 } +2024-07-26 00:42:18,403 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 347/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 1.5438169e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:18,404 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.43380 samples/s/p 0:31:21 } +2024-07-26 00:42:21,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 349/ 1625], loss: 1.109, per_step_time: 1472ms, lr: 1.542129e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:21,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.1% |██████████████████████████████████████████████ | 5.43276 samples/s/p 0:31:18 } +2024-07-26 00:42:24,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 351/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.5404419e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:24,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43198 samples/s/p 0:31:16 } +2024-07-26 00:42:27,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 353/ 1625], loss: 1.087, per_step_time: 1471ms, lr: 1.5387584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:27,259 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43492 samples/s/p 0:31:12 } +2024-07-26 00:42:30,212 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 355/ 1625], loss: 1.206, per_step_time: 1473ms, lr: 1.5370773e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:30,212 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% 
|██████████████████████████████████████████████ | 5.43047 samples/s/p 0:31:10 } +2024-07-26 00:42:33,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 357/ 1625], loss: 1.248, per_step_time: 1470ms, lr: 1.535399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:33,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.44171 samples/s/p 0:31:04 } +2024-07-26 00:42:36,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 359/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.5337239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:36,108 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43821 samples/s/p 0:31:02 } +2024-07-26 00:42:39,058 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 361/ 1625], loss: 1.217, per_step_time: 1471ms, lr: 1.5320508e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:39,059 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43578 samples/s/p 0:31:00 } +2024-07-26 00:42:42,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 363/ 1625], loss: 1.280, per_step_time: 1471ms, lr: 1.5303801e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:42,008 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% |██████████████████████████████████████████████ | 5.43795 samples/s/p 0:30:56 } +2024-07-26 00:42:44,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 365/ 1625], loss: 1.150, per_step_time: 1474ms, lr: 1.5287121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:44,964 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.2% 
|██████████████████████████████████████████████ | 5.42529 samples/s/p 0:30:57 } +2024-07-26 00:42:47,915 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 367/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.5270457e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:47,916 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43333 samples/s/p 0:30:52 } +2024-07-26 00:42:50,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 369/ 1625], loss: 1.179, per_step_time: 1471ms, lr: 1.5253838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:50,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43579 samples/s/p 0:30:48 } +2024-07-26 00:42:53,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 371/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 1.5237226e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:53,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43547 samples/s/p 0:30:45 } +2024-07-26 00:42:56,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 373/ 1625], loss: 1.151, per_step_time: 1472ms, lr: 1.5220651e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:56,768 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43319 samples/s/p 0:30:43 } +2024-07-26 00:42:59,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 375/ 1625], loss: 1.138, per_step_time: 1472ms, lr: 1.5204091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:42:59,720 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% 
|██████████████████████████████████████████████ | 5.43313 samples/s/p 0:30:40 } +2024-07-26 00:43:02,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 377/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.5187566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:02,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43166 samples/s/p 0:30:38 } +2024-07-26 00:43:05,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 379/ 1625], loss: 1.029, per_step_time: 1471ms, lr: 1.5171067e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:05,622 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.43687 samples/s/p 0:30:33 } +2024-07-26 00:43:08,569 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 381/ 1625], loss: 1.298, per_step_time: 1470ms, lr: 1.5154585e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:08,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.3% |██████████████████████████████████████████████ | 5.44114 samples/s/p 0:30:29 } +2024-07-26 00:43:11,523 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 383/ 1625], loss: 1.195, per_step_time: 1473ms, lr: 1.5138147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:11,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.43000 samples/s/p 0:30:29 } +2024-07-26 00:43:14,471 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 385/ 1625], loss: 1.089, per_step_time: 1470ms, lr: 1.5121725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:14,471 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% 
|██████████████████████████████████████████████ | 5.44084 samples/s/p 0:30:23 } +2024-07-26 00:43:17,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 387/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.5105331e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:17,423 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.43223 samples/s/p 0:30:23 } +2024-07-26 00:43:20,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 389/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.5088945e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:20,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.43270 samples/s/p 0:30:20 } +2024-07-26 00:43:23,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 391/ 1625], loss: 0.913, per_step_time: 1471ms, lr: 1.5072601e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:23,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.43485 samples/s/p 0:30:16 } +2024-07-26 00:43:26,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 393/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 1.5056283e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:26,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.43715 samples/s/p 0:30:12 } +2024-07-26 00:43:29,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 395/ 1625], loss: 1.270, per_step_time: 1470ms, lr: 1.5039984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:29,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% 
|██████████████████████████████████████████████ | 5.43875 samples/s/p 0:30:09 } +2024-07-26 00:43:32,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 397/ 1625], loss: 1.083, per_step_time: 1474ms, lr: 1.5023718e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:32,182 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.4% |██████████████████████████████████████████████ | 5.42417 samples/s/p 0:30:11 } +2024-07-26 00:43:35,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 399/ 1625], loss: 1.103, per_step_time: 1470ms, lr: 1.5007479e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:35,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43909 samples/s/p 0:30:03 } +2024-07-26 00:43:38,081 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 401/ 1625], loss: 1.182, per_step_time: 1471ms, lr: 1.4991265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:38,081 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43534 samples/s/p 0:30:01 } +2024-07-26 00:43:41,031 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 403/ 1625], loss: 1.038, per_step_time: 1471ms, lr: 1.4975077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:41,032 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43505 samples/s/p 0:29:58 } +2024-07-26 00:43:43,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 405/ 1625], loss: 1.083, per_step_time: 1471ms, lr: 1.4958907e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:43,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% 
|██████████████████████████████████████████████ | 5.43776 samples/s/p 0:29:54 } +2024-07-26 00:43:46,930 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 407/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 1.4942771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:46,931 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43817 samples/s/p 0:29:51 } +2024-07-26 00:43:49,879 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 409/ 1625], loss: 1.046, per_step_time: 1470ms, lr: 1.4926661e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:49,879 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43908 samples/s/p 0:29:48 } +2024-07-26 00:43:52,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 411/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 1.4910568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:52,829 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43763 samples/s/p 0:29:46 } +2024-07-26 00:43:55,777 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 413/ 1625], loss: 1.216, per_step_time: 1470ms, lr: 1.489451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:55,777 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.5% |██████████████████████████████████████████████ | 5.43886 samples/s/p 0:29:42 } +2024-07-26 00:43:58,729 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 415/ 1625], loss: 1.257, per_step_time: 1472ms, lr: 1.4878469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:43:58,730 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% 
|██████████████████████████████████████████████ | 5.43181 samples/s/p 0:29:42 } +2024-07-26 00:44:01,677 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 417/ 1625], loss: 1.188, per_step_time: 1470ms, lr: 1.4862454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:01,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.44053 samples/s/p 0:29:36 } +2024-07-26 00:44:04,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 419/ 1625], loss: 1.162, per_step_time: 1471ms, lr: 1.4846482e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:04,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43747 samples/s/p 0:29:34 } +2024-07-26 00:44:07,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 421/ 1625], loss: 1.137, per_step_time: 1471ms, lr: 1.4830528e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:07,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43809 samples/s/p 0:29:31 } +2024-07-26 00:44:10,527 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 423/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.4814591e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:10,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43455 samples/s/p 0:29:29 } +2024-07-26 00:44:13,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 425/ 1625], loss: 1.126, per_step_time: 1469ms, lr: 1.4798671e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:13,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% 
|██████████████████████████████████████████████ | 5.44489 samples/s/p 0:29:23 } +2024-07-26 00:44:16,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 427/ 1625], loss: 1.106, per_step_time: 1471ms, lr: 1.4782795e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:16,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43517 samples/s/p 0:29:23 } +2024-07-26 00:44:19,374 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 429/ 1625], loss: 1.321, per_step_time: 1471ms, lr: 1.4766936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:19,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.6% |██████████████████████████████████████████████ | 5.43535 samples/s/p 0:29:20 } +2024-07-26 00:44:22,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 431/ 1625], loss: 1.271, per_step_time: 1472ms, lr: 1.475112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:22,326 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43360 samples/s/p 0:29:17 } +2024-07-26 00:44:25,278 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 433/ 1625], loss: 1.153, per_step_time: 1472ms, lr: 1.4735303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:25,278 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43182 samples/s/p 0:29:15 } +2024-07-26 00:44:28,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 435/ 1625], loss: 1.213, per_step_time: 1472ms, lr: 1.471953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:28,230 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% 
|██████████████████████████████████████████████ | 5.43388 samples/s/p 0:29:11 } +2024-07-26 00:44:31,183 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 437/ 1625], loss: 1.232, per_step_time: 1473ms, lr: 1.4703784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:31,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43061 samples/s/p 0:29:10 } +2024-07-26 00:44:34,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 439/ 1625], loss: 1.077, per_step_time: 1473ms, lr: 1.4688054e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:34,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.42964 samples/s/p 0:29:07 } +2024-07-26 00:44:37,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 441/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 1.4672358e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:37,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43697 samples/s/p 0:29:02 } +2024-07-26 00:44:40,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 443/ 1625], loss: 1.231, per_step_time: 1473ms, lr: 1.4656689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:40,040 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% |██████████████████████████████████████████████ | 5.43017 samples/s/p 0:29:01 } +2024-07-26 00:44:42,993 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 445/ 1625], loss: 1.142, per_step_time: 1473ms, lr: 1.4641038e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:42,993 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.7% 
|██████████████████████████████████████████████ | 5.43028 samples/s/p 0:28:58 } +2024-07-26 00:44:45,943 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 447/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 1.4625411e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:45,943 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43644 samples/s/p 0:28:53 } +2024-07-26 00:44:48,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 449/ 1625], loss: 1.108, per_step_time: 1471ms, lr: 1.4609811e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:48,893 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43698 samples/s/p 0:28:50 } +2024-07-26 00:44:51,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 451/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 1.4594247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:51,845 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43318 samples/s/p 0:28:48 } +2024-07-26 00:44:54,797 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 453/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 1.4578698e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:54,798 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43117 samples/s/p 0:28:46 } +2024-07-26 00:44:57,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 455/ 1625], loss: 1.253, per_step_time: 1472ms, lr: 1.4563193e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:44:57,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% 
|██████████████████████████████████████████████ | 5.43221 samples/s/p 0:28:43 } +2024-07-26 00:45:00,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 457/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.4547705e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:00,701 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43557 samples/s/p 0:28:39 } +2024-07-26 00:45:03,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 459/ 1625], loss: 1.132, per_step_time: 1474ms, lr: 1.4532227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:03,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.42483 samples/s/p 0:28:39 } +2024-07-26 00:45:06,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 461/ 1625], loss: 1.230, per_step_time: 1471ms, lr: 1.451679e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:06,607 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43819 samples/s/p 0:28:32 } +2024-07-26 00:45:09,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 463/ 1625], loss: 1.205, per_step_time: 1471ms, lr: 1.4501372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:09,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.8% |██████████████████████████████████████████████ | 5.43811 samples/s/p 0:28:29 } +2024-07-26 00:45:12,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 465/ 1625], loss: 1.068, per_step_time: 1470ms, lr: 1.4485988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:12,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% 
|██████████████████████████████████████████████ | 5.43863 samples/s/p 0:28:26 } +2024-07-26 00:45:15,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 467/ 1625], loss: 1.200, per_step_time: 1472ms, lr: 1.447063e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:15,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.43447 samples/s/p 0:28:24 } +2024-07-26 00:45:18,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 469/ 1625], loss: 0.997, per_step_time: 1469ms, lr: 1.4455297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:18,403 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.44262 samples/s/p 0:28:19 } +2024-07-26 00:45:21,355 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 471/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.4439984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:21,356 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.43116 samples/s/p 0:28:19 } +2024-07-26 00:45:24,301 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 473/ 1625], loss: 1.298, per_step_time: 1469ms, lr: 1.4424686e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:24,301 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.44456 samples/s/p 0:28:12 } +2024-07-26 00:45:27,253 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 475/ 1625], loss: 1.244, per_step_time: 1472ms, lr: 1.4409432e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:27,253 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% 
|██████████████████████████████████████████████ | 5.43221 samples/s/p 0:28:13 } +2024-07-26 00:45:30,204 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 477/ 1625], loss: 1.009, per_step_time: 1472ms, lr: 1.4394203e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:30,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.43438 samples/s/p 0:28:09 } +2024-07-26 00:45:33,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 479/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 1.4378983e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:33,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 92.9% |██████████████████████████████████████████████ | 5.44072 samples/s/p 0:28:05 } +2024-07-26 00:45:36,103 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 481/ 1625], loss: 1.021, per_step_time: 1472ms, lr: 1.4363816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:36,103 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.43459 samples/s/p 0:28:04 } +2024-07-26 00:45:39,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 483/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 1.4348656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:39,052 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.43793 samples/s/p 0:28:00 } +2024-07-26 00:45:42,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 485/ 1625], loss: 1.228, per_step_time: 1473ms, lr: 1.433354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:42,006 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% 
|██████████████████████████████████████████████ | 5.42975 samples/s/p 0:27:59 } +2024-07-26 00:45:44,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 487/ 1625], loss: 1.170, per_step_time: 1470ms, lr: 1.4318424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:44,954 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.43942 samples/s/p 0:27:53 } +2024-07-26 00:45:47,903 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 489/ 1625], loss: 1.166, per_step_time: 1470ms, lr: 1.4303342e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:47,903 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.43917 samples/s/p 0:27:50 } +2024-07-26 00:45:50,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 491/ 1625], loss: 1.108, per_step_time: 1477ms, lr: 1.4288304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:50,866 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.41350 samples/s/p 0:27:55 } +2024-07-26 00:45:53,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 493/ 1625], loss: 1.139, per_step_time: 1472ms, lr: 1.4273274e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:53,818 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% |██████████████████████████████████████████████ | 5.43115 samples/s/p 0:27:47 } +2024-07-26 00:45:56,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 495/ 1625], loss: 1.028, per_step_time: 1470ms, lr: 1.4258262e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:56,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.0% 
|██████████████████████████████████████████████ | 5.44182 samples/s/p 0:27:41 } +2024-07-26 00:45:59,715 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 497/ 1625], loss: 1.102, per_step_time: 1471ms, lr: 1.4243302e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:45:59,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43757 samples/s/p 0:27:39 } +2024-07-26 00:46:02,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 499/ 1625], loss: 1.288, per_step_time: 1471ms, lr: 1.4228359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:02,666 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43495 samples/s/p 0:27:37 } +2024-07-26 00:46:05,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 501/ 1625], loss: 1.102, per_step_time: 1475ms, lr: 1.4213441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:05,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.42132 samples/s/p 0:27:38 } +2024-07-26 00:46:08,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 503/ 1625], loss: 1.304, per_step_time: 1471ms, lr: 1.4198541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:08,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43492 samples/s/p 0:27:31 } +2024-07-26 00:46:11,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 505/ 1625], loss: 0.921, per_step_time: 1471ms, lr: 1.4183668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:11,524 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% 
|██████████████████████████████████████████████ | 5.43767 samples/s/p 0:27:27 } +2024-07-26 00:46:14,475 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 507/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.4168819e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:14,476 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43429 samples/s/p 0:27:25 } +2024-07-26 00:46:17,424 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 509/ 1625], loss: 1.270, per_step_time: 1471ms, lr: 1.4154006e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:17,425 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43808 samples/s/p 0:27:21 } +2024-07-26 00:46:20,375 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 511/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.4139218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:20,375 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.1% |██████████████████████████████████████████████ | 5.43612 samples/s/p 0:27:19 } +2024-07-26 00:46:23,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 513/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 1.4124456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:23,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.43347 samples/s/p 0:27:17 } +2024-07-26 00:46:26,276 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 515/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 1.4109712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:26,276 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% 
|██████████████████████████████████████████████ | 5.43667 samples/s/p 0:27:13 } +2024-07-26 00:46:29,228 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 517/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.4094985e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:29,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.43162 samples/s/p 0:27:11 } +2024-07-26 00:46:32,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 519/ 1625], loss: 1.180, per_step_time: 1474ms, lr: 1.4080318e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:32,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.42533 samples/s/p 0:27:10 } +2024-07-26 00:46:35,138 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 521/ 1625], loss: 1.078, per_step_time: 1473ms, lr: 1.4065643e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:35,138 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.43042 samples/s/p 0:27:06 } +2024-07-26 00:46:38,093 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 523/ 1625], loss: 1.083, per_step_time: 1474ms, lr: 1.405102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:38,094 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.42654 samples/s/p 0:27:04 } +2024-07-26 00:46:41,045 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 525/ 1625], loss: 1.080, per_step_time: 1472ms, lr: 1.4036414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:41,045 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% 
|██████████████████████████████████████████████ | 5.43394 samples/s/p 0:26:59 } +2024-07-26 00:46:43,994 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 527/ 1625], loss: 1.143, per_step_time: 1471ms, lr: 1.4021816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:43,994 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.2% |██████████████████████████████████████████████ | 5.43777 samples/s/p 0:26:55 } +2024-07-26 00:46:46,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 529/ 1625], loss: 1.156, per_step_time: 1469ms, lr: 1.4007279e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:46,941 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.44252 samples/s/p 0:26:51 } +2024-07-26 00:46:49,890 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 531/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.3992742e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:49,891 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43804 samples/s/p 0:26:49 } +2024-07-26 00:46:52,842 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 533/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 1.3978214e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:52,843 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43285 samples/s/p 0:26:47 } +2024-07-26 00:46:55,792 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 535/ 1625], loss: 1.363, per_step_time: 1471ms, lr: 1.3963754e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:55,792 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% 
|██████████████████████████████████████████████ | 5.43722 samples/s/p 0:26:43 } +2024-07-26 00:46:58,741 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 537/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 1.3949305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:46:58,742 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43803 samples/s/p 0:26:40 } +2024-07-26 00:47:01,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 539/ 1625], loss: 1.112, per_step_time: 1474ms, lr: 1.3934862e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:01,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.42633 samples/s/p 0:26:41 } +2024-07-26 00:47:04,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 541/ 1625], loss: 1.221, per_step_time: 1470ms, lr: 1.3920463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:04,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43848 samples/s/p 0:26:34 } +2024-07-26 00:47:07,602 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 543/ 1625], loss: 1.084, per_step_time: 1471ms, lr: 1.3906099e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:07,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.3% |██████████████████████████████████████████████ | 5.43779 samples/s/p 0:26:31 } +2024-07-26 00:47:10,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 545/ 1625], loss: 1.096, per_step_time: 1471ms, lr: 1.3891744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:10,554 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% 
|██████████████████████████████████████████████ | 5.43493 samples/s/p 0:26:29 } +2024-07-26 00:47:13,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 547/ 1625], loss: 0.980, per_step_time: 1469ms, lr: 1.3877423e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:13,500 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.44235 samples/s/p 0:26:24 } +2024-07-26 00:47:16,450 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 549/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.3863128e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:16,450 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43635 samples/s/p 0:26:23 } +2024-07-26 00:47:19,400 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 551/ 1625], loss: 1.289, per_step_time: 1471ms, lr: 1.3848859e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:19,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43699 samples/s/p 0:26:20 } +2024-07-26 00:47:22,350 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 553/ 1625], loss: 1.176, per_step_time: 1471ms, lr: 1.3834616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:22,350 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43726 samples/s/p 0:26:17 } +2024-07-26 00:47:25,302 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 555/ 1625], loss: 1.063, per_step_time: 1472ms, lr: 1.3820398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:25,302 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% 
|██████████████████████████████████████████████ | 5.43224 samples/s/p 0:26:15 } +2024-07-26 00:47:28,251 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 557/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.3806199e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:28,252 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43729 samples/s/p 0:26:11 } +2024-07-26 00:47:31,203 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 559/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 1.3792041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:31,204 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.4% |██████████████████████████████████████████████ | 5.43290 samples/s/p 0:26:09 } +2024-07-26 00:47:34,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 561/ 1625], loss: 1.045, per_step_time: 1469ms, lr: 1.3777885e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:34,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.44448 samples/s/p 0:26:03 } +2024-07-26 00:47:37,100 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 563/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.3763797e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:37,100 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.43471 samples/s/p 0:26:03 } +2024-07-26 00:47:40,052 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 565/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 1.3749693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:40,053 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% 
|██████████████████████████████████████████████ | 5.43246 samples/s/p 0:26:00 } +2024-07-26 00:47:43,005 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 567/ 1625], loss: 1.047, per_step_time: 1472ms, lr: 1.3735623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:43,005 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.43171 samples/s/p 0:25:58 } +2024-07-26 00:47:45,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 569/ 1625], loss: 1.239, per_step_time: 1471ms, lr: 1.3721605e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:45,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.43617 samples/s/p 0:25:54 } +2024-07-26 00:47:48,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 571/ 1625], loss: 1.058, per_step_time: 1471ms, lr: 1.3707577e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:48,905 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.43743 samples/s/p 0:25:50 } +2024-07-26 00:47:51,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 573/ 1625], loss: 1.178, per_step_time: 1470ms, lr: 1.3693602e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:51,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% |██████████████████████████████████████████████ | 5.44061 samples/s/p 0:25:46 } +2024-07-26 00:47:54,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 575/ 1625], loss: 1.280, per_step_time: 1473ms, lr: 1.3679644e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:54,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.5% 
|██████████████████████████████████████████████ | 5.42921 samples/s/p 0:25:47 } +2024-07-26 00:47:57,757 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 577/ 1625], loss: 0.987, per_step_time: 1472ms, lr: 1.3665704e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:47:57,757 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43454 samples/s/p 0:25:42 } +2024-07-26 00:48:00,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 579/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 1.3651814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:00,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.44059 samples/s/p 0:25:38 } +2024-07-26 00:48:03,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 581/ 1625], loss: 1.156, per_step_time: 1472ms, lr: 1.3637925e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:03,656 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43466 samples/s/p 0:25:36 } +2024-07-26 00:48:06,606 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 583/ 1625], loss: 1.216, per_step_time: 1471ms, lr: 1.362408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:06,606 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43643 samples/s/p 0:25:33 } +2024-07-26 00:48:09,552 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 585/ 1625], loss: 0.924, per_step_time: 1469ms, lr: 1.3610252e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:09,552 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% 
|██████████████████████████████████████████████ | 5.44375 samples/s/p 0:25:28 } +2024-07-26 00:48:12,502 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 587/ 1625], loss: 1.157, per_step_time: 1471ms, lr: 1.3596441e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:12,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43694 samples/s/p 0:25:27 } +2024-07-26 00:48:15,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 589/ 1625], loss: 1.097, per_step_time: 1473ms, lr: 1.3582674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:15,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.42972 samples/s/p 0:25:26 } +2024-07-26 00:48:18,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 591/ 1625], loss: 1.248, per_step_time: 1475ms, lr: 1.3568914e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:18,413 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.42369 samples/s/p 0:25:25 } +2024-07-26 00:48:21,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 593/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.355519e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:21,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.6% |██████████████████████████████████████████████ | 5.43727 samples/s/p 0:25:18 } +2024-07-26 00:48:24,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 595/ 1625], loss: 1.040, per_step_time: 1473ms, lr: 1.35415e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:24,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% 
|██████████████████████████████████████████████ | 5.42873 samples/s/p 0:25:17 } +2024-07-26 00:48:27,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 597/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 1.3527826e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:27,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.43186 samples/s/p 0:25:14 } +2024-07-26 00:48:30,224 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 599/ 1625], loss: 1.216, per_step_time: 1474ms, lr: 1.3514189e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:30,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.42673 samples/s/p 0:25:12 } +2024-07-26 00:48:33,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 601/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 1.3500568e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:33,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.43551 samples/s/p 0:25:07 } +2024-07-26 00:48:36,126 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 603/ 1625], loss: 1.080, per_step_time: 1472ms, lr: 1.3486964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:36,127 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.43371 samples/s/p 0:25:04 } +2024-07-26 00:48:39,077 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 605/ 1625], loss: 1.115, per_step_time: 1471ms, lr: 1.3473405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:39,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% 
|██████████████████████████████████████████████ | 5.43635 samples/s/p 0:25:01 } +2024-07-26 00:48:42,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 607/ 1625], loss: 1.273, per_step_time: 1470ms, lr: 1.3459869e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:42,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.44086 samples/s/p 0:24:56 } +2024-07-26 00:48:44,975 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 609/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 1.3446352e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:44,975 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.7% |██████████████████████████████████████████████ | 5.43644 samples/s/p 0:24:55 } +2024-07-26 00:48:47,928 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 611/ 1625], loss: 0.983, per_step_time: 1473ms, lr: 1.343287e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:47,929 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43019 samples/s/p 0:24:53 } +2024-07-26 00:48:50,875 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 613/ 1625], loss: 1.014, per_step_time: 1470ms, lr: 1.3419404e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:50,875 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.44218 samples/s/p 0:24:47 } +2024-07-26 00:48:53,824 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 615/ 1625], loss: 1.061, per_step_time: 1471ms, lr: 1.3405966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:53,825 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% 
|██████████████████████████████████████████████ | 5.43767 samples/s/p 0:24:45 } +2024-07-26 00:48:56,774 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 617/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 1.3392552e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:56,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43831 samples/s/p 0:24:42 } +2024-07-26 00:48:59,726 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 619/ 1625], loss: 1.299, per_step_time: 1472ms, lr: 1.3379181e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:48:59,727 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43226 samples/s/p 0:24:41 } +2024-07-26 00:49:02,678 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 621/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 1.3365811e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:02,678 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43332 samples/s/p 0:24:38 } +2024-07-26 00:49:05,628 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 623/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 1.3352493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:05,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% |██████████████████████████████████████████████ | 5.43532 samples/s/p 0:24:34 } +2024-07-26 00:49:08,577 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 625/ 1625], loss: 1.102, per_step_time: 1470ms, lr: 1.3339184e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:08,578 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.8% 
|██████████████████████████████████████████████ | 5.43862 samples/s/p 0:24:30 } +2024-07-26 00:49:11,528 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 627/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.3325899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:11,528 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43550 samples/s/p 0:24:28 } +2024-07-26 00:49:14,474 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 629/ 1625], loss: 1.174, per_step_time: 1469ms, lr: 1.331265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:14,475 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.44283 samples/s/p 0:24:23 } +2024-07-26 00:49:17,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 631/ 1625], loss: 1.140, per_step_time: 1472ms, lr: 1.3299427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:17,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43439 samples/s/p 0:24:23 } +2024-07-26 00:49:20,376 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 633/ 1625], loss: 1.240, per_step_time: 1471ms, lr: 1.3286221e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:20,376 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43532 samples/s/p 0:24:20 } +2024-07-26 00:49:23,326 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 635/ 1625], loss: 1.186, per_step_time: 1471ms, lr: 1.3273041e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:23,327 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% 
|██████████████████████████████████████████████ | 5.43605 samples/s/p 0:24:16 } +2024-07-26 00:49:26,275 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 637/ 1625], loss: 1.121, per_step_time: 1470ms, lr: 1.3259904e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:26,275 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43911 samples/s/p 0:24:13 } +2024-07-26 00:49:29,223 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 639/ 1625], loss: 1.079, per_step_time: 1470ms, lr: 1.3246776e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:29,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43999 samples/s/p 0:24:10 } +2024-07-26 00:49:32,175 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 641/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 1.3233682e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:32,175 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 93.9% |██████████████████████████████████████████████ | 5.43266 samples/s/p 0:24:09 } +2024-07-26 00:49:35,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 643/ 1625], loss: 1.094, per_step_time: 1470ms, lr: 1.3220614e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:35,123 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.44130 samples/s/p 0:24:03 } +2024-07-26 00:49:38,074 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 645/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.3207564e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:38,074 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% 
|██████████████████████████████████████████████ | 5.43359 samples/s/p 0:24:02 } +2024-07-26 00:49:41,046 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 647/ 1625], loss: 1.140, per_step_time: 1482ms, lr: 1.319454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:41,047 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.39514 samples/s/p 0:24:10 } +2024-07-26 00:49:43,998 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 649/ 1625], loss: 1.101, per_step_time: 1472ms, lr: 1.3181567e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:43,999 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |██████████████████████████████████████████████ | 5.43301 samples/s/p 0:23:57 } +2024-07-26 00:49:46,946 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 651/ 1625], loss: 1.088, per_step_time: 1470ms, lr: 1.3168603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:46,946 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.44079 samples/s/p 0:23:52 } +2024-07-26 00:49:49,894 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 653/ 1625], loss: 1.219, per_step_time: 1470ms, lr: 1.3155657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:49,895 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.43899 samples/s/p 0:23:49 } +2024-07-26 00:49:52,846 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 655/ 1625], loss: 1.174, per_step_time: 1472ms, lr: 1.3142752e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:52,846 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% 
|███████████████████████████████████████████████ | 5.43393 samples/s/p 0:23:48 } +2024-07-26 00:49:55,800 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 657/ 1625], loss: 1.220, per_step_time: 1473ms, lr: 1.3129866e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:55,801 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.0% |███████████████████████████████████████████████ | 5.42753 samples/s/p 0:23:46 } +2024-07-26 00:49:58,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 659/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.3116988e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:49:58,754 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43154 samples/s/p 0:23:42 } +2024-07-26 00:50:01,701 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 661/ 1625], loss: 1.179, per_step_time: 1470ms, lr: 1.3104171e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:01,702 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.44015 samples/s/p 0:23:37 } +2024-07-26 00:50:04,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 663/ 1625], loss: 1.039, per_step_time: 1471ms, lr: 1.3091354e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:04,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43723 samples/s/p 0:23:35 } +2024-07-26 00:50:07,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 665/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 1.3078563e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:07,603 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% 
|███████████████████████████████████████████████ | 5.43350 samples/s/p 0:23:33 } +2024-07-26 00:50:10,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 667/ 1625], loss: 1.189, per_step_time: 1472ms, lr: 1.3065833e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:10,556 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43147 samples/s/p 0:23:31 } +2024-07-26 00:50:13,505 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 669/ 1625], loss: 1.238, per_step_time: 1471ms, lr: 1.3053102e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:13,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43702 samples/s/p 0:23:26 } +2024-07-26 00:50:16,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 671/ 1625], loss: 1.032, per_step_time: 1472ms, lr: 1.3040398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:16,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43345 samples/s/p 0:23:24 } +2024-07-26 00:50:19,410 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 673/ 1625], loss: 1.191, per_step_time: 1472ms, lr: 1.302771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:19,411 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.1% |███████████████████████████████████████████████ | 5.43356 samples/s/p 0:23:21 } +2024-07-26 00:50:22,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 675/ 1625], loss: 1.163, per_step_time: 1469ms, lr: 1.3015066e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:22,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% 
|███████████████████████████████████████████████ | 5.44325 samples/s/p 0:23:16 } +2024-07-26 00:50:25,313 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 677/ 1625], loss: 1.006, per_step_time: 1473ms, lr: 1.3002439e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:25,314 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.42940 samples/s/p 0:23:16 } +2024-07-26 00:50:28,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 679/ 1625], loss: 1.173, per_step_time: 1472ms, lr: 1.2989838e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:28,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.43133 samples/s/p 0:23:13 } +2024-07-26 00:50:31,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 681/ 1625], loss: 1.322, per_step_time: 1471ms, lr: 1.2977271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:31,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.43814 samples/s/p 0:23:08 } +2024-07-26 00:50:34,167 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 683/ 1625], loss: 1.254, per_step_time: 1472ms, lr: 1.2964713e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:34,167 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.43452 samples/s/p 0:23:06 } +2024-07-26 00:50:37,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 685/ 1625], loss: 1.187, per_step_time: 1471ms, lr: 1.295219e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:37,117 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% 
|███████████████████████████████████████████████ | 5.43723 samples/s/p 0:23:03 } +2024-07-26 00:50:40,072 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 687/ 1625], loss: 1.003, per_step_time: 1473ms, lr: 1.2939702e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:40,072 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.42807 samples/s/p 0:23:02 } +2024-07-26 00:50:43,023 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 689/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 1.2927239e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:43,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.2% |███████████████████████████████████████████████ | 5.43482 samples/s/p 0:22:57 } +2024-07-26 00:50:45,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 691/ 1625], loss: 1.037, per_step_time: 1471ms, lr: 1.2914802e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:45,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43628 samples/s/p 0:22:54 } +2024-07-26 00:50:48,922 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 693/ 1625], loss: 0.969, per_step_time: 1471ms, lr: 1.2902383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:48,923 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43781 samples/s/p 0:22:51 } +2024-07-26 00:50:51,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 695/ 1625], loss: 1.115, per_step_time: 1470ms, lr: 1.2889989e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:51,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% 
|███████████████████████████████████████████████ | 5.44017 samples/s/p 0:22:47 } +2024-07-26 00:50:54,819 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 697/ 1625], loss: 1.107, per_step_time: 1470ms, lr: 1.2877638e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:54,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43851 samples/s/p 0:22:45 } +2024-07-26 00:50:57,771 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 699/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 1.2865305e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:50:57,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43420 samples/s/p 0:22:43 } +2024-07-26 00:51:00,719 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 701/ 1625], loss: 1.247, per_step_time: 1470ms, lr: 1.2852998e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:00,719 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.44063 samples/s/p 0:22:38 } +2024-07-26 00:51:03,667 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 703/ 1625], loss: 1.164, per_step_time: 1470ms, lr: 1.2840708e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:03,667 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% |███████████████████████████████████████████████ | 5.43962 samples/s/p 0:22:35 } +2024-07-26 00:51:06,618 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 705/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 1.2828461e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:06,618 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.3% 
|███████████████████████████████████████████████ | 5.43524 samples/s/p 0:22:34 } +2024-07-26 00:51:09,564 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 707/ 1625], loss: 1.046, per_step_time: 1469ms, lr: 1.2816215e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:09,565 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.44252 samples/s/p 0:22:29 } +2024-07-26 00:51:12,518 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 709/ 1625], loss: 1.102, per_step_time: 1473ms, lr: 1.2804003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:12,519 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.42930 samples/s/p 0:22:29 } +2024-07-26 00:51:15,469 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 711/ 1625], loss: 1.059, per_step_time: 1472ms, lr: 1.2791834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:15,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43387 samples/s/p 0:22:25 } +2024-07-26 00:51:18,421 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 713/ 1625], loss: 1.155, per_step_time: 1472ms, lr: 1.2779674e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:18,421 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43376 samples/s/p 0:22:22 } +2024-07-26 00:51:21,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 715/ 1625], loss: 1.180, per_step_time: 1470ms, lr: 1.2767548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:21,369 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% 
|███████████████████████████████████████████████ | 5.44038 samples/s/p 0:22:18 } +2024-07-26 00:51:24,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 717/ 1625], loss: 1.056, per_step_time: 1472ms, lr: 1.2755448e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:24,321 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43373 samples/s/p 0:22:16 } +2024-07-26 00:51:27,272 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 719/ 1625], loss: 1.092, per_step_time: 1472ms, lr: 1.2743375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:27,272 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43389 samples/s/p 0:22:13 } +2024-07-26 00:51:30,221 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 721/ 1625], loss: 1.169, per_step_time: 1471ms, lr: 1.2731327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:30,222 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43700 samples/s/p 0:22:10 } +2024-07-26 00:51:33,174 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 723/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 1.2719313e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:33,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.4% |███████████████████████████████████████████████ | 5.43185 samples/s/p 0:22:08 } +2024-07-26 00:51:36,122 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 725/ 1625], loss: 1.132, per_step_time: 1470ms, lr: 1.2707309e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:36,122 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% 
|███████████████████████████████████████████████ | 5.44003 samples/s/p 0:22:03 } +2024-07-26 00:51:39,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 727/ 1625], loss: 1.142, per_step_time: 1470ms, lr: 1.2695356e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:39,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43871 samples/s/p 0:22:00 } +2024-07-26 00:51:42,021 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 729/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 1.2683403e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:42,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43611 samples/s/p 0:21:58 } +2024-07-26 00:51:44,973 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 731/ 1625], loss: 1.098, per_step_time: 1472ms, lr: 1.2671485e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:44,974 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43223 samples/s/p 0:21:56 } +2024-07-26 00:51:47,925 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 733/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 1.2659592e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:47,925 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43354 samples/s/p 0:21:53 } +2024-07-26 00:51:50,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 735/ 1625], loss: 1.027, per_step_time: 1472ms, lr: 1.2647735e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:50,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% 
|███████████████████████████████████████████████ | 5.43440 samples/s/p 0:21:50 } +2024-07-26 00:51:53,827 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 737/ 1625], loss: 1.097, per_step_time: 1472ms, lr: 1.2635894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:53,827 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43391 samples/s/p 0:21:47 } +2024-07-26 00:51:56,780 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 739/ 1625], loss: 1.150, per_step_time: 1472ms, lr: 1.2624089e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:56,780 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.5% |███████████████████████████████████████████████ | 5.43163 samples/s/p 0:21:44 } +2024-07-26 00:51:59,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 741/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 1.26123e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:51:59,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.43407 samples/s/p 0:21:41 } +2024-07-26 00:52:02,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 743/ 1625], loss: 1.180, per_step_time: 1474ms, lr: 1.2600555e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:02,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.42537 samples/s/p 0:21:40 } +2024-07-26 00:52:05,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 745/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.258881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:05,637 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% 
|███████████████████████████████████████████████ | 5.43786 samples/s/p 0:21:34 } +2024-07-26 00:52:08,588 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 747/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 1.2577107e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:08,588 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.43456 samples/s/p 0:21:32 } +2024-07-26 00:52:11,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 749/ 1625], loss: 1.090, per_step_time: 1480ms, lr: 1.2565431e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:11,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.40217 samples/s/p 0:21:37 } +2024-07-26 00:52:14,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 751/ 1625], loss: 1.059, per_step_time: 1471ms, lr: 1.255378e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:14,506 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.43722 samples/s/p 0:21:25 } +2024-07-26 00:52:17,456 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 753/ 1625], loss: 1.254, per_step_time: 1471ms, lr: 1.2542147e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:17,456 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% |███████████████████████████████████████████████ | 5.43693 samples/s/p 0:21:23 } +2024-07-26 00:52:20,405 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 755/ 1625], loss: 1.334, per_step_time: 1471ms, lr: 1.2530548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:20,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.6% 
|███████████████████████████████████████████████ | 5.43690 samples/s/p 0:21:20 } +2024-07-26 00:52:23,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 757/ 1625], loss: 1.113, per_step_time: 1470ms, lr: 1.2518976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:23,354 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.44026 samples/s/p 0:21:16 } +2024-07-26 00:52:26,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 759/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 1.250743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:26,306 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43334 samples/s/p 0:21:15 } +2024-07-26 00:52:29,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 761/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.2495917e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:29,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43186 samples/s/p 0:21:12 } +2024-07-26 00:52:32,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 763/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 1.2484405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:32,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43432 samples/s/p 0:21:08 } +2024-07-26 00:52:35,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 765/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 1.2472946e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:35,160 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% 
|███████████████████████████████████████████████ | 5.43718 samples/s/p 0:21:05 } +2024-07-26 00:52:38,108 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 767/ 1625], loss: 1.031, per_step_time: 1470ms, lr: 1.2461494e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:38,109 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43850 samples/s/p 0:21:02 } +2024-07-26 00:52:41,057 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 769/ 1625], loss: 1.182, per_step_time: 1470ms, lr: 1.2450085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:41,057 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43871 samples/s/p 0:20:59 } +2024-07-26 00:52:44,008 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 771/ 1625], loss: 1.252, per_step_time: 1472ms, lr: 1.2438694e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:44,009 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.7% |███████████████████████████████████████████████ | 5.43410 samples/s/p 0:20:57 } +2024-07-26 00:52:46,959 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 773/ 1625], loss: 1.123, per_step_time: 1471ms, lr: 1.2427329e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:46,959 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43502 samples/s/p 0:20:54 } +2024-07-26 00:52:49,906 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 775/ 1625], loss: 1.140, per_step_time: 1470ms, lr: 1.2415982e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:52:49,907 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% 
|███████████████████████████████████████████████ | 5.44168 samples/s/p 0:20:49 } +2024-07-26 00:52:49,907 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-26 00:53:25,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 777/ 1625], loss: 1.305, per_step_time: 2003ms, lr: 1.2404677e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:25,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 3.99207 samples/s/p 0:28:19 } +2024-07-26 00:53:28,859 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 779/ 1625], loss: 1.212, per_step_time: 1472ms, lr: 1.2393398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:28,859 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43394 samples/s/p 0:20:45 } +2024-07-26 00:53:31,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 781/ 1625], loss: 1.010, per_step_time: 1472ms, lr: 1.2382137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:31,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43396 samples/s/p 0:20:42 } +2024-07-26 00:53:34,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 783/ 1625], loss: 1.222, per_step_time: 1471ms, lr: 1.2370901e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:34,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43539 samples/s/p 0:20:39 } +2024-07-26 00:53:37,711 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 785/ 1625], loss: 1.023, per_step_time: 1471ms, lr: 1.2359692e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:53:37,711 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43714 samples/s/p 0:20:35 } +2024-07-26 00:53:40,662 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 787/ 1625], loss: 1.113, per_step_time: 1472ms, lr: 1.2348517e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:40,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.8% |███████████████████████████████████████████████ | 5.43449 samples/s/p 0:20:33 } +2024-07-26 00:53:43,616 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 789/ 1625], loss: 1.307, per_step_time: 1473ms, lr: 1.2337359e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:43,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.42959 samples/s/p 0:20:31 } +2024-07-26 00:53:46,567 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 791/ 1625], loss: 1.160, per_step_time: 1472ms, lr: 1.2326236e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:46,567 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43465 samples/s/p 0:20:27 } +2024-07-26 00:53:49,516 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 793/ 1625], loss: 1.257, per_step_time: 1471ms, lr: 1.2315139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:49,516 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43820 samples/s/p 0:20:23 } +2024-07-26 00:53:52,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 795/ 1625], loss: 1.404, per_step_time: 1470ms, lr: 1.2304059e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:53:52,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43863 samples/s/p 0:20:20 } +2024-07-26 00:53:55,413 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 797/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 1.2293013e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:55,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43981 samples/s/p 0:20:17 } +2024-07-26 00:53:58,362 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 799/ 1625], loss: 1.213, per_step_time: 1470ms, lr: 1.2281994e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:53:58,363 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43860 samples/s/p 0:20:15 } +2024-07-26 00:54:01,312 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 801/ 1625], loss: 1.255, per_step_time: 1471ms, lr: 1.2271009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:01,313 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.43620 samples/s/p 0:20:12 } +2024-07-26 00:54:04,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 803/ 1625], loss: 1.184, per_step_time: 1474ms, lr: 1.2260016e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:04,270 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 94.9% |███████████████████████████████████████████████ | 5.42382 samples/s/p 0:20:12 } +2024-07-26 00:54:07,216 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 805/ 1625], loss: 1.183, per_step_time: 1470ms, lr: 1.2249092e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:54:07,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.44160 samples/s/p 0:20:05 } +2024-07-26 00:54:10,168 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 807/ 1625], loss: 1.168, per_step_time: 1472ms, lr: 1.2238168e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:10,168 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43346 samples/s/p 0:20:04 } +2024-07-26 00:54:13,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 809/ 1625], loss: 1.378, per_step_time: 1470ms, lr: 1.2227285e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:13,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.44045 samples/s/p 0:19:59 } +2024-07-26 00:54:16,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 811/ 1625], loss: 1.224, per_step_time: 1472ms, lr: 1.2216414e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:16,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43433 samples/s/p 0:19:58 } +2024-07-26 00:54:19,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 813/ 1625], loss: 1.160, per_step_time: 1471ms, lr: 1.2205584e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:19,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43632 samples/s/p 0:19:54 } +2024-07-26 00:54:21,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 815/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 1.2194764e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:54:21,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43662 samples/s/p 0:19:51 } +2024-07-26 00:54:24,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 817/ 1625], loss: 0.958, per_step_time: 1470ms, lr: 1.2183987e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:24,915 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.44089 samples/s/p 0:19:48 } +2024-07-26 00:54:27,865 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 819/ 1625], loss: 1.142, per_step_time: 1471ms, lr: 1.2173217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:27,865 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.0% |███████████████████████████████████████████████ | 5.43538 samples/s/p 0:19:46 } +2024-07-26 00:54:30,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 821/ 1625], loss: 1.135, per_step_time: 1469ms, lr: 1.2162501e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:30,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.44494 samples/s/p 0:19:41 } +2024-07-26 00:54:33,765 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 823/ 1625], loss: 1.115, per_step_time: 1473ms, lr: 1.2151784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:33,765 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.42896 samples/s/p 0:19:41 } +2024-07-26 00:54:36,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 825/ 1625], loss: 1.055, per_step_time: 1473ms, lr: 1.214111e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:54:36,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.43077 samples/s/p 0:19:38 } +2024-07-26 00:54:39,676 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 827/ 1625], loss: 1.006, per_step_time: 1475ms, lr: 1.2130454e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:39,676 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.42165 samples/s/p 0:19:37 } +2024-07-26 00:54:42,624 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 829/ 1625], loss: 1.075, per_step_time: 1470ms, lr: 1.2119832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:42,624 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.43983 samples/s/p 0:19:30 } +2024-07-26 00:54:45,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 831/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 1.2109227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:45,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.43218 samples/s/p 0:19:29 } +2024-07-26 00:54:48,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 833/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.2098657e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:48,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.43140 samples/s/p 0:19:26 } +2024-07-26 00:54:51,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 835/ 1625], loss: 0.949, per_step_time: 1475ms, lr: 1.2088104e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:54:51,488 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.1% |███████████████████████████████████████████████ | 5.42151 samples/s/p 0:19:25 } +2024-07-26 00:54:54,441 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 837/ 1625], loss: 1.201, per_step_time: 1472ms, lr: 1.2077595e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:54,441 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43153 samples/s/p 0:19:20 } +2024-07-26 00:54:57,392 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 839/ 1625], loss: 1.307, per_step_time: 1472ms, lr: 1.2067094e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:54:57,392 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43384 samples/s/p 0:19:17 } +2024-07-26 00:55:00,340 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 841/ 1625], loss: 1.252, per_step_time: 1470ms, lr: 1.2056628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:00,340 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.44039 samples/s/p 0:19:12 } +2024-07-26 00:55:03,290 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 843/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.2046196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:03,291 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43586 samples/s/p 0:19:10 } +2024-07-26 00:55:06,243 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 845/ 1625], loss: 1.211, per_step_time: 1472ms, lr: 1.2035764e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:55:06,243 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43221 samples/s/p 0:19:08 } +2024-07-26 00:55:09,195 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 847/ 1625], loss: 1.316, per_step_time: 1472ms, lr: 1.2025375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:09,196 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43253 samples/s/p 0:19:05 } +2024-07-26 00:55:12,147 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 849/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 1.2015031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:12,147 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.44000 samples/s/p 0:19:01 } +2024-07-26 00:55:15,097 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 851/ 1625], loss: 1.166, per_step_time: 1471ms, lr: 1.2004693e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:15,097 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43734 samples/s/p 0:18:58 } +2024-07-26 00:55:18,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 853/ 1625], loss: 0.971, per_step_time: 1471ms, lr: 1.1994383e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:18,049 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.2% |███████████████████████████████████████████████ | 5.43525 samples/s/p 0:18:56 } +2024-07-26 00:55:20,997 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 855/ 1625], loss: 1.100, per_step_time: 1470ms, lr: 1.198409e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:55:20,998 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.43866 samples/s/p 0:18:52 } +2024-07-26 00:55:23,954 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 857/ 1625], loss: 1.175, per_step_time: 1475ms, lr: 1.1973831e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:23,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.42313 samples/s/p 0:18:52 } +2024-07-26 00:55:26,908 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 859/ 1625], loss: 1.112, per_step_time: 1473ms, lr: 1.1963607e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:26,909 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.42956 samples/s/p 0:18:48 } +2024-07-26 00:55:29,867 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 861/ 1625], loss: 1.147, per_step_time: 1476ms, lr: 1.1953391e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:29,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.41922 samples/s/p 0:18:47 } +2024-07-26 00:55:32,816 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 863/ 1625], loss: 1.289, per_step_time: 1470ms, lr: 1.1943227e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:32,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.44016 samples/s/p 0:18:40 } +2024-07-26 00:55:35,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 865/ 1625], loss: 1.402, per_step_time: 1471ms, lr: 1.1933064e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:55:35,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.43587 samples/s/p 0:18:38 } +2024-07-26 00:55:38,718 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 867/ 1625], loss: 1.122, per_step_time: 1472ms, lr: 1.1922943e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:38,718 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.43288 samples/s/p 0:18:36 } +2024-07-26 00:55:41,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 869/ 1625], loss: 1.012, per_step_time: 1473ms, lr: 1.1912848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:41,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.3% |███████████████████████████████████████████████ | 5.43075 samples/s/p 0:18:33 } +2024-07-26 00:55:44,625 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 871/ 1625], loss: 1.115, per_step_time: 1472ms, lr: 1.1902771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:44,625 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43153 samples/s/p 0:18:30 } +2024-07-26 00:55:47,576 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 873/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.1892737e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:47,577 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43448 samples/s/p 0:18:27 } +2024-07-26 00:55:50,529 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 875/ 1625], loss: 1.133, per_step_time: 1472ms, lr: 1.188272e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:55:50,529 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43165 samples/s/p 0:18:24 } +2024-07-26 00:55:53,482 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 877/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 1.1872712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:53,482 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43322 samples/s/p 0:18:21 } +2024-07-26 00:55:56,435 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 879/ 1625], loss: 1.032, per_step_time: 1473ms, lr: 1.1862755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:56,435 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43090 samples/s/p 0:18:18 } +2024-07-26 00:55:59,386 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 881/ 1625], loss: 1.052, per_step_time: 1472ms, lr: 1.1852799e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:55:59,387 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43360 samples/s/p 0:18:15 } +2024-07-26 00:56:02,338 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 883/ 1625], loss: 1.095, per_step_time: 1472ms, lr: 1.1842894e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:02,338 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43317 samples/s/p 0:18:12 } +2024-07-26 00:56:05,289 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 885/ 1625], loss: 1.040, per_step_time: 1472ms, lr: 1.1833007e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:56:05,290 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.4% |███████████████████████████████████████████████ | 5.43388 samples/s/p 0:18:09 } +2024-07-26 00:56:08,239 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 887/ 1625], loss: 1.119, per_step_time: 1471ms, lr: 1.1823155e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:08,239 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43720 samples/s/p 0:18:05 } +2024-07-26 00:56:11,194 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 889/ 1625], loss: 1.222, per_step_time: 1474ms, lr: 1.181332e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:11,194 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.42737 samples/s/p 0:18:04 } +2024-07-26 00:56:14,144 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 891/ 1625], loss: 1.057, per_step_time: 1471ms, lr: 1.180351e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:14,145 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43540 samples/s/p 0:18:00 } +2024-07-26 00:56:17,095 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 893/ 1625], loss: 1.015, per_step_time: 1472ms, lr: 1.1793726e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:17,096 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43405 samples/s/p 0:17:57 } +2024-07-26 00:56:20,050 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 895/ 1625], loss: 1.148, per_step_time: 1473ms, lr: 1.178396e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:56:20,051 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.42768 samples/s/p 0:17:55 } +2024-07-26 00:56:23,001 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 897/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 1.1774246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:23,002 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43425 samples/s/p 0:17:51 } +2024-07-26 00:56:25,955 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 899/ 1625], loss: 1.249, per_step_time: 1473ms, lr: 1.1764548e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:25,955 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.42992 samples/s/p 0:17:49 } +2024-07-26 00:56:28,904 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 901/ 1625], loss: 1.104, per_step_time: 1470ms, lr: 1.1754878e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:28,904 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.5% |███████████████████████████████████████████████ | 5.43864 samples/s/p 0:17:44 } +2024-07-26 00:56:31,856 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 903/ 1625], loss: 1.073, per_step_time: 1472ms, lr: 1.1745224e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:31,856 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43250 samples/s/p 0:17:43 } +2024-07-26 00:56:34,810 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 905/ 1625], loss: 0.961, per_step_time: 1473ms, lr: 1.1735588e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:56:34,811 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43051 samples/s/p 0:17:40 } +2024-07-26 00:56:37,762 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 907/ 1625], loss: 1.132, per_step_time: 1472ms, lr: 1.1726003e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:37,763 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43259 samples/s/p 0:17:37 } +2024-07-26 00:56:40,717 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 909/ 1625], loss: 0.983, per_step_time: 1473ms, lr: 1.1716427e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:40,717 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.42841 samples/s/p 0:17:35 } +2024-07-26 00:56:43,670 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 911/ 1625], loss: 1.247, per_step_time: 1473ms, lr: 1.1706876e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:43,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43089 samples/s/p 0:17:31 } +2024-07-26 00:56:46,623 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 913/ 1625], loss: 1.013, per_step_time: 1472ms, lr: 1.169736e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:46,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43182 samples/s/p 0:17:28 } +2024-07-26 00:56:49,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 915/ 1625], loss: 1.259, per_step_time: 1470ms, lr: 1.168788e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:56:49,571 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.44098 samples/s/p 0:17:23 } +2024-07-26 00:56:52,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 917/ 1625], loss: 1.246, per_step_time: 1471ms, lr: 1.1678408e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:52,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.6% |███████████████████████████████████████████████ | 5.43650 samples/s/p 0:17:21 } +2024-07-26 00:56:55,473 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 919/ 1625], loss: 1.351, per_step_time: 1472ms, lr: 1.1668986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:55,473 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43291 samples/s/p 0:17:19 } +2024-07-26 00:56:58,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 921/ 1625], loss: 1.133, per_step_time: 1471ms, lr: 1.1659566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:56:58,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43596 samples/s/p 0:17:16 } +2024-07-26 00:57:01,373 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 923/ 1625], loss: 1.024, per_step_time: 1471ms, lr: 1.1650188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:01,373 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43746 samples/s/p 0:17:12 } +2024-07-26 00:57:04,325 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 925/ 1625], loss: 1.099, per_step_time: 1472ms, lr: 1.1640828e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:57:04,325 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43236 samples/s/p 0:17:10 } +2024-07-26 00:57:07,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 927/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 1.1631478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:07,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43874 samples/s/p 0:17:06 } +2024-07-26 00:57:10,227 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 929/ 1625], loss: 1.247, per_step_time: 1473ms, lr: 1.1622195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:10,227 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43077 samples/s/p 0:17:05 } +2024-07-26 00:57:13,179 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 931/ 1625], loss: 1.116, per_step_time: 1472ms, lr: 1.1612905e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:13,179 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43219 samples/s/p 0:17:02 } +2024-07-26 00:57:16,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 933/ 1625], loss: 0.981, per_step_time: 1472ms, lr: 1.1603656e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:16,132 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.7% |███████████████████████████████████████████████ | 5.43131 samples/s/p 0:16:59 } +2024-07-26 00:57:19,090 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 935/ 1625], loss: 1.391, per_step_time: 1475ms, lr: 1.1594426e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:57:19,090 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.42179 samples/s/p 0:16:58 } +2024-07-26 00:57:22,040 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 937/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 1.1585222e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:22,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43621 samples/s/p 0:16:52 } +2024-07-26 00:57:24,990 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 939/ 1625], loss: 1.020, per_step_time: 1471ms, lr: 1.1576052e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:24,991 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43587 samples/s/p 0:16:49 } +2024-07-26 00:57:27,941 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 941/ 1625], loss: 1.043, per_step_time: 1472ms, lr: 1.1566899e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:27,942 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43475 samples/s/p 0:16:46 } +2024-07-26 00:57:30,893 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 943/ 1625], loss: 1.395, per_step_time: 1472ms, lr: 1.1557781e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:30,894 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43247 samples/s/p 0:16:44 } +2024-07-26 00:57:33,847 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 945/ 1625], loss: 1.187, per_step_time: 1473ms, lr: 1.1548681e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:57:33,848 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.42921 samples/s/p 0:16:41 } +2024-07-26 00:57:36,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 947/ 1625], loss: 1.033, per_step_time: 1473ms, lr: 1.1539623e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:36,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43083 samples/s/p 0:16:38 } +2024-07-26 00:57:39,750 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 949/ 1625], loss: 1.067, per_step_time: 1470ms, lr: 1.1530583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:39,750 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.8% |███████████████████████████████████████████████ | 5.43949 samples/s/p 0:16:34 } +2024-07-26 00:57:42,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 951/ 1625], loss: 1.334, per_step_time: 1474ms, lr: 1.1521586e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:42,705 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.42728 samples/s/p 0:16:33 } +2024-07-26 00:57:45,656 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 953/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 1.1512581e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:45,657 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43483 samples/s/p 0:16:29 } +2024-07-26 00:57:48,603 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 955/ 1625], loss: 1.356, per_step_time: 1469ms, lr: 1.1503627e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:57:48,604 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.44252 samples/s/p 0:16:24 } +2024-07-26 00:57:51,555 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 957/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 1.1494699e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:51,555 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43310 samples/s/p 0:16:23 } +2024-07-26 00:57:54,506 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 959/ 1625], loss: 1.105, per_step_time: 1472ms, lr: 1.1485771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:54,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43379 samples/s/p 0:16:20 } +2024-07-26 00:57:57,460 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 961/ 1625], loss: 1.180, per_step_time: 1473ms, lr: 1.1476903e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:57:57,460 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43098 samples/s/p 0:16:18 } +2024-07-26 00:58:00,409 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 963/ 1625], loss: 1.110, per_step_time: 1471ms, lr: 1.1468053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:00,410 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43690 samples/s/p 0:16:14 } +2024-07-26 00:58:03,360 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 965/ 1625], loss: 0.989, per_step_time: 1471ms, lr: 1.1459211e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:58:03,360 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 95.9% |███████████████████████████████████████████████ | 5.43502 samples/s/p 0:16:11 } +2024-07-26 00:58:06,314 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 967/ 1625], loss: 1.185, per_step_time: 1473ms, lr: 1.1450413e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:06,315 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.42862 samples/s/p 0:16:09 } +2024-07-26 00:58:09,263 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 969/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.1441632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:09,263 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.43828 samples/s/p 0:16:05 } +2024-07-26 00:58:12,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 971/ 1625], loss: 1.397, per_step_time: 1472ms, lr: 1.1432877e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:12,215 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.43315 samples/s/p 0:16:02 } +2024-07-26 00:58:15,166 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 973/ 1625], loss: 1.293, per_step_time: 1472ms, lr: 1.1424165e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:15,166 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |███████████████████████████████████████████████ | 5.43467 samples/s/p 0:15:59 } +2024-07-26 00:58:18,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 975/ 1625], loss: 1.173, per_step_time: 1470ms, lr: 1.1415462e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 00:58:18,114 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.44053 samples/s/p 0:15:55 } +2024-07-26 00:58:21,065 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 977/ 1625], loss: 1.263, per_step_time: 1472ms, lr: 1.1406785e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:21,066 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.43290 samples/s/p 0:15:54 } +2024-07-26 00:58:24,013 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 979/ 1625], loss: 1.317, per_step_time: 1470ms, lr: 1.1398151e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:24,014 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.44172 samples/s/p 0:15:49 } +2024-07-26 00:58:26,962 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 981/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 1.1389534e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:26,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.43833 samples/s/p 0:15:47 } +2024-07-26 00:58:29,914 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 983/ 1625], loss: 1.186, per_step_time: 1472ms, lr: 1.1380953e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:29,914 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.0% |████████████████████████████████████████████████ | 5.43356 samples/s/p 0:15:45 } +2024-07-26 00:58:32,863 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 985/ 1625], loss: 1.219, per_step_time: 1471ms, lr: 1.1372379e-06, overflow 
cond: False, loss_scale: 1.0 +2024-07-26 00:58:32,863 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43780 samples/s/p 0:15:41 } +2024-07-26 00:58:35,815 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 987/ 1625], loss: 1.185, per_step_time: 1472ms, lr: 1.1363849e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:35,816 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43292 samples/s/p 0:15:39 } +2024-07-26 00:58:38,766 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 989/ 1625], loss: 1.171, per_step_time: 1471ms, lr: 1.1355327e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:38,766 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43601 samples/s/p 0:15:35 } +2024-07-26 00:58:41,714 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 991/ 1625], loss: 1.498, per_step_time: 1470ms, lr: 1.1346857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:41,715 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43966 samples/s/p 0:15:32 } +2024-07-26 00:58:44,661 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 993/ 1625], loss: 1.065, per_step_time: 1470ms, lr: 1.1338395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:44,662 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.44166 samples/s/p 0:15:29 } +2024-07-26 00:58:47,611 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 995/ 1625], loss: 1.396, per_step_time: 1471ms, lr: 1.1329969e-06, 
overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:47,611 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43782 samples/s/p 0:15:26 } +2024-07-26 00:58:50,561 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 997/ 1625], loss: 1.198, per_step_time: 1471ms, lr: 1.1321551e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:50,562 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43664 samples/s/p 0:15:24 } +2024-07-26 00:58:53,511 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 999/ 1625], loss: 1.153, per_step_time: 1471ms, lr: 1.1313176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:53,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.1% |████████████████████████████████████████████████ | 5.43611 samples/s/p 0:15:21 } +2024-07-26 00:58:56,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1001/ 1625], loss: 1.104, per_step_time: 1473ms, lr: 1.1304828e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:56,466 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.42794 samples/s/p 0:15:19 } +2024-07-26 00:58:59,417 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1003/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 1.1296487e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:58:59,417 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43467 samples/s/p 0:15:15 } +2024-07-26 00:59:02,368 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1005/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 
1.1288207e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:02,368 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43472 samples/s/p 0:15:12 } +2024-07-26 00:59:05,319 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1007/ 1625], loss: 1.142, per_step_time: 1472ms, lr: 1.1279928e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:05,319 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43424 samples/s/p 0:15:09 } +2024-07-26 00:59:08,269 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1009/ 1625], loss: 1.144, per_step_time: 1471ms, lr: 1.1271692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:08,269 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43703 samples/s/p 0:15:06 } +2024-07-26 00:59:11,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1011/ 1625], loss: 1.373, per_step_time: 1474ms, lr: 1.1263472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:11,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.42523 samples/s/p 0:15:05 } +2024-07-26 00:59:14,177 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1013/ 1625], loss: 1.167, per_step_time: 1472ms, lr: 1.1255271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:14,177 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43248 samples/s/p 0:15:01 } +2024-07-26 00:59:17,128 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1015/ 1625], loss: 1.164, per_step_time: 
1472ms, lr: 1.1247112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:17,128 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.2% |████████████████████████████████████████████████ | 5.43449 samples/s/p 0:14:57 } +2024-07-26 00:59:20,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1017/ 1625], loss: 1.015, per_step_time: 1470ms, lr: 1.1238961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:20,076 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.44076 samples/s/p 0:14:53 } +2024-07-26 00:59:23,025 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1019/ 1625], loss: 0.968, per_step_time: 1471ms, lr: 1.1230854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:23,025 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.43841 samples/s/p 0:14:51 } +2024-07-26 00:59:25,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1021/ 1625], loss: 1.212, per_step_time: 1473ms, lr: 1.1222766e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:25,980 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.42782 samples/s/p 0:14:50 } +2024-07-26 00:59:28,934 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1023/ 1625], loss: 1.166, per_step_time: 1473ms, lr: 1.1214719e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:28,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.42805 samples/s/p 0:14:47 } +2024-07-26 00:59:31,881 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1025/ 1625], loss: 1.134, 
per_step_time: 1470ms, lr: 1.1206673e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:31,882 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.44089 samples/s/p 0:14:42 } +2024-07-26 00:59:34,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1027/ 1625], loss: 0.967, per_step_time: 1471ms, lr: 1.119867e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:34,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.43535 samples/s/p 0:14:40 } +2024-07-26 00:59:37,783 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1029/ 1625], loss: 1.174, per_step_time: 1471ms, lr: 1.1190692e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:37,783 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.43497 samples/s/p 0:14:37 } +2024-07-26 00:59:40,731 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1031/ 1625], loss: 1.034, per_step_time: 1470ms, lr: 1.1182733e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:40,731 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.3% |████████████████████████████████████████████████ | 5.43969 samples/s/p 0:14:33 } +2024-07-26 00:59:43,682 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1033/ 1625], loss: 1.197, per_step_time: 1471ms, lr: 1.1174816e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:43,682 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.43508 samples/s/p 0:14:31 } +2024-07-26 00:59:46,627 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1035/ 1625], 
loss: 1.089, per_step_time: 1469ms, lr: 1.1166908e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:46,628 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.44411 samples/s/p 0:14:26 } +2024-07-26 00:59:49,575 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1037/ 1625], loss: 0.916, per_step_time: 1470ms, lr: 1.1159034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:49,575 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.44142 samples/s/p 0:14:24 } +2024-07-26 00:59:52,522 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1039/ 1625], loss: 0.982, per_step_time: 1470ms, lr: 1.1151195e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:52,523 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.44105 samples/s/p 0:14:21 } +2024-07-26 00:59:55,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1041/ 1625], loss: 0.996, per_step_time: 1470ms, lr: 1.1143366e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:55,470 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.44108 samples/s/p 0:14:18 } +2024-07-26 00:59:58,423 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1043/ 1625], loss: 1.281, per_step_time: 1472ms, lr: 1.1135578e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 00:59:58,424 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.43131 samples/s/p 0:14:17 } +2024-07-26 01:00:01,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 
1045/ 1625], loss: 1.054, per_step_time: 1474ms, lr: 1.11278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:01,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.42721 samples/s/p 0:14:14 } +2024-07-26 01:00:04,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1047/ 1625], loss: 1.175, per_step_time: 1472ms, lr: 1.1120056e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:04,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.4% |████████████████████████████████████████████████ | 5.43306 samples/s/p 0:14:11 } +2024-07-26 01:00:07,279 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1049/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 1.1112346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:07,279 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.44089 samples/s/p 0:14:06 } +2024-07-26 01:00:10,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1051/ 1625], loss: 1.026, per_step_time: 1473ms, lr: 1.1104663e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:10,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43031 samples/s/p 0:14:05 } +2024-07-26 01:00:13,182 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1053/ 1625], loss: 1.065, per_step_time: 1471ms, lr: 1.1096997e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:13,183 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43700 samples/s/p 0:14:01 } +2024-07-26 01:00:16,134 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 
10], step:[ 1055/ 1625], loss: 1.158, per_step_time: 1472ms, lr: 1.1089375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:16,135 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43235 samples/s/p 0:13:59 } +2024-07-26 01:00:19,085 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1057/ 1625], loss: 1.181, per_step_time: 1471ms, lr: 1.108176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:19,085 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43588 samples/s/p 0:13:55 } +2024-07-26 01:00:22,041 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1059/ 1625], loss: 1.398, per_step_time: 1474ms, lr: 1.1074172e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:22,041 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.42519 samples/s/p 0:13:54 } +2024-07-26 01:00:24,991 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1061/ 1625], loss: 1.104, per_step_time: 1471ms, lr: 1.1066627e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:24,992 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43664 samples/s/p 0:13:49 } +2024-07-26 01:00:27,944 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1063/ 1625], loss: 1.295, per_step_time: 1472ms, lr: 1.1059082e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:27,944 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.5% |████████████████████████████████████████████████ | 5.43211 samples/s/p 0:13:47 } +2024-07-26 01:00:30,897 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 10/ 10], step:[ 1065/ 1625], loss: 1.138, per_step_time: 1473ms, lr: 1.1051579e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:30,898 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.42953 samples/s/p 0:13:45 } +2024-07-26 01:00:33,851 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1067/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 1.1044121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:33,852 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.42899 samples/s/p 0:13:42 } +2024-07-26 01:00:36,802 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1069/ 1625], loss: 1.146, per_step_time: 1471ms, lr: 1.1036655e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:36,802 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.43565 samples/s/p 0:13:38 } +2024-07-26 01:00:39,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1071/ 1625], loss: 0.999, per_step_time: 1472ms, lr: 1.1029247e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:39,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.43412 samples/s/p 0:13:35 } +2024-07-26 01:00:42,707 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1073/ 1625], loss: 1.262, per_step_time: 1473ms, lr: 1.1021832e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:42,708 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.42918 samples/s/p 0:13:33 } +2024-07-26 01:00:45,661 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 10/ 10], step:[ 1075/ 1625], loss: 1.200, per_step_time: 1473ms, lr: 1.1014486e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:45,661 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.42985 samples/s/p 0:13:30 } +2024-07-26 01:00:48,612 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1077/ 1625], loss: 1.198, per_step_time: 1472ms, lr: 1.1007139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:48,612 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.43449 samples/s/p 0:13:26 } +2024-07-26 01:00:51,563 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1079/ 1625], loss: 1.194, per_step_time: 1472ms, lr: 1.0999811e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:51,563 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.6% |████████████████████████████████████████████████ | 5.43476 samples/s/p 0:13:23 } +2024-07-26 01:00:54,512 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1081/ 1625], loss: 1.155, per_step_time: 1471ms, lr: 1.0992525e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:54,512 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43750 samples/s/p 0:13:20 } +2024-07-26 01:00:57,465 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1083/ 1625], loss: 1.177, per_step_time: 1472ms, lr: 1.0985265e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:00:57,465 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43146 samples/s/p 0:13:18 } +2024-07-26 01:01:00,413 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1085/ 1625], loss: 1.108, per_step_time: 1470ms, lr: 1.0978031e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:00,414 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43911 samples/s/p 0:13:14 } +2024-07-26 01:01:03,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1087/ 1625], loss: 1.120, per_step_time: 1471ms, lr: 1.0970814e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:03,364 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43521 samples/s/p 0:13:11 } +2024-07-26 01:01:06,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1089/ 1625], loss: 1.148, per_step_time: 1472ms, lr: 1.0963632e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:06,316 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43325 samples/s/p 0:13:09 } +2024-07-26 01:01:09,265 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1091/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 1.0956476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:09,266 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43748 samples/s/p 0:13:05 } +2024-07-26 01:01:12,217 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1093/ 1625], loss: 1.149, per_step_time: 1472ms, lr: 1.0949345e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:12,217 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43427 samples/s/p 0:13:03 } +2024-07-26 
01:01:15,169 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1095/ 1625], loss: 1.128, per_step_time: 1472ms, lr: 1.094225e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:15,170 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.7% |████████████████████████████████████████████████ | 5.43134 samples/s/p 0:13:00 } +2024-07-26 01:01:18,121 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1097/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 1.0935163e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:18,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43382 samples/s/p 0:12:57 } +2024-07-26 01:01:21,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1099/ 1625], loss: 1.011, per_step_time: 1471ms, lr: 1.0928111e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:21,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43585 samples/s/p 0:12:54 } +2024-07-26 01:01:24,022 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1101/ 1625], loss: 1.048, per_step_time: 1471ms, lr: 1.0921093e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:24,023 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43486 samples/s/p 0:12:51 } +2024-07-26 01:01:26,971 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1103/ 1625], loss: 1.265, per_step_time: 1471ms, lr: 1.0914084e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:26,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43788 samples/s/p 0:12:47 } 
+2024-07-26 01:01:29,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1105/ 1625], loss: 1.091, per_step_time: 1471ms, lr: 1.0907135e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:29,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43773 samples/s/p 0:12:45 } +2024-07-26 01:01:32,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1107/ 1625], loss: 1.172, per_step_time: 1470ms, lr: 1.0900178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:32,869 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43944 samples/s/p 0:12:41 } +2024-07-26 01:01:35,817 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1109/ 1625], loss: 1.027, per_step_time: 1470ms, lr: 1.0893273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:35,817 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.44117 samples/s/p 0:12:38 } +2024-07-26 01:01:38,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1111/ 1625], loss: 1.075, per_step_time: 1472ms, lr: 1.0886375e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:38,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.43376 samples/s/p 0:12:36 } +2024-07-26 01:01:41,716 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1113/ 1625], loss: 1.007, per_step_time: 1470ms, lr: 1.0879496e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:41,716 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.8% |████████████████████████████████████████████████ | 5.44138 samples/s/p 
0:12:32 } +2024-07-26 01:01:44,665 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1115/ 1625], loss: 1.151, per_step_time: 1470ms, lr: 1.0872668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:44,665 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43890 samples/s/p 0:12:30 } +2024-07-26 01:01:47,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1117/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.0865875e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:47,616 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43547 samples/s/p 0:12:27 } +2024-07-26 01:01:50,568 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1119/ 1625], loss: 1.302, per_step_time: 1472ms, lr: 1.0859081e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:50,568 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43142 samples/s/p 0:12:25 } +2024-07-26 01:01:53,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1121/ 1625], loss: 1.209, per_step_time: 1470ms, lr: 1.0852315e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:53,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.44143 samples/s/p 0:12:20 } +2024-07-26 01:01:56,466 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1123/ 1625], loss: 0.982, per_step_time: 1472ms, lr: 1.084559e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:56,467 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43384 
samples/s/p 0:12:19 } +2024-07-26 01:01:59,419 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1125/ 1625], loss: 1.136, per_step_time: 1472ms, lr: 1.0838884e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:01:59,419 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43257 samples/s/p 0:12:16 } +2024-07-26 01:02:02,369 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1127/ 1625], loss: 1.225, per_step_time: 1471ms, lr: 1.0832194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:02,370 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43547 samples/s/p 0:12:12 } +2024-07-26 01:02:05,320 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1129/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.0825556e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:05,320 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 96.9% |████████████████████████████████████████████████ | 5.43552 samples/s/p 0:12:10 } +2024-07-26 01:02:08,271 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1131/ 1625], loss: 1.022, per_step_time: 1472ms, lr: 1.0818919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:08,271 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43474 samples/s/p 0:12:07 } +2024-07-26 01:02:11,222 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1133/ 1625], loss: 1.336, per_step_time: 1472ms, lr: 1.0812325e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:11,223 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ 
| 5.43408 samples/s/p 0:12:04 } +2024-07-26 01:02:14,170 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1135/ 1625], loss: 1.187, per_step_time: 1470ms, lr: 1.0805747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:14,171 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43956 samples/s/p 0:12:00 } +2024-07-26 01:02:17,119 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1137/ 1625], loss: 1.188, per_step_time: 1471ms, lr: 1.0799223e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:17,120 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43837 samples/s/p 0:11:57 } +2024-07-26 01:02:20,071 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1139/ 1625], loss: 1.157, per_step_time: 1472ms, lr: 1.0792688e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:20,071 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43351 samples/s/p 0:11:55 } +2024-07-26 01:02:23,020 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1141/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.0786198e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:23,021 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43740 samples/s/p 0:11:52 } +2024-07-26 01:02:25,972 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1143/ 1625], loss: 1.121, per_step_time: 1472ms, lr: 1.0779751e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:25,972 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% 
|████████████████████████████████████████████████ | 5.43372 samples/s/p 0:11:49 } +2024-07-26 01:02:28,920 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1145/ 1625], loss: 1.147, per_step_time: 1471ms, lr: 1.0773304e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:28,921 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.0% |████████████████████████████████████████████████ | 5.43835 samples/s/p 0:11:46 } +2024-07-26 01:02:31,870 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1147/ 1625], loss: 1.207, per_step_time: 1471ms, lr: 1.076689e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:31,871 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43670 samples/s/p 0:11:43 } +2024-07-26 01:02:34,822 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1149/ 1625], loss: 1.208, per_step_time: 1472ms, lr: 1.0760511e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:34,822 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43398 samples/s/p 0:11:40 } +2024-07-26 01:02:37,773 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1151/ 1625], loss: 1.172, per_step_time: 1472ms, lr: 1.0754143e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:37,774 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43355 samples/s/p 0:11:37 } +2024-07-26 01:02:40,721 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1153/ 1625], loss: 1.082, per_step_time: 1470ms, lr: 1.0747824e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:40,722 - mindformers[mindformers/core/callback/callback.py:326] - 
INFO - 97.1% |████████████████████████████████████████████████ | 5.43989 samples/s/p 0:11:34 } +2024-07-26 01:02:43,668 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1155/ 1625], loss: 1.252, per_step_time: 1469ms, lr: 1.0741506e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:43,668 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.44250 samples/s/p 0:11:30 } +2024-07-26 01:02:46,619 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1157/ 1625], loss: 1.315, per_step_time: 1471ms, lr: 1.0735232e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:46,619 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43528 samples/s/p 0:11:28 } +2024-07-26 01:02:49,570 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1159/ 1625], loss: 1.064, per_step_time: 1472ms, lr: 1.0728984e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:49,570 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43454 samples/s/p 0:11:25 } +2024-07-26 01:02:52,520 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1161/ 1625], loss: 0.912, per_step_time: 1471ms, lr: 1.0722744e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:52,521 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.1% |████████████████████████████████████████████████ | 5.43630 samples/s/p 0:11:22 } +2024-07-26 01:02:55,470 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1163/ 1625], loss: 0.951, per_step_time: 1471ms, lr: 1.0716547e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:55,471 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43562 samples/s/p 0:11:19 } +2024-07-26 01:02:58,425 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1165/ 1625], loss: 1.276, per_step_time: 1473ms, lr: 1.0710376e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:02:58,426 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.42823 samples/s/p 0:11:17 } +2024-07-26 01:03:01,378 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1167/ 1625], loss: 1.370, per_step_time: 1472ms, lr: 1.070424e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:01,379 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43278 samples/s/p 0:11:14 } +2024-07-26 01:03:04,328 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1169/ 1625], loss: 1.163, per_step_time: 1471ms, lr: 1.0698112e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:04,328 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43802 samples/s/p 0:11:10 } +2024-07-26 01:03:07,277 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1171/ 1625], loss: 1.173, per_step_time: 1471ms, lr: 1.0692028e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:07,277 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43710 samples/s/p 0:11:08 } +2024-07-26 01:03:10,229 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1173/ 1625], loss: 1.216, per_step_time: 1472ms, lr: 1.0685951e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 
01:03:10,229 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43274 samples/s/p 0:11:05 } +2024-07-26 01:03:13,180 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1175/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.0679919e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:13,180 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43554 samples/s/p 0:11:02 } +2024-07-26 01:03:16,130 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1177/ 1625], loss: 1.241, per_step_time: 1471ms, lr: 1.0673913e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:16,130 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.2% |████████████████████████████████████████████████ | 5.43599 samples/s/p 0:10:59 } +2024-07-26 01:03:19,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1179/ 1625], loss: 1.011, per_step_time: 1473ms, lr: 1.0667932e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:19,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43108 samples/s/p 0:10:56 } +2024-07-26 01:03:22,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1181/ 1625], loss: 1.178, per_step_time: 1471ms, lr: 1.0661968e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:22,034 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43517 samples/s/p 0:10:53 } +2024-07-26 01:03:24,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1183/ 1625], loss: 1.127, per_step_time: 1470ms, lr: 1.0656022e-06, overflow cond: False, loss_scale: 1.0 
+2024-07-26 01:03:24,982 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43971 samples/s/p 0:10:50 } +2024-07-26 01:03:27,936 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1185/ 1625], loss: 1.198, per_step_time: 1473ms, lr: 1.0650127e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:27,936 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.42895 samples/s/p 0:10:48 } +2024-07-26 01:03:30,889 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1187/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 1.0644251e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:30,889 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43171 samples/s/p 0:10:45 } +2024-07-26 01:03:33,844 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1189/ 1625], loss: 1.031, per_step_time: 1474ms, lr: 1.0638399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:33,844 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.42739 samples/s/p 0:10:42 } +2024-07-26 01:03:36,798 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1191/ 1625], loss: 0.941, per_step_time: 1473ms, lr: 1.0632566e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:36,799 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.42856 samples/s/p 0:10:39 } +2024-07-26 01:03:39,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1193/ 1625], loss: 1.236, per_step_time: 1471ms, lr: 1.0626775e-06, overflow cond: False, 
loss_scale: 1.0 +2024-07-26 01:03:39,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.3% |████████████████████████████████████████████████ | 5.43827 samples/s/p 0:10:35 } +2024-07-26 01:03:42,699 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1195/ 1625], loss: 1.221, per_step_time: 1472ms, lr: 1.0621011e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:42,699 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43305 samples/s/p 0:10:33 } +2024-07-26 01:03:45,647 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1197/ 1625], loss: 1.254, per_step_time: 1470ms, lr: 1.0615246e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:45,647 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.44067 samples/s/p 0:10:29 } +2024-07-26 01:03:48,600 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1199/ 1625], loss: 1.116, per_step_time: 1473ms, lr: 1.0609533e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:48,601 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.42971 samples/s/p 0:10:27 } +2024-07-26 01:03:51,553 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1201/ 1625], loss: 1.241, per_step_time: 1472ms, lr: 1.0603829e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:51,553 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43209 samples/s/p 0:10:24 } +2024-07-26 01:03:54,504 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1203/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 1.0598177e-06, overflow 
cond: False, loss_scale: 1.0 +2024-07-26 01:03:54,505 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43367 samples/s/p 0:10:21 } +2024-07-26 01:03:57,454 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1205/ 1625], loss: 1.266, per_step_time: 1471ms, lr: 1.0592541e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:03:57,455 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43583 samples/s/p 0:10:18 } +2024-07-26 01:04:00,406 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1207/ 1625], loss: 0.954, per_step_time: 1472ms, lr: 1.0586924e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:00,406 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43463 samples/s/p 0:10:15 } +2024-07-26 01:04:03,354 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1209/ 1625], loss: 0.949, per_step_time: 1471ms, lr: 1.0581332e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:03,355 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.4% |████████████████████████████████████████████████ | 5.43830 samples/s/p 0:10:11 } +2024-07-26 01:04:06,308 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1211/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 1.0575784e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:06,308 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.42977 samples/s/p 0:10:09 } +2024-07-26 01:04:09,259 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1213/ 1625], loss: 1.275, per_step_time: 1472ms, lr: 
1.0570244e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:09,260 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43416 samples/s/p 0:10:06 } +2024-07-26 01:04:12,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1215/ 1625], loss: 1.362, per_step_time: 1471ms, lr: 1.0564738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:12,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43709 samples/s/p 0:10:03 } +2024-07-26 01:04:15,162 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1217/ 1625], loss: 1.131, per_step_time: 1473ms, lr: 1.0559268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:15,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43026 samples/s/p 0:10:01 } +2024-07-26 01:04:18,116 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1219/ 1625], loss: 1.181, per_step_time: 1473ms, lr: 1.0553805e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:18,116 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.42970 samples/s/p 0:09:58 } +2024-07-26 01:04:21,068 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1221/ 1625], loss: 1.083, per_step_time: 1472ms, lr: 1.0548387e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:21,069 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43202 samples/s/p 0:09:54 } +2024-07-26 01:04:24,016 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1223/ 1625], loss: 1.189, per_step_time: 
1470ms, lr: 1.0542967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:24,017 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.44034 samples/s/p 0:09:51 } +2024-07-26 01:04:26,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1225/ 1625], loss: 1.046, per_step_time: 1471ms, lr: 1.0537617e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:26,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.5% |████████████████████████████████████████████████ | 5.43498 samples/s/p 0:09:48 } +2024-07-26 01:04:29,918 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1227/ 1625], loss: 1.196, per_step_time: 1471ms, lr: 1.0532268e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:29,918 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43544 samples/s/p 0:09:45 } +2024-07-26 01:04:32,868 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1229/ 1625], loss: 1.172, per_step_time: 1471ms, lr: 1.0526935e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:32,868 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43658 samples/s/p 0:09:42 } +2024-07-26 01:04:35,820 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1231/ 1625], loss: 1.192, per_step_time: 1472ms, lr: 1.0521646e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:35,820 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43277 samples/s/p 0:09:40 } +2024-07-26 01:04:38,772 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1233/ 1625], loss: 1.109, 
per_step_time: 1472ms, lr: 1.0516374e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:38,772 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43176 samples/s/p 0:09:37 } +2024-07-26 01:04:41,724 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1235/ 1625], loss: 1.146, per_step_time: 1472ms, lr: 1.0511145e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:41,724 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43296 samples/s/p 0:09:34 } +2024-07-26 01:04:44,671 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1237/ 1625], loss: 1.166, per_step_time: 1470ms, lr: 1.0505934e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:44,671 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.44214 samples/s/p 0:09:30 } +2024-07-26 01:04:47,630 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1239/ 1625], loss: 1.200, per_step_time: 1476ms, lr: 1.0500747e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:47,630 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.41984 samples/s/p 0:09:29 } +2024-07-26 01:04:50,581 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1241/ 1625], loss: 1.154, per_step_time: 1472ms, lr: 1.0495597e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:50,582 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43413 samples/s/p 0:09:25 } +2024-07-26 01:04:53,531 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1243/ 1625], 
loss: 1.115, per_step_time: 1471ms, lr: 1.0490463e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:53,531 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.6% |████████████████████████████████████████████████ | 5.43698 samples/s/p 0:09:22 } +2024-07-26 01:04:56,479 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1245/ 1625], loss: 1.024, per_step_time: 1470ms, lr: 1.0485355e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:56,479 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.44095 samples/s/p 0:09:18 } +2024-07-26 01:04:59,430 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1247/ 1625], loss: 1.284, per_step_time: 1471ms, lr: 1.0480273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:04:59,430 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43495 samples/s/p 0:09:16 } +2024-07-26 01:05:02,382 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1249/ 1625], loss: 1.104, per_step_time: 1472ms, lr: 1.0475218e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:02,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43219 samples/s/p 0:09:13 } +2024-07-26 01:05:05,334 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1251/ 1625], loss: 1.355, per_step_time: 1472ms, lr: 1.0470196e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:05,334 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43346 samples/s/p 0:09:10 } +2024-07-26 01:05:08,284 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 
1253/ 1625], loss: 1.130, per_step_time: 1471ms, lr: 1.0465192e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:08,284 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43634 samples/s/p 0:09:07 } +2024-07-26 01:05:11,240 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1255/ 1625], loss: 1.096, per_step_time: 1474ms, lr: 1.0460213e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:11,240 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.42597 samples/s/p 0:09:05 } +2024-07-26 01:05:14,187 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1257/ 1625], loss: 1.218, per_step_time: 1470ms, lr: 1.0455278e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:14,187 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.44139 samples/s/p 0:09:01 } +2024-07-26 01:05:17,137 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1259/ 1625], loss: 1.132, per_step_time: 1471ms, lr: 1.0450344e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:17,137 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.7% |████████████████████████████████████████████████ | 5.43674 samples/s/p 0:08:58 } +2024-07-26 01:05:20,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1261/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 1.044546e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:20,087 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43856 samples/s/p 0:08:55 } +2024-07-26 01:05:23,039 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 
10], step:[ 1263/ 1625], loss: 1.073, per_step_time: 1472ms, lr: 1.0440604e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:23,039 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43142 samples/s/p 0:08:53 } +2024-07-26 01:05:25,989 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1265/ 1625], loss: 0.953, per_step_time: 1471ms, lr: 1.0435755e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:25,989 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43715 samples/s/p 0:08:49 } +2024-07-26 01:05:28,937 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1267/ 1625], loss: 1.072, per_step_time: 1470ms, lr: 1.0430958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:28,938 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43973 samples/s/p 0:08:46 } +2024-07-26 01:05:31,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1269/ 1625], loss: 1.220, per_step_time: 1470ms, lr: 1.0426162e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:31,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.44032 samples/s/p 0:08:43 } +2024-07-26 01:05:34,835 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1271/ 1625], loss: 1.041, per_step_time: 1471ms, lr: 1.042139e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:34,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43669 samples/s/p 0:08:40 } +2024-07-26 01:05:37,788 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 10/ 10], step:[ 1273/ 1625], loss: 1.123, per_step_time: 1472ms, lr: 1.0416654e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:37,788 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43245 samples/s/p 0:08:38 } +2024-07-26 01:05:40,736 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1275/ 1625], loss: 0.948, per_step_time: 1470ms, lr: 1.0411961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:40,736 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.8% |████████████████████████████████████████████████ | 5.43924 samples/s/p 0:08:34 } +2024-07-26 01:05:43,683 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1277/ 1625], loss: 1.135, per_step_time: 1470ms, lr: 1.0407277e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:43,683 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.44201 samples/s/p 0:08:31 } +2024-07-26 01:05:46,636 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1279/ 1625], loss: 1.178, per_step_time: 1473ms, lr: 1.0402645e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:46,636 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43095 samples/s/p 0:08:29 } +2024-07-26 01:05:49,584 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1281/ 1625], loss: 1.083, per_step_time: 1470ms, lr: 1.0398012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:49,584 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.44042 samples/s/p 0:08:25 } +2024-07-26 01:05:52,535 - mindformers[mindformers/core/callback/callback.py:316] 
- INFO - { Epoch:[ 10/ 10], step:[ 1283/ 1625], loss: 1.330, per_step_time: 1472ms, lr: 1.0393405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:52,536 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43365 samples/s/p 0:08:23 } +2024-07-26 01:05:55,487 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1285/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 1.0388834e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:55,487 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43435 samples/s/p 0:08:20 } +2024-07-26 01:05:58,439 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1287/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.0384288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:05:58,440 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43251 samples/s/p 0:08:17 } +2024-07-26 01:06:01,391 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1289/ 1625], loss: 1.127, per_step_time: 1472ms, lr: 1.0379767e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:01,391 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43403 samples/s/p 0:08:14 } +2024-07-26 01:06:04,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1291/ 1625], loss: 1.036, per_step_time: 1472ms, lr: 1.0375273e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:04,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 97.9% |████████████████████████████████████████████████ | 5.43472 samples/s/p 0:08:11 } +2024-07-26 01:06:07,296 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1293/ 1625], loss: 1.026, per_step_time: 1473ms, lr: 1.0370796e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:07,297 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.42843 samples/s/p 0:08:09 } +2024-07-26 01:06:10,248 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1295/ 1625], loss: 1.143, per_step_time: 1472ms, lr: 1.0366372e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:10,249 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.43239 samples/s/p 0:08:05 } +2024-07-26 01:06:13,199 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1297/ 1625], loss: 1.101, per_step_time: 1471ms, lr: 1.0361964e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:13,199 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.43579 samples/s/p 0:08:02 } +2024-07-26 01:06:16,148 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1299/ 1625], loss: 1.113, per_step_time: 1471ms, lr: 1.0357581e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:16,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |████████████████████████████████████████████████ | 5.43761 samples/s/p 0:07:59 } +2024-07-26 01:06:19,098 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1301/ 1625], loss: 1.282, per_step_time: 1471ms, lr: 1.0353217e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:19,098 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.43803 samples/s/p 0:07:56 } +2024-07-26 
01:06:22,048 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1303/ 1625], loss: 1.152, per_step_time: 1471ms, lr: 1.034887e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:22,048 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.43627 samples/s/p 0:07:53 } +2024-07-26 01:06:24,996 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1305/ 1625], loss: 1.177, per_step_time: 1470ms, lr: 1.0344575e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:24,996 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.43995 samples/s/p 0:07:50 } +2024-07-26 01:06:27,948 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1307/ 1625], loss: 1.227, per_step_time: 1472ms, lr: 1.0340297e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:27,948 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.0% |█████████████████████████████████████████████████ | 5.43238 samples/s/p 0:07:48 } +2024-07-26 01:06:30,901 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1309/ 1625], loss: 1.243, per_step_time: 1473ms, lr: 1.0336053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:30,901 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43075 samples/s/p 0:07:45 } +2024-07-26 01:06:33,852 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1311/ 1625], loss: 1.137, per_step_time: 1472ms, lr: 1.0331818e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:33,853 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43429 samples/s/p 0:07:42 
} +2024-07-26 01:06:36,805 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1313/ 1625], loss: 1.215, per_step_time: 1473ms, lr: 1.0327626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:36,806 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43087 samples/s/p 0:07:39 } +2024-07-26 01:06:39,753 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1315/ 1625], loss: 1.175, per_step_time: 1470ms, lr: 1.0323444e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:39,753 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.44065 samples/s/p 0:07:35 } +2024-07-26 01:06:42,700 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1317/ 1625], loss: 1.289, per_step_time: 1469ms, lr: 1.0319303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:42,700 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.44232 samples/s/p 0:07:32 } +2024-07-26 01:06:45,651 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1319/ 1625], loss: 1.129, per_step_time: 1472ms, lr: 1.0315181e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:45,651 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43413 samples/s/p 0:07:30 } +2024-07-26 01:06:48,599 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1321/ 1625], loss: 1.169, per_step_time: 1470ms, lr: 1.0311085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:48,599 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.44103 
samples/s/p 0:07:26 } +2024-07-26 01:06:51,549 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1323/ 1625], loss: 1.139, per_step_time: 1471ms, lr: 1.0307023e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:51,550 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.1% |█████████████████████████████████████████████████ | 5.43512 samples/s/p 0:07:24 } +2024-07-26 01:06:54,501 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1325/ 1625], loss: 1.091, per_step_time: 1472ms, lr: 1.0302995e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:54,502 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43290 samples/s/p 0:07:21 } +2024-07-26 01:06:57,451 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1327/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.0298976e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:06:57,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43638 samples/s/p 0:07:18 } +2024-07-26 01:07:00,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1329/ 1625], loss: 1.112, per_step_time: 1471ms, lr: 1.0295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:00,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43780 samples/s/p 0:07:15 } +2024-07-26 01:07:03,353 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1331/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 1.0291034e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:03,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% 
|█████████████████████████████████████████████████ | 5.43183 samples/s/p 0:07:13 } +2024-07-26 01:07:06,305 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1333/ 1625], loss: 1.237, per_step_time: 1472ms, lr: 1.0287101e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:06,305 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43374 samples/s/p 0:07:09 } +2024-07-26 01:07:09,257 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1335/ 1625], loss: 1.321, per_step_time: 1472ms, lr: 1.0283194e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:09,257 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43200 samples/s/p 0:07:07 } +2024-07-26 01:07:12,209 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1337/ 1625], loss: 1.117, per_step_time: 1472ms, lr: 1.0279323e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:12,209 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43248 samples/s/p 0:07:04 } +2024-07-26 01:07:15,159 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1339/ 1625], loss: 1.034, per_step_time: 1471ms, lr: 1.0275477e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:15,159 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.2% |█████████████████████████████████████████████████ | 5.43642 samples/s/p 0:07:00 } +2024-07-26 01:07:18,114 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1341/ 1625], loss: 1.299, per_step_time: 1473ms, lr: 1.0271639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:18,114 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 98.3% |█████████████████████████████████████████████████ | 5.42772 samples/s/p 0:06:58 } +2024-07-26 01:07:21,067 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1343/ 1625], loss: 1.197, per_step_time: 1472ms, lr: 1.0267854e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:21,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.43191 samples/s/p 0:06:55 } +2024-07-26 01:07:24,018 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1345/ 1625], loss: 1.215, per_step_time: 1472ms, lr: 1.0264085e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:24,019 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.43310 samples/s/p 0:06:52 } +2024-07-26 01:07:26,967 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1347/ 1625], loss: 1.188, per_step_time: 1470ms, lr: 1.0260335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:26,967 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.43968 samples/s/p 0:06:48 } +2024-07-26 01:07:29,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1349/ 1625], loss: 1.021, per_step_time: 1473ms, lr: 1.0256618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:29,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.42861 samples/s/p 0:06:46 } +2024-07-26 01:07:32,874 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1351/ 1625], loss: 1.010, per_step_time: 1472ms, lr: 1.025291e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:32,874 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.43228 samples/s/p 0:06:43 } +2024-07-26 01:07:35,839 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1353/ 1625], loss: 1.098, per_step_time: 1479ms, lr: 1.0249263e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:35,840 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.40805 samples/s/p 0:06:42 } +2024-07-26 01:07:38,794 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1355/ 1625], loss: 1.032, per_step_time: 1474ms, lr: 1.0245616e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:38,795 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.3% |█████████████████████████████████████████████████ | 5.42716 samples/s/p 0:06:37 } +2024-07-26 01:07:41,747 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1357/ 1625], loss: 1.247, per_step_time: 1472ms, lr: 1.0242012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:41,747 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43194 samples/s/p 0:06:34 } +2024-07-26 01:07:44,698 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1359/ 1625], loss: 1.145, per_step_time: 1472ms, lr: 1.0238425e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:44,698 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43425 samples/s/p 0:06:31 } +2024-07-26 01:07:47,646 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1361/ 1625], loss: 1.184, per_step_time: 1470ms, lr: 1.0234857e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 
01:07:47,646 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43993 samples/s/p 0:06:28 } +2024-07-26 01:07:50,598 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1363/ 1625], loss: 1.204, per_step_time: 1472ms, lr: 1.023133e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:50,598 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43383 samples/s/p 0:06:25 } +2024-07-26 01:07:53,548 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1365/ 1625], loss: 1.208, per_step_time: 1471ms, lr: 1.022783e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:53,548 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43664 samples/s/p 0:06:22 } +2024-07-26 01:07:56,500 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1367/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 1.0224346e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:56,501 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43208 samples/s/p 0:06:19 } +2024-07-26 01:07:59,452 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1369/ 1625], loss: 1.112, per_step_time: 1472ms, lr: 1.0220889e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:07:59,452 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43423 samples/s/p 0:06:16 } +2024-07-26 01:08:02,401 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1371/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.0217484e-06, overflow cond: False, loss_scale: 
1.0 +2024-07-26 01:08:02,401 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43841 samples/s/p 0:06:13 } +2024-07-26 01:08:05,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1373/ 1625], loss: 1.199, per_step_time: 1472ms, lr: 1.0214079e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:05,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.4% |█████████████████████████████████████████████████ | 5.43319 samples/s/p 0:06:11 } +2024-07-26 01:08:08,299 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1375/ 1625], loss: 1.065, per_step_time: 1469ms, lr: 1.0210725e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:08,299 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.44282 samples/s/p 0:06:07 } +2024-07-26 01:08:11,246 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1377/ 1625], loss: 0.925, per_step_time: 1470ms, lr: 1.0207364e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:11,247 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.44094 samples/s/p 0:06:04 } +2024-07-26 01:08:14,198 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1379/ 1625], loss: 1.088, per_step_time: 1472ms, lr: 1.0204053e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:14,198 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.43431 samples/s/p 0:06:02 } +2024-07-26 01:08:17,152 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1381/ 1625], loss: 1.201, per_step_time: 1473ms, lr: 1.0200761e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 01:08:17,152 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.42909 samples/s/p 0:05:59 } +2024-07-26 01:08:20,107 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1383/ 1625], loss: 1.464, per_step_time: 1473ms, lr: 1.0197493e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:20,107 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.42762 samples/s/p 0:05:56 } +2024-07-26 01:08:23,056 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1385/ 1625], loss: 1.312, per_step_time: 1471ms, lr: 1.0194253e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:23,056 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.43796 samples/s/p 0:05:53 } +2024-07-26 01:08:26,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1387/ 1625], loss: 1.335, per_step_time: 1473ms, lr: 1.0191037e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:26,010 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.43054 samples/s/p 0:05:50 } +2024-07-26 01:08:28,963 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1389/ 1625], loss: 1.240, per_step_time: 1473ms, lr: 1.0187874e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:28,963 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.5% |█████████████████████████████████████████████████ | 5.42963 samples/s/p 0:05:47 } +2024-07-26 01:08:31,910 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1391/ 1625], loss: 1.022, per_step_time: 1470ms, lr: 1.0184702e-06, 
overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:31,910 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.44194 samples/s/p 0:05:43 } +2024-07-26 01:08:34,864 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1393/ 1625], loss: 1.272, per_step_time: 1473ms, lr: 1.0181583e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:34,864 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.42951 samples/s/p 0:05:41 } +2024-07-26 01:08:37,811 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1395/ 1625], loss: 1.095, per_step_time: 1470ms, lr: 1.017848e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:37,812 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.44071 samples/s/p 0:05:38 } +2024-07-26 01:08:40,761 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1397/ 1625], loss: 1.221, per_step_time: 1471ms, lr: 1.0175395e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:40,762 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43602 samples/s/p 0:05:35 } +2024-07-26 01:08:43,712 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1399/ 1625], loss: 1.107, per_step_time: 1471ms, lr: 1.0172334e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:43,712 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43564 samples/s/p 0:05:32 } +2024-07-26 01:08:46,664 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1401/ 1625], loss: 1.220, per_step_time: 1472ms, lr: 
1.0169335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:46,664 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43305 samples/s/p 0:05:29 } +2024-07-26 01:08:49,615 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1403/ 1625], loss: 1.159, per_step_time: 1472ms, lr: 1.0166336e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:49,615 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43447 samples/s/p 0:05:26 } +2024-07-26 01:08:52,565 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1405/ 1625], loss: 1.306, per_step_time: 1471ms, lr: 1.0163363e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:52,566 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.6% |█████████████████████████████████████████████████ | 5.43491 samples/s/p 0:05:23 } +2024-07-26 01:08:55,515 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1407/ 1625], loss: 1.050, per_step_time: 1471ms, lr: 1.0160417e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:55,515 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43780 samples/s/p 0:05:20 } +2024-07-26 01:08:58,464 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1409/ 1625], loss: 1.114, per_step_time: 1470ms, lr: 1.0157504e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:08:58,464 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43874 samples/s/p 0:05:17 } +2024-07-26 01:09:01,414 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1411/ 1625], loss: 1.178, 
per_step_time: 1471ms, lr: 1.0154608e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:01,415 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43481 samples/s/p 0:05:15 } +2024-07-26 01:09:04,367 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1413/ 1625], loss: 1.119, per_step_time: 1472ms, lr: 1.0151748e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:04,367 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43205 samples/s/p 0:05:12 } +2024-07-26 01:09:07,318 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1415/ 1625], loss: 1.159, per_step_time: 1471ms, lr: 1.0148922e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:07,318 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43494 samples/s/p 0:05:09 } +2024-07-26 01:09:10,274 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1417/ 1625], loss: 1.266, per_step_time: 1474ms, lr: 1.0146105e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:10,274 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.42521 samples/s/p 0:05:06 } +2024-07-26 01:09:13,225 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1419/ 1625], loss: 1.294, per_step_time: 1472ms, lr: 1.0143322e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:13,225 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.43466 samples/s/p 0:05:03 } +2024-07-26 01:09:16,172 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1421/ 
1625], loss: 1.016, per_step_time: 1470ms, lr: 1.0140565e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:16,173 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.7% |█████████████████████████████████████████████████ | 5.44081 samples/s/p 0:04:59 } +2024-07-26 01:09:19,120 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1423/ 1625], loss: 1.138, per_step_time: 1470ms, lr: 1.0137842e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:19,121 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.44043 samples/s/p 0:04:57 } +2024-07-26 01:09:22,066 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1425/ 1625], loss: 1.024, per_step_time: 1469ms, lr: 1.0135137e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:22,067 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.44382 samples/s/p 0:04:53 } +2024-07-26 01:09:25,017 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1427/ 1625], loss: 1.074, per_step_time: 1472ms, lr: 1.0132458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:25,018 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43417 samples/s/p 0:04:51 } +2024-07-26 01:09:27,968 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1429/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 1.0129821e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:27,968 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43603 samples/s/p 0:04:48 } +2024-07-26 01:09:30,921 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 
10], step:[ 1431/ 1625], loss: 1.166, per_step_time: 1472ms, lr: 1.0127186e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:30,922 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43124 samples/s/p 0:04:45 } +2024-07-26 01:09:33,869 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1433/ 1625], loss: 1.240, per_step_time: 1470ms, lr: 1.0124593e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:33,870 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.44034 samples/s/p 0:04:42 } +2024-07-26 01:09:36,818 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1435/ 1625], loss: 1.151, per_step_time: 1471ms, lr: 1.0122026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:36,819 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43782 samples/s/p 0:04:39 } +2024-07-26 01:09:39,768 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1437/ 1625], loss: 1.025, per_step_time: 1471ms, lr: 1.0119476e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:39,769 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.8% |█████████████████████████████████████████████████ | 5.43723 samples/s/p 0:04:36 } +2024-07-26 01:09:42,722 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1439/ 1625], loss: 1.149, per_step_time: 1473ms, lr: 1.0116961e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:42,723 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.42951 samples/s/p 0:04:34 } +2024-07-26 01:09:45,672 - mindformers[mindformers/core/callback/callback.py:316] - INFO 
- { Epoch:[ 10/ 10], step:[ 1441/ 1625], loss: 1.391, per_step_time: 1471ms, lr: 1.0114472e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:45,672 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43746 samples/s/p 0:04:30 } +2024-07-26 01:09:48,622 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1443/ 1625], loss: 1.154, per_step_time: 1471ms, lr: 1.0112018e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:48,623 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43535 samples/s/p 0:04:27 } +2024-07-26 01:09:51,574 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1445/ 1625], loss: 1.161, per_step_time: 1472ms, lr: 1.010958e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:51,574 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43416 samples/s/p 0:04:24 } +2024-07-26 01:09:54,524 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1447/ 1625], loss: 1.100, per_step_time: 1471ms, lr: 1.0107178e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:54,525 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43571 samples/s/p 0:04:21 } +2024-07-26 01:09:57,476 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1449/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 1.0104792e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:09:57,477 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43281 samples/s/p 0:04:19 } +2024-07-26 01:10:00,429 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1451/ 1625], loss: 1.181, per_step_time: 1472ms, lr: 1.0102442e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:00,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43119 samples/s/p 0:04:16 } +2024-07-26 01:10:03,379 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1453/ 1625], loss: 1.189, per_step_time: 1471ms, lr: 1.0100108e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:03,380 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 98.9% |█████████████████████████████████████████████████ | 5.43617 samples/s/p 0:04:13 } +2024-07-26 01:10:06,329 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1455/ 1625], loss: 0.990, per_step_time: 1470ms, lr: 1.0097809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:06,329 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43851 samples/s/p 0:04:10 } +2024-07-26 01:10:09,280 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1457/ 1625], loss: 1.051, per_step_time: 1472ms, lr: 1.0095536e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:09,280 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43445 samples/s/p 0:04:07 } +2024-07-26 01:10:12,232 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1459/ 1625], loss: 1.238, per_step_time: 1472ms, lr: 1.0093289e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:12,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43208 samples/s/p 0:04:04 } +2024-07-26 
01:10:15,181 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1461/ 1625], loss: 1.190, per_step_time: 1470ms, lr: 1.0091077e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:15,181 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43865 samples/s/p 0:04:01 } +2024-07-26 01:10:18,132 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1463/ 1625], loss: 1.223, per_step_time: 1472ms, lr: 1.0088872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:18,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43379 samples/s/p 0:03:58 } +2024-07-26 01:10:21,083 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1465/ 1625], loss: 1.134, per_step_time: 1471ms, lr: 1.008672e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:21,083 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43623 samples/s/p 0:03:55 } +2024-07-26 01:10:24,035 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1467/ 1625], loss: 1.102, per_step_time: 1472ms, lr: 1.008456e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:24,035 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.43393 samples/s/p 0:03:52 } +2024-07-26 01:10:26,981 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1469/ 1625], loss: 1.197, per_step_time: 1469ms, lr: 1.0082451e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:26,981 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.0% |█████████████████████████████████████████████████ | 5.44422 samples/s/p 0:03:49 
} +2024-07-26 01:10:29,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1471/ 1625], loss: 1.270, per_step_time: 1472ms, lr: 1.0080369e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:29,933 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43219 samples/s/p 0:03:46 } +2024-07-26 01:10:32,884 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1473/ 1625], loss: 1.281, per_step_time: 1471ms, lr: 1.0078303e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:32,884 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43481 samples/s/p 0:03:43 } +2024-07-26 01:10:35,832 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1475/ 1625], loss: 1.106, per_step_time: 1470ms, lr: 1.007628e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:35,832 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.44013 samples/s/p 0:03:40 } +2024-07-26 01:10:38,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1477/ 1625], loss: 1.105, per_step_time: 1471ms, lr: 1.0074266e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:38,782 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43775 samples/s/p 0:03:37 } +2024-07-26 01:10:41,734 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1479/ 1625], loss: 1.086, per_step_time: 1472ms, lr: 1.0072288e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:41,734 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43149 
samples/s/p 0:03:35 } +2024-07-26 01:10:44,687 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1481/ 1625], loss: 1.242, per_step_time: 1472ms, lr: 1.0070335e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:44,687 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43115 samples/s/p 0:03:32 } +2024-07-26 01:10:47,640 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1483/ 1625], loss: 1.175, per_step_time: 1473ms, lr: 1.0068399e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:47,640 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43012 samples/s/p 0:03:29 } +2024-07-26 01:10:50,592 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1485/ 1625], loss: 1.272, per_step_time: 1472ms, lr: 1.0066514e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:50,592 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.1% |█████████████████████████████████████████████████ | 5.43303 samples/s/p 0:03:26 } +2024-07-26 01:10:53,544 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1487/ 1625], loss: 1.246, per_step_time: 1472ms, lr: 1.0064639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:53,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43141 samples/s/p 0:03:23 } +2024-07-26 01:10:56,493 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1489/ 1625], loss: 1.146, per_step_time: 1470ms, lr: 1.0062789e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:56,493 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% 
|█████████████████████████████████████████████████ | 5.43980 samples/s/p 0:03:20 } +2024-07-26 01:10:59,442 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1491/ 1625], loss: 1.237, per_step_time: 1471ms, lr: 1.0060966e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:10:59,442 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43757 samples/s/p 0:03:17 } +2024-07-26 01:11:02,389 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1493/ 1625], loss: 1.116, per_step_time: 1470ms, lr: 1.0059176e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:02,390 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.44172 samples/s/p 0:03:14 } +2024-07-26 01:11:05,342 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1495/ 1625], loss: 1.282, per_step_time: 1472ms, lr: 1.0057405e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:05,342 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43146 samples/s/p 0:03:11 } +2024-07-26 01:11:08,293 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1497/ 1625], loss: 1.090, per_step_time: 1471ms, lr: 1.0055668e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:08,293 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43508 samples/s/p 0:03:08 } +2024-07-26 01:11:11,244 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1499/ 1625], loss: 1.235, per_step_time: 1472ms, lr: 1.0053948e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:11,244 - mindformers[mindformers/core/callback/callback.py:326] 
- INFO - 99.2% |█████████████████████████████████████████████████ | 5.43391 samples/s/p 0:03:05 } +2024-07-26 01:11:14,192 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1501/ 1625], loss: 1.007, per_step_time: 1470ms, lr: 1.0052271e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:14,193 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.43934 samples/s/p 0:03:02 } +2024-07-26 01:11:17,149 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1503/ 1625], loss: 1.278, per_step_time: 1474ms, lr: 1.0050603e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:17,149 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.2% |█████████████████████████████████████████████████ | 5.42485 samples/s/p 0:02:59 } +2024-07-26 01:11:20,104 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1505/ 1625], loss: 1.297, per_step_time: 1473ms, lr: 1.0048986e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:20,104 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.42750 samples/s/p 0:02:56 } +2024-07-26 01:11:23,055 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1507/ 1625], loss: 1.339, per_step_time: 1472ms, lr: 1.0047371e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:23,055 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43413 samples/s/p 0:02:53 } +2024-07-26 01:11:26,009 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1509/ 1625], loss: 1.105, per_step_time: 1473ms, lr: 1.0045788e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:26,009 - 
mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.42909 samples/s/p 0:02:50 } +2024-07-26 01:11:28,960 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1511/ 1625], loss: 1.417, per_step_time: 1472ms, lr: 1.0044242e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:28,960 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43478 samples/s/p 0:02:47 } +2024-07-26 01:11:31,907 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1513/ 1625], loss: 1.030, per_step_time: 1470ms, lr: 1.0042712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:31,908 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.44063 samples/s/p 0:02:44 } +2024-07-26 01:11:34,857 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1515/ 1625], loss: 1.305, per_step_time: 1471ms, lr: 1.00412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:34,858 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43652 samples/s/p 0:02:41 } +2024-07-26 01:11:37,806 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1517/ 1625], loss: 1.066, per_step_time: 1471ms, lr: 1.0039756e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:37,807 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43845 samples/s/p 0:02:38 } +2024-07-26 01:11:40,756 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1519/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.0038295e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 
01:11:40,756 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.3% |█████████████████████████████████████████████████ | 5.43713 samples/s/p 0:02:35 } +2024-07-26 01:11:43,705 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1521/ 1625], loss: 1.154, per_step_time: 1470ms, lr: 1.0036896e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:43,706 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43927 samples/s/p 0:02:32 } +2024-07-26 01:11:46,653 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1523/ 1625], loss: 1.315, per_step_time: 1470ms, lr: 1.0035478e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:46,654 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43983 samples/s/p 0:02:30 } +2024-07-26 01:11:49,605 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1525/ 1625], loss: 1.016, per_step_time: 1472ms, lr: 1.0034121e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:49,605 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43414 samples/s/p 0:02:27 } +2024-07-26 01:11:52,556 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1527/ 1625], loss: 1.141, per_step_time: 1472ms, lr: 1.0032782e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:52,557 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43309 samples/s/p 0:02:24 } +2024-07-26 01:11:55,507 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1529/ 1625], loss: 1.080, per_step_time: 1471ms, lr: 1.0031486e-06, overflow cond: False, loss_scale: 
1.0 +2024-07-26 01:11:55,507 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43582 samples/s/p 0:02:21 } +2024-07-26 01:11:58,457 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1531/ 1625], loss: 1.129, per_step_time: 1471ms, lr: 1.0030188e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:11:58,457 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43589 samples/s/p 0:02:18 } +2024-07-26 01:12:01,407 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1533/ 1625], loss: 1.049, per_step_time: 1471ms, lr: 1.0028936e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:01,408 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.43557 samples/s/p 0:02:15 } +2024-07-26 01:12:04,364 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1535/ 1625], loss: 1.300, per_step_time: 1473ms, lr: 1.0027709e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:04,365 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.4% |█████████████████████████████████████████████████ | 5.42908 samples/s/p 0:02:12 } +2024-07-26 01:12:07,316 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1537/ 1625], loss: 1.136, per_step_time: 1471ms, lr: 1.0026498e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:07,317 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43785 samples/s/p 0:02:09 } +2024-07-26 01:12:10,266 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1539/ 1625], loss: 1.204, per_step_time: 1471ms, lr: 1.0025315e-06, overflow cond: 
False, loss_scale: 1.0 +2024-07-26 01:12:10,267 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43703 samples/s/p 0:02:06 } +2024-07-26 01:12:13,215 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1541/ 1625], loss: 1.162, per_step_time: 1470ms, lr: 1.0024182e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:13,216 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43911 samples/s/p 0:02:03 } +2024-07-26 01:12:16,173 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1543/ 1625], loss: 1.210, per_step_time: 1475ms, lr: 1.0023033e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:16,174 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.42179 samples/s/p 0:02:00 } +2024-07-26 01:12:19,124 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1545/ 1625], loss: 1.089, per_step_time: 1472ms, lr: 1.0021944e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:19,125 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43462 samples/s/p 0:01:57 } +2024-07-26 01:12:22,076 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1547/ 1625], loss: 1.061, per_step_time: 1472ms, lr: 1.0020872e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:22,077 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43210 samples/s/p 0:01:54 } +2024-07-26 01:12:25,028 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1549/ 1625], loss: 1.196, per_step_time: 1472ms, lr: 1.0019844e-06, 
overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:25,028 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43460 samples/s/p 0:01:51 } +2024-07-26 01:12:27,979 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1551/ 1625], loss: 1.120, per_step_time: 1472ms, lr: 1.0018815e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:27,979 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.5% |█████████████████████████████████████████████████ | 5.43423 samples/s/p 0:01:48 } +2024-07-26 01:12:30,927 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1553/ 1625], loss: 1.234, per_step_time: 1470ms, lr: 1.0017839e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:30,928 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43935 samples/s/p 0:01:45 } +2024-07-26 01:12:33,876 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1555/ 1625], loss: 1.012, per_step_time: 1470ms, lr: 1.0016853e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:33,876 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43926 samples/s/p 0:01:42 } +2024-07-26 01:12:36,828 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1557/ 1625], loss: 1.131, per_step_time: 1472ms, lr: 1.0015929e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:36,828 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43326 samples/s/p 0:01:40 } +2024-07-26 01:12:39,781 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1559/ 1625], loss: 1.304, per_step_time: 1473ms, lr: 
1.0015021e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:39,781 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43013 samples/s/p 0:01:37 } +2024-07-26 01:12:42,728 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1561/ 1625], loss: 1.253, per_step_time: 1469ms, lr: 1.0014131e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:42,728 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.44251 samples/s/p 0:01:34 } +2024-07-26 01:12:45,679 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1563/ 1625], loss: 1.060, per_step_time: 1472ms, lr: 1.0013284e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:45,679 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43460 samples/s/p 0:01:31 } +2024-07-26 01:12:48,629 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1565/ 1625], loss: 1.098, per_step_time: 1471ms, lr: 1.0012462e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:48,629 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43697 samples/s/p 0:01:28 } +2024-07-26 01:12:51,579 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1567/ 1625], loss: 1.051, per_step_time: 1471ms, lr: 1.0011634e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:51,579 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.6% |█████████████████████████████████████████████████ | 5.43638 samples/s/p 0:01:25 } +2024-07-26 01:12:54,530 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1569/ 1625], loss: 1.271, 
per_step_time: 1472ms, lr: 1.0010881e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:54,530 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43464 samples/s/p 0:01:22 } +2024-07-26 01:12:57,480 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1571/ 1625], loss: 1.089, per_step_time: 1471ms, lr: 1.001012e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:12:57,480 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43567 samples/s/p 0:01:19 } +2024-07-26 01:13:00,428 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1573/ 1625], loss: 1.181, per_step_time: 1470ms, lr: 1.0009412e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:00,429 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43924 samples/s/p 0:01:16 } +2024-07-26 01:13:03,381 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1575/ 1625], loss: 1.268, per_step_time: 1472ms, lr: 1.0008712e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:03,382 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43146 samples/s/p 0:01:13 } +2024-07-26 01:13:06,331 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1577/ 1625], loss: 1.220, per_step_time: 1471ms, lr: 1.0008029e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:06,331 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43771 samples/s/p 0:01:10 } +2024-07-26 01:13:09,282 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1579/ 
1625], loss: 1.054, per_step_time: 1472ms, lr: 1.000738e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:09,282 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43380 samples/s/p 0:01:07 } +2024-07-26 01:13:12,233 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1581/ 1625], loss: 1.135, per_step_time: 1471ms, lr: 1.0006768e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:12,233 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43499 samples/s/p 0:01:04 } +2024-07-26 01:13:15,184 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1583/ 1625], loss: 1.209, per_step_time: 1472ms, lr: 1.000618e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:15,185 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.7% |█████████████████████████████████████████████████ | 5.43299 samples/s/p 0:01:01 } +2024-07-26 01:13:18,133 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1585/ 1625], loss: 1.182, per_step_time: 1470ms, lr: 1.0005626e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:18,133 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43988 samples/s/p 0:00:58 } +2024-07-26 01:13:21,086 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1587/ 1625], loss: 1.129, per_step_time: 1473ms, lr: 1.0005091e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:21,086 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43070 samples/s/p 0:00:55 } +2024-07-26 01:13:24,033 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], 
step:[ 1589/ 1625], loss: 1.180, per_step_time: 1470ms, lr: 1.000458e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:24,033 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.44179 samples/s/p 0:00:52 } +2024-07-26 01:13:26,983 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1591/ 1625], loss: 1.177, per_step_time: 1471ms, lr: 1.0004088e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:26,983 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43528 samples/s/p 0:00:50 } +2024-07-26 01:13:29,933 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1593/ 1625], loss: 1.053, per_step_time: 1471ms, lr: 1.0003639e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:29,934 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43593 samples/s/p 0:00:47 } +2024-07-26 01:13:32,885 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1595/ 1625], loss: 1.081, per_step_time: 1472ms, lr: 1.0003206e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:32,886 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43280 samples/s/p 0:00:44 } +2024-07-26 01:13:35,836 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1597/ 1625], loss: 1.085, per_step_time: 1471ms, lr: 1.0002809e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:35,836 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43484 samples/s/p 0:00:41 } +2024-07-26 01:13:38,786 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { 
Epoch:[ 10/ 10], step:[ 1599/ 1625], loss: 1.093, per_step_time: 1471ms, lr: 1.0002437e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:38,787 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.8% |█████████████████████████████████████████████████ | 5.43583 samples/s/p 0:00:38 } +2024-07-26 01:13:41,740 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1601/ 1625], loss: 1.187, per_step_time: 1473ms, lr: 1.0002083e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:41,741 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.42860 samples/s/p 0:00:35 } +2024-07-26 01:13:44,690 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1603/ 1625], loss: 1.037, per_step_time: 1471ms, lr: 1.0001771e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:44,691 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43658 samples/s/p 0:00:32 } +2024-07-26 01:13:47,641 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1605/ 1625], loss: 1.054, per_step_time: 1471ms, lr: 1.0001469e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:47,641 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43610 samples/s/p 0:00:29 } +2024-07-26 01:13:50,594 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1607/ 1625], loss: 1.071, per_step_time: 1473ms, lr: 1.0001202e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:50,594 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43068 samples/s/p 0:00:26 } +2024-07-26 01:13:53,545 - 
mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1609/ 1625], loss: 1.134, per_step_time: 1472ms, lr: 1.0000967e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:53,545 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43473 samples/s/p 0:00:23 } +2024-07-26 01:13:56,495 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1611/ 1625], loss: 1.194, per_step_time: 1471ms, lr: 1.0000743e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:56,496 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43518 samples/s/p 0:00:20 } +2024-07-26 01:13:59,447 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1613/ 1625], loss: 1.232, per_step_time: 1472ms, lr: 1.0000579e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:13:59,447 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.43380 samples/s/p 0:00:17 } +2024-07-26 01:14:02,402 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1615/ 1625], loss: 1.140, per_step_time: 1474ms, lr: 1.0000398e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:02,402 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 99.9% |█████████████████████████████████████████████████ | 5.42730 samples/s/p 0:00:14 } +2024-07-26 01:14:05,352 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1617/ 1625], loss: 0.922, per_step_time: 1471ms, lr: 1.0000276e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:05,353 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.43574 samples/s/p 0:00:11 } 
+2024-07-26 01:14:08,304 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1619/ 1625], loss: 1.218, per_step_time: 1472ms, lr: 1.0000164e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:08,304 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.43327 samples/s/p 0:00:08 } +2024-07-26 01:14:11,258 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1621/ 1625], loss: 1.082, per_step_time: 1473ms, lr: 1.0000086e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:11,258 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.42921 samples/s/p 0:00:05 } +2024-07-26 01:14:14,210 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1623/ 1625], loss: 1.171, per_step_time: 1472ms, lr: 1.0000026e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:14,210 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |█████████████████████████████████████████████████ | 5.43232 samples/s/p 0:00:02 } +2024-07-26 01:14:17,163 - mindformers[mindformers/core/callback/callback.py:316] - INFO - { Epoch:[ 10/ 10], step:[ 1625/ 1625], loss: 1.078, per_step_time: 1473ms, lr: 1.0000009e-06, overflow cond: False, loss_scale: 1.0 +2024-07-26 01:14:17,163 - mindformers[mindformers/core/callback/callback.py:326] - INFO - 100.0% |██████████████████████████████████████████████████| 5.43097 samples/s/p 0:00:00 } +2024-07-26 01:14:17,208 - mindformers[mindformers/core/callback/callback.py:562] - INFO - ......Saving ckpt...... +2024-07-26 01:14:49,454 - mindformers[mindformers/trainer/base_trainer.py:779] - INFO - .........Training Over!............. 
diff --git "a/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204.docx" "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204.docx" new file mode 100644 index 00000000..92b23d55 Binary files /dev/null and "b/2024-ascend-innovation-contest/topic2-finetune/first-phase/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204/\346\257\224\345\245\207\345\240\241\345\206\262\346\265\252\345\260\217\347\273\204.docx" differ